# Licensed under a 3-clause BSD style license - see LICENSE.rst
"""Source catalog and object base classes."""
from __future__ import absolute_import, division, print_function, unicode_literals
from collections import OrderedDict
import copy
import numpy as np
from astropy.utils import lazyproperty
from ..extern import six
from ..utils.array import _is_int
from ..utils.table import table_row_to_dict
from .utils import skycoord_from_table
__all__ = ["SourceCatalog", "SourceCatalogObject"]
[docs]class SourceCatalogObject(object):
"""Source catalog object.
This class can be used directly, but it's mostly used as a
base class for the other source catalog classes.
The catalog data on this source is stored in the `source.data`
attribute as on OrderedDict.
The source catalog object is decoupled from the source catalog,
it doesn't hold a reference back to it.
The catalog table row index is stored in `_table_row_index` though,
because it can be useful for debugging or display.
"""
_source_name_key = "Source_Name"
_source_index_key = "catalog_row_index"
def __init__(self, data, data_extended=None):
self.data = data
if data_extended:
self.data_extended = data_extended
@property
def name(self):
"""Source name (str)"""
name = self.data[self._source_name_key]
return name.strip()
@property
def index(self):
"""Row index of source in catalog (int)"""
return self.data[self._source_index_key]
@property
def _data_python_dict(self):
"""Convert ``data`` into a Python dict that only contains
Python data types, i.e. is readily JSON or YAML serialisable.
Quantity unit information is stripped.
This is mainly used at the moment to pass the data to
the gamma-sky.net webpage.
"""
out = OrderedDict()
for key, value in self.data.items():
if isinstance(value, int):
out_val = value
else:
# This works because almost all values in ``data``
# are Numpy objects, and ``tolist`` works for Numpy
# arrays and scalars.
out_val = np.asarray(value).tolist()
out[key] = out_val
return out
@property
def position(self):
"""Source position (`~astropy.coordinates.SkyCoord`)."""
return skycoord_from_table(self.data)
[docs]class SourceCatalog(object):
"""Generic source catalog.
This class can be used directly, but it's mostly used as a
base class for the other source catalog classes.
This is a thin wrapper around `~astropy.table.Table`,
which is stored in the ``catalog.table`` attribute.
Parameters
----------
table : `~astropy.table.Table`
Table with catalog data.
source_name_key : str
Column with source name information
source_name_alias : tuple of str
Columns with source name aliases. This will allow accessing the source
row by alias names as well.
"""
source_object_class = SourceCatalogObject
# TODO: at the moment these are duplicated in SourceCatalogObject.
# Should we share them somehow?
_source_index_key = "catalog_row_index"
def __init__(self, table, source_name_key="Source_Name", source_name_alias=()):
self.table = table
self._source_name_key = source_name_key
self._source_name_alias = source_name_alias
def __str__(self):
s = self.description
s += " with {} objects.".format(len(self.table))
return s
@lazyproperty
def _name_to_index_cache(self):
# Make a dict for quick lookup: source name -> row index
names = dict()
for idx, row in enumerate(self.table):
name = row[self._source_name_key]
names[name.strip()] = idx
for alias_column in self._source_name_alias:
for alias in row[alias_column].split(","):
if not alias == "":
names[alias.strip()] = idx
return names
[docs] def row_index(self, name):
"""Look up row index of source by name.
Parameters
----------
name : str
Source name
Returns
-------
index : int
Row index of source in table
"""
index = self._name_to_index_cache[name]
row = self.table[index]
# check if name lookup is correct other wise recompute _name_to_index_cache
possible_names = [row[self._source_name_key]]
for alias_column in self._source_name_alias:
possible_names += row[alias_column].split(",")
if name not in possible_names:
self.__dict__.pop("_name_to_index_cache")
index = self._name_to_index_cache[name]
return index
[docs] def source_name(self, index):
"""Look up source name by row index.
Parameters
----------
index : int
Row index of source in table
"""
source_name_col = self.table[self._source_name_key]
name = source_name_col[index]
return name.strip()
def __getitem__(self, key):
"""Get source by name.
Parameters
----------
key : str or int
Source name or row index
Returns
-------
source : `SourceCatalogObject`
An object representing one source.
Notes
-----
At the moment this can raise KeyError, IndexError and ValueError
for invalid keys. Should we always raise KeyError to simplify this?
"""
if isinstance(key, six.string_types):
index = self.row_index(key)
elif _is_int(key):
index = key
else:
msg = "Key must be source name string or row index integer. "
msg += "Type not understood: {}".format(type(key))
raise ValueError(msg)
return self._make_source_object(index)
def _make_source_object(self, index):
"""Make one source object.
Parameters
----------
index : int
Row index
Returns
-------
source : `SourceCatalogObject`
Source object
"""
data = table_row_to_dict(self.table[index])
data[self._source_index_key] = index
try:
name_extended = data["Extended_Source_Name"].strip()
idx = self._lookup_extended_source_idx[name_extended]
data_extended = table_row_to_dict(self.extended_sources_table[idx])
except KeyError:
data_extended = None
source = self.source_object_class(data, data_extended)
return source
@lazyproperty
def _lookup_extended_source_idx(self):
names = [_.strip() for _ in self.extended_sources_table["Source_Name"]]
idx = range(len(names))
return dict(zip(names, idx))
@property
def _data_python_list(self):
"""Convert catalog into a Python list that only contains
Python data types, i.e. is readily JSON or YAML serialisable.
Quantity unit information is stripped.
This is mainly used at the moment to pass the data to
the gamma-sky.net webpage.
"""
return [source._data_python_dict for source in self]
@property
def positions(self):
"""Source positions (`~astropy.coordinates.SkyCoord`)."""
return skycoord_from_table(self.table)
[docs] def copy(self):
"""Copy catalog"""
return copy.deepcopy(self)