Source code for treecorr.field

# Copyright (c) 2003-2024 by Mike Jarvis
#
# TreeCorr is free software: redistribution and use in source and binary forms,
# with or without modification, are permitted provided that the following
# conditions are met:
#
# 1. Redistributions of source code must retain the above copyright notice, this
#    list of conditions, and the disclaimer given in the accompanying LICENSE
#    file.
# 2. Redistributions in binary form must reproduce the above copyright notice,
#    this list of conditions, and the disclaimer given in the documentation
#    and/or other materials provided with the distribution.

"""
.. module:: field
"""

import numpy as np
import weakref

from . import _treecorr
from .util import get_omp_threads, parse_xyzsep, coord_enum

def _parse_split_method(split_method):
    if split_method == 'middle': return _treecorr.Middle
    elif split_method == 'median': return _treecorr.Median
    elif split_method == 'mean': return _treecorr.Mean
    else: return _treecorr.Random  # random


[docs]class Field(object): r"""A Field in TreeCorr is the object that stores the tree structure we use for efficient calculation of the correlation functions. The root "cell" in the tree has information about the whole field, including the total number of points, the total weight, the mean position, the size (by which we mean the maximum distance of any point from the mean position), and possibly more information depending on which kind of field we have. It also points to two sub-cells which each describe about half the points. These are commonly referred to as "daughter cells". They in turn point to two more cells each, and so on until we get to cells that are considered "small enough" according to the ``min_size`` parameter given in the constructor. These lowest level cells are referred to as "leaves". Technically, a Field doesn't have just one of these trees. To make parallel computation more efficient, we actually skip the first few layers of the tree as described above and store a list of root cells. The three parameters that determine how many of these there will be are ``max_size``, ``min_top``, and ``max_top``: - ``max_size`` sets the maximum size cell that we want to make sure we have in the trees, so the root cells will be at least this large. The default is None, which means we care about all sizes, so there may be only one root cell (but typically more because of ``min_top``). - ``min_top`` sets the minimum number of initial levels to skip. The default is either 3 or :math:`\log_2(N_{cpu})`, whichever is larger. This means there will be at least 8 (or :math:`N_{cpu}`) root cells (assuming ntot is at least this large of course). - ``max_top`` sets the maximum number of initial levels to skip. The default is 10, which means there could be up to 1024 root cells. Finally, the ``split_method`` parameter sets how the points in a cell should be divided when forming the two daughter cells. The split is always done according to whichever dimension has the largest extent. E.g. if max(\|x - meanx\|) is larger than max(\|y - meany\|) and (for 3d) max(\|z - meanz\|), then it will split according to the x values. But then it may split in different ways according to ``split_method``. The allowed values are: - 'mean' means to divide the points at the average (mean) value of x, y or z. - 'median' means to divide the points at the median value of x, y, or z. - 'middle' means to divide the points at midpoint between the minimum and maximum values. - 'random' means to divide the points randomly somewhere between the 40th and 60th percentile locations in the sorted list. Field itself is an abstract base class for the specific types of field classes. As such, it cannot be constructed directly. You should make one of the concrete subclasses: - `NField` describes a field of objects to be counted only. - `KField` describes a field of points sampling a scalar field (e.g. kappa in the weak lensing context). In addition to the above values, cells keep track of the mean value in the given region. - `ZField` describes a complex scalar (spin-0) field. In addition to the above values, cells keep track of the mean (complex) value in the given region. - `VField` describes a field of points sampling a vector (spin-1) field. In addition to the above values, cells keep track of the mean (complex) vector in the given region. - `GField` describes a field of points sampling a shear (spin-2) field (e.g. gamma in the weak lensing context). In addition to the above values, cells keep track of the mean (complex) gamma value in the given region. - `TField` describes a field of points sampling a trefoil (spin-3) field. In addition to the above values, cells keep track of the mean (complex) value in the given region. - `QField` describes a field of points sampling a quatrefoil (spin-4) field. In addition to the above values, cells keep track of the mean (complex) value in the given region. """ def __init__(self): raise NotImplementedError("Field is an abstract base class. It cannot be instantiated.") def _determine_top(self, min_top, max_top): if min_top is None: n_cpu = get_omp_threads() # int.bit_length is a trick to avoid going through float. # bit_length(n-1) == ceil(log2(n)), which is what we want. min_top = max(3, int.bit_length(n_cpu-1)) else: min_top = int(min_top) max_top = int(max_top) min_top = min(min_top, max_top) # If min_top > max_top favor max_top. return min_top, max_top @property def nTopLevelNodes(self): """The number of top-level nodes. """ return self.data.getNTopLevel(); @property def cat(self): """The catalog from which this field was constructed. It is stored as a weakref, so if the Catalog has already been garbage collected, this might be None. """ # _cat is a weakref. This gets back to a Catalog object. return self._cat()
[docs] def count_near(self, *args, **kwargs): """Count how many points are near a given coordinate. Use the existing tree structure to count how many points are within some given separation of a target coordinate. There are several options for how to specify the reference coordinate, which depends on the type of coordinate system this field implements. 1. For flat 2-dimensional coordinates: Parameters: x (float): The x coordinate of the target location y (float): The y coordinate of the target location sep (float): The separation distance 2. For 3-dimensional Cartesian coordinates: Parameters: x (float): The x coordinate of the target location y (float): The y coordinate of the target location z (float): The z coordinate of the target location sep (float): The separation distance 3. For spherical coordinates: Parameters: ra (float or Angle): The right ascension of the target location dec (float or Angle): The declination of the target location c (CelestialCorod): A ``coord.CelestialCoord`` object in lieu of (ra, dec) sep (float or Angle): The separation distance ra_units (str): The units of ra if given as a float dec_units (str): The units of dec if given as a float sep_units (str): The units of sep if given as a float 4. For spherical coordinates with distances: Parameters: ra (float or Angle): The right ascension of the target location dec (float or Angle): The declination of the target location c (CelestialCorod): A ``coord.CelestialCoord`` object in lieu of (ra, dec) r (float): The distance to the target location sep (float): The separation distance ra_units (str): The units of ra if given as a float dec_units (str): The units of dec if given as a float In all cases, for parameters that are angles (ra, dec, sep for 'spherical'), you may either provide this quantity as a ``coord.Angle`` instance, or you may provide ra_units, dec_units or sep_units respectively to specify which angular units are providing. Finally, in cases where ra, dec are allowed, you may instead provide a ``coord.CelestialCoord`` instance as the first argument to specify both RA and Dec. """ if self.min_size == 0: # If min_size = 0, then regular method is already exact. x,y,z,sep = parse_xyzsep(args, kwargs, self._coords) return self._count_near(x, y, z, sep) else: # Otherwise, we need to expand the radius a bit and then check the actual radii # using the catalog values. This is already done in get_near, so just do that # and take the len of the result. return len(self.get_near(*args, **kwargs))
def _count_near(self, x, y, z, sep): # If self.min_size > 0, these results may be approximate, since the tree will have # grouped points within this separation together. return self.data.countNear(x, y, z, sep)
[docs] def get_near(self, *args, **kwargs): """Get the indices of points near a given coordinate. Use the existing tree structure to find the points that are within some given separation of a target coordinate. There are several options for how to specify the reference coordinate, which depends on the type of coordinate system this field implements. 1. For flat 2-dimensional coordinates: Parameters: x (float): The x coordinate of the target location y (float): The y coordinate of the target location sep (float): The separation distance 2. For 3-dimensional Cartesian coordinates: Parameters: x (float): The x coordinate of the target location y (float): The y coordinate of the target location z (float): The z coordinate of the target location sep (float): The separation distance 3. For spherical coordinates: Parameters: ra (float or Angle): The right ascension of the target location dec (float or Angle): The declination of the target location c (CelestialCorod): A ``coord.CelestialCoord`` object in lieu of (ra, dec) sep (float or Angle): The separation distance ra_units (str): The units of ra if given as a float dec_units (str): The units of dec if given as a float sep_units (str): The units of sep if given as a float 4. For spherical coordinates with distances: Parameters: ra (float or Angle): The right ascension of the target location dec (float or Angle): The declination of the target location c (CelestialCorod): A ``coord.CelestialCoord`` object in lieu of (ra, dec) r (float): The distance to the target location sep (float): The separation distance ra_units (str): The units of ra if given as a float dec_units (str): The units of dec if given as a float In all cases, for parameters that are angles (ra, dec, sep for 'spherical'), you may either provide this quantity as a ``coord.Angle`` instance, or you may provide ra_units, dec_units or sep_units respectively to specify which angular units are providing. Finally, in cases where ra, dec are allowed, you may instead provide a ``coord.CelestialCoord`` instance as the first argument to specify both RA and Dec. """ x,y,z,sep = parse_xyzsep(args, kwargs, self._coords) if self.min_size == 0: # If min_size == 0, then regular method is already exact. ind = self._get_near(x, y, z, sep) else: # Expand the radius by the minimum size of the cells. sep1 = sep + self.min_size # Get those indices ind = self._get_near(x, y, z, sep1) # Now check the actual radii of these points using the catalog x,y,z values. rsq = (self.cat.x[ind]-x)**2 + (self.cat.y[ind]-y)**2 if self._coords != _treecorr.Flat: rsq += (self.cat.z[ind]-z)**2 # Select the ones with r < sep near = rsq < sep**2 ind = ind[near] # It comes back unsorted, so sort it. (Not really required, but nicer output.) return np.sort(ind)
def _get_near(self, x, y, z, sep): # If self.min_size > 0, these results may be approximate, since the tree will have # grouped points within this separation together. # First count how many there are, so we can allocate the array for the indices. n = self._count_near(x, y, z, sep) indices = np.empty(n, dtype=int) # Now fill the array with the indices of the nearby points. self.data.getNear(x, y, z, sep, indices) return indices
[docs] def run_kmeans(self, npatch, *, max_iter=200, tol=1.e-5, init='tree', alt=False, rng=None): r"""Use k-means algorithm to set patch labels for a field. The k-means algorithm (cf. https://en.wikipedia.org/wiki/K-means_clustering) identifies a center position for each patch. Each point is then assigned to the patch whose center is closest. The centers are then updated to be the mean position of all the points assigned to the patch. This process is repeated until the center locations have converged. The process tends to converge relatively quickly. The convergence criterion we use is a tolerance on the rms shift in the centroid positions as a fraction of the overall size of the whole field. This is settable as ``tol`` (default 1.e-5). You can also set the maximum number of iterations to allow as ``max_iter`` (default 200). The upshot of the k-means process is to minimize the total within-cluster sum of squares (WCSS), also known as the "inertia" of each patch. This tends to produce patches with more or less similar inertia, which make them useful for jackknife or other sampling estimates of the errors in the correlation functions. More specifically, if the points :math:`j` have vector positions :math:`\vec x_j`, and we define patches :math:`S_i` to comprise disjoint subsets of the :math:`j` values, then the inertia :math:`I_i` of each patch is defined as: .. math:: I_i = \sum_{j \in S_i} \left| \vec x_j - \vec \mu_i \right|^2, where :math:`\vec \mu_i` is the center of each patch: .. math:: \vec \mu_i \equiv \frac{\sum_{j \in S_i} \vec x_j}{N_i}, and :math:`N_i` is the number of points assigned to patch :math:`S_i`. The k-means algorithm finds a solution that is a local minimum in the total inertia, :math:`\sum_i I_i`. In addition to the normal k-means algorithm, we also offer an alternate algorithm, which can produce slightly better patches for the purpose of patch-based covariance estimation. The ideal patch definition for such use would be to minimize the standard deviation (std) of the inertia of each patch, not the total (or mean) inertia. It turns out that it is difficult to devise an algorithm that literally does this, since it has a tendancy to become unstable and not converge. However, adding a penalty term to the patch assignment step of the normal k-means algorithm turns out to work reasonably well. The penalty term we use is :math:`f I_i`, where :math:`f` is a scaling constant (see below). When doing the assignment step we assign each point :math:`j` to the patch :math:`i` that gives the minimum penalized distance .. math:: d_{ij}^{\prime\;\! 2} = \left| \vec x_j - \mu_i \right|^2 + f I_i. The penalty term means that patches with less inertia get more points on the next iteration, and vice versa, which tends to equalize the inertia values somewhat. The resulting patches have significantly lower std inertia, but typically only slightly higher total inertia. For the scaling constant, :math:`f`, we chose .. math:: f = \frac{3}{\langle N_i\rangle}, three times the inverse of the mean number of points in each patch. The :math:`1/\langle N_i\rangle` factor makes the two terms of comparable magnitude near the edges of the patches, so patches still get most of the points near their previous centers, even if they already have larger than average inertia, but some of the points in the outskirts of the patch might switch to a nearby patch with smaller inertia. The factor of 3 is purely empirical, and was found to give good results in terms of std inertia on some test data (the DES SV field). The alternate algorithm is available by specifying ``alt=True``. Despite it typically giving better patch centers than the standard algorithm, we don't make it the default, because it may be possible for the iteration to become unstable, leading to some patches with no points in them. (This happened in our tests when the arbitrary factor in the scaling constant was 5 instead of 3, but I could not prove that 3 would always avoid this failure mode.) If this happens for you, your best bet is probably to switch to the standard algorithm, which can never suffer from this problem. Parameters: npatch (int): How many patches to generate max_iter (int): How many iterations at most to run. (default: 200) tol (float): Tolerance in the rms centroid shift to consider as converged as a fraction of the total field size. (default: 1.e-5) init (str): Initialization method. Options are: - 'tree' (default) = Use the normal tree structure of the field, traversing down to a level where there are npatch cells, and use the centroids of these cells as the initial centers. This is almost always the best choice. - 'random' = Use npatch random points as the intial centers. - 'kmeans++' = Use the k-means++ algorithm. cf. https://en.wikipedia.org/wiki/K-means%2B%2B alt (bool): Use the alternate assignment algorithm to minimize the standard deviation of the inertia rather than the total inertia (aka WCSS). (default: False) rng (RandomState): If desired, a numpy.random.RandomState instance to use for random number generation. (default: None) Returns: Tuple containing - patches (array): An array of patch labels, all integers from 0..npatch-1. Size is self.ntot. - centers (array): An array of center coordinates used to make the patches. Shape is (npatch, 2) for flat geometries or (npatch, 3) for 3d or spherical geometries. In the latter case, the centers represent (x,y,z) coordinates on the unit sphere. """ centers = self.kmeans_initialize_centers(npatch, init=init, rng=rng) self.kmeans_refine_centers(centers, max_iter=max_iter, tol=tol, alt=alt) patches = self.kmeans_assign_patches(centers) return patches, centers
[docs] def kmeans_initialize_centers(self, npatch, init='tree', *, rng=None): """Use the field's tree structure to assign good initial centers for a K-Means run. The classic K-Means algorithm involves starting with random points as the initial centers of the patches. This has a tendency to result in rather poor results in terms of having similar sized patches at the end. Specifically, the standard deviation of the inertia at the local minimum that the K-Means algorithm settles into tends to be fairly high for typical geometries. A better approach is to use the existing tree structure to start out with centers that are fairly evenly spread out through the field. This algorithm traverses the tree until we get to a level that has enough cells for the requested number of patches. Then it uses the centroids of these cells as the initial patch centers. Parameters: npatch (int): How many patches to generate initial centers for init (str): Initialization method. Options are: - 'tree' (default) = Use the normal tree structure of the field, traversing down to a level where there are npatch cells, and use the centroids of these cells as the initial centers. This is almost always the best choice. - 'random' = Use npatch random points as the intial centers. - 'kmeans++' = Use the k-means++ algorithm. cf. https://en.wikipedia.org/wiki/K-means%2B%2B rng (RandomState): If desired, a numpy.random.RandomState instance to use for random number generation. (default: None) Returns: An array of center coordinates. Shape is (npatch, 2) for flat geometries or (npatch, 3) for 3d or spherical geometries. In the latter case, the centers represent (x,y,z) coordinates on the unit sphere. """ if npatch > self.ntot: raise ValueError("Invalid npatch. Cannot be greater than self.ntot.") if npatch < 1: raise ValueError("Invalid npatch. Cannot be less than 1.") if self._coords == _treecorr.Flat: centers = np.empty((npatch, 2)) else: centers = np.empty((npatch, 3)) seed = 0 if rng is None else int(rng.random() * 2**63) if init == 'tree': self.data.KMeansInitTree(centers, int(npatch), seed) elif init == 'random': self.data.KMeansInitRand(centers, int(npatch), seed) elif init == 'kmeans++': self.data.KMeansInitKMPP(centers, int(npatch), seed) else: raise ValueError("Invalid init: %s. "%init + "Must be one of 'tree', 'random', or 'kmeans++.'") return centers
[docs] def kmeans_refine_centers(self, centers, *, max_iter=200, tol=1.e-5, alt=False): """Fast implementation of the K-Means algorithm The standard K-Means algorithm is as follows (cf. https://en.wikipedia.org/wiki/K-means_clustering): 1. Choose centers somehow. Traditionally, this is done by just selecting npatch random points from the full set, but we do this more smartly in `kmeans_initialize_centers`. 2. For each point, measure the distance to each current patch center, and assign it to the patch that has the closest center. 3. Update all the centers to be the centroid of the points assigned to each patch. 4. Repeat 2, 3 until the rms shift in the centers is less than some tolerance or the maximum number of iterations is reached. 5. Assign the corresponding patch label to each point (`kmeans_assign_patches`). In TreeCorr, we use the tree structure to massively increase the speed of steps 2 and 3. For a given cell, we know both its center and its size, so we can quickly check whether all the points in the cell are closer to one center than another. This lets us quickly cull centers from consideration as we traverse the tree. Once we get to a cell where only one center can be closest for any of the points in it, we stop traversing and assign the whole cell to that patch. Further, it is also fast to update the new centroid, since the sum of all the positions for a cell is just N times the cell's centroid. As a result, this algorithm typically takes a fraction of a second for ~a million points. Indeed most of the time spent in the full kmeans calculation is in building the tree in the first place, rather than actually running the kmeans code. With the alternate algorithm (``alt=True``), the time is only slightly slower from having to calculate the sizes at each step. Parameters: centers (array): An array of center coordinates. (modified by this function) Shape is (npatch, 2) for flat geometries or (npatch, 3) for 3d or spherical geometries. In the latter case, the centers represent (x,y,z) coordinates on the unit sphere. max_iter (int): How many iterations at most to run. (default: 200) tol (float): Tolerance in the rms centroid shift to consider as converged as a fraction of the total field size. (default: 1.e-5) alt (bool): Use the alternate assignment algorithm to minimize the standard deviation of the inertia rather than the total inertia (aka WCSS). (default: False) """ npatch = centers.shape[0] self.data.KMeansRun(centers, npatch, int(max_iter), float(tol), bool(alt))
[docs] def kmeans_assign_patches(self, centers): """Assign patch numbers to each point according to the given centers. This is final step in the full K-Means algorithm. It assignes patch numbers to each point in the field according to which center is closest. Parameters: centers (array): An array of center coordinates. Shape is (npatch, 2) for flat geometries or (npatch, 3) for 3d or spherical geometries. In the latter case, the centers represent (x,y,z) coordinates on the unit sphere. Returns: An array of patch labels, all integers from 0..npatch-1. Size is self.ntot. """ patches = np.empty(self.ntot, dtype=int) npatch = centers.shape[0] centers = np.ascontiguousarray(centers) self.data.KMeansAssign(centers, npatch, patches) return patches
[docs]class NField(Field): r"""This class stores the positions and number of objects in a tree structure from which it is efficient to compute correlation functions. An NField is typically created from a Catalog object using >>> nfield = cat.getNField(min_size=min_size, max_size=max_size) Parameters: cat (Catalog): The catalog from which to make the field. min_size (float): The minimum radius cell required (usually min_sep). (default: 0) max_size (float): The maximum radius cell required (usually max_sep). (default: None) split_method (str): Which split method to use ('mean', 'median', 'middle', or 'random'). (default: 'mean') brute (bool): Whether to force traversal to the leaves for this field. (default: False) min_top (int): The minimum number of top layers to use when setting up the field. (default: :math:`\max(3, \log_2(N_{\rm cpu}))`) max_top (int): The maximum number of top layers to use when setting up the field. (default: 10) coords (str): The kind of coordinate system to use. (default: cat.coords) rng (RandomState): If desired, a numpy.random.RandomState instance to use for random number generation. (default: None) logger (Logger): A logger file if desired. (default: None) """ def __init__(self, cat, *, min_size=0, max_size=None, split_method='mean', brute=False, min_top=None, max_top=10, coords=None, rng=None, logger=None): if logger: if cat.name != '': logger.info('Building NField from cat %s',cat.name) else: logger.info('Building NField') self._cat = weakref.ref(cat) self.ntot = cat.ntot self.min_size = float(min_size) if not brute else 0. self.max_size = float(max_size) if max_size is not None else np.inf self.split_method = split_method self._sm = _parse_split_method(split_method) self.brute = bool(brute) self.min_top, self.max_top = self._determine_top(min_top, max_top) self.coords = coords if coords is not None else cat.coords self._coords = coord_enum(self.coords) # These are the C++-layer enums seed = 0 if rng is None else int(rng.random() * 2**63) zx = cat.z if cat.z is not None else np.array([]) wpx = cat.wpos if cat.wpos is not None else np.array([]) if self._coords == _treecorr.Flat: self.data = _treecorr.NFieldFlat(cat.x, cat.y, zx, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) elif self._coords == _treecorr.Sphere: self.data = _treecorr.NFieldSphere(cat.x, cat.y, zx, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) else: self.data = _treecorr.NFieldThreeD(cat.x, cat.y, zx, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) if logger: logger.debug('Finished building NField (%s)',self.coords)
[docs]class KField(Field): r"""This class stores the values of a scalar field (e.g. kappa in the weak lensing context) in a tree structure from which it is efficient to compute correlation functions. A KField is typically created from a Catalog object using >>> kfield = cat.getKField(min_size, max_size, b) Parameters: cat (Catalog): The catalog from which to make the field. min_size (float): The minimum radius cell required (usually min_sep). (default: 0) max_size (float): The maximum radius cell required (usually max_sep). (default: None) split_method (str): Which split method to use ('mean', 'median', 'middle', or 'random'). (default: 'mean') brute (bool): Whether to force traversal to the leaves for this field. (default: False) min_top (int): The minimum number of top layers to use when setting up the field. (default: :math:`\max(3, \log_2(N_{\rm cpu}))`) max_top (int): The maximum number of top layers to use when setting up the field. (default: 10) coords (str): The kind of coordinate system to use. (default: cat.coords) rng (RandomState): If desired, a numpy.random.RandomState instance to use for random number generation. (default: None) logger (Logger): A logger file if desired. (default: None) """ def __init__(self, cat, *, min_size=0, max_size=None, split_method='mean', brute=False, min_top=None, max_top=10, coords=None, rng=None, logger=None): if logger: if cat.name != '': logger.info('Building KField from cat %s',cat.name) else: logger.info('Building KField') self._cat = weakref.ref(cat) self.ntot = cat.ntot self.min_size = float(min_size) if not brute else 0. self.max_size = float(max_size) if max_size is not None else np.inf self.split_method = split_method self._sm = _parse_split_method(split_method) self.brute = bool(brute) self.min_top, self.max_top = self._determine_top(min_top, max_top) self.coords = coords if coords is not None else cat.coords self._coords = coord_enum(self.coords) # These are the C++-layer enums seed = 0 if rng is None else int(rng.random() * 2**63) zx = cat.z if cat.z is not None else np.array([]) wpx = cat.wpos if cat.wpos is not None else np.array([]) if self._coords == _treecorr.Flat: self.data = _treecorr.KFieldFlat(cat.x, cat.y, zx, cat.k, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) elif self._coords == _treecorr.Sphere: self.data = _treecorr.KFieldSphere(cat.x, cat.y, zx, cat.k, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) else: self.data = _treecorr.KFieldThreeD(cat.x, cat.y, zx, cat.k, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) if logger: logger.debug('Finished building KField (%s)',self.coords)
[docs]class ZField(Field): r"""This class stores the values of a complex scalar (spin-0) field in a tree structure from which it is efficient to compute correlation functions. A ZField is typically created from a Catalog object using >>> zfield = cat.getZField(min_size, max_size, b) Parameters: cat (Catalog): The catalog from which to make the field. min_size (float): The minimum radius cell required (usually min_sep). (default: 0) max_size (float): The maximum radius cell required (usually max_sep). (default: None) split_method (str): Which split method to use ('mean', 'median', 'middle', or 'random'). (default: 'mean') brute (bool): Whether to force traversal to the leaves for this field. (default: False) min_top (int): The minimum number of top layers to use when setting up the field. (default: :math:`\max(3, \log_2(N_{\rm cpu}))`) max_top (int): The maximum number of top layers to use when setting up the field. (default: 10) coords (str): The kind of coordinate system to use. (default: cat.coords) rng (RandomState): If desired, a numpy.random.RandomState instance to use for random number generation. (default: None) logger (Logger): A logger file if desired. (default: None) """ def __init__(self, cat, *, min_size=0, max_size=None, split_method='mean', brute=False, min_top=None, max_top=10, coords=None, rng=None, logger=None): if logger: if cat.name != '': logger.info('Building ZField from cat %s',cat.name) else: logger.info('Building ZField') self._cat = weakref.ref(cat) self.ntot = cat.ntot self.min_size = float(min_size) if not brute else 0. self.max_size = float(max_size) if max_size is not None else np.inf self.split_method = split_method self._sm = _parse_split_method(split_method) self.brute = bool(brute) self.min_top, self.max_top = self._determine_top(min_top, max_top) self.coords = coords if coords is not None else cat.coords self._coords = coord_enum(self.coords) # These are the C++-layer enums seed = 0 if rng is None else int(rng.random_sample() * 2**63) zx = cat.z if cat.z is not None else np.array([]) wpx = cat.wpos if cat.wpos is not None else np.array([]) if self._coords == _treecorr.Flat: self.data = _treecorr.ZFieldFlat(cat.x, cat.y, zx, cat.z1, cat.z2, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) elif self._coords == _treecorr.Sphere: self.data = _treecorr.ZFieldSphere(cat.x, cat.y, zx, cat.z1, cat.z2, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) else: self.data = _treecorr.ZFieldThreeD(cat.x, cat.y, zx, cat.z1, cat.z2, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) if logger: logger.debug('Finished building ZField (%s)',self.coords)
[docs]class VField(Field): r"""This class stores the values of a vector field in a tree structure from which it is efficient to compute correlation functions. A VField is typically created from a Catalog object using >>> vfield = cat.getVField(min_size, max_size, b) Parameters: cat (Catalog): The catalog from which to make the field. min_size (float): The minimum radius cell required (usually min_sep). (default: 0) max_size (float): The maximum radius cell required (usually max_sep). (default: None) split_method (str): Which split method to use ('mean', 'median', 'middle', or 'random'). (default: 'mean') brute (bool): Whether to force traversal to the leaves for this field. (default: False) min_top (int): The minimum number of top layers to use when setting up the field. (default: :math:`\max(3, \log_2(N_{\rm cpu}))`) max_top (int): The maximum number of top layers to use when setting up the field. (default: 10) coords (str): The kind of coordinate system to use. (default: cat.coords) rng (RandomState): If desired, a numpy.random.RandomState instance to use for random number generation. (default: None) logger (Logger): A logger file if desired. (default: None) """ def __init__(self, cat, *, min_size=0, max_size=None, split_method='mean', brute=False, min_top=None, max_top=10, coords=None, rng=None, logger=None): if logger: if cat.name != '': logger.info('Building VField from cat %s',cat.name) else: logger.info('Building VField') self._cat = weakref.ref(cat) self.ntot = cat.ntot self.min_size = float(min_size) if not brute else 0. self.max_size = float(max_size) if max_size is not None else np.inf self.split_method = split_method self._sm = _parse_split_method(split_method) self.brute = bool(brute) self.min_top, self.max_top = self._determine_top(min_top, max_top) self.coords = coords if coords is not None else cat.coords self._coords = coord_enum(self.coords) # These are the C++-layer enums seed = 0 if rng is None else int(rng.random_sample() * 2**63) zx = cat.z if cat.z is not None else np.array([]) wpx = cat.wpos if cat.wpos is not None else np.array([]) if self._coords == _treecorr.Flat: self.data = _treecorr.VFieldFlat(cat.x, cat.y, zx, cat.v1, cat.v2, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) elif self._coords == _treecorr.Sphere: self.data = _treecorr.VFieldSphere(cat.x, cat.y, zx, cat.v1, cat.v2, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) else: self.data = _treecorr.VFieldThreeD(cat.x, cat.y, zx, cat.v1, cat.v2, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) if logger: logger.debug('Finished building VField (%s)',self.coords)
[docs]class GField(Field): r"""This class stores the values of a shear field (gamma in the weak lensing context) in a tree structure from which it is efficient to compute correlation functions. A GField is typically created from a Catalog object using >>> gfield = cat.getGField(min_size, max_size, b) Parameters: cat (Catalog): The catalog from which to make the field. min_size (float): The minimum radius cell required (usually min_sep). (default: 0) max_size (float): The maximum radius cell required (usually max_sep). (default: None) split_method (str): Which split method to use ('mean', 'median', 'middle', or 'random'). (default: 'mean') brute (bool): Whether to force traversal to the leaves for this field. (default: False) min_top (int): The minimum number of top layers to use when setting up the field. (default: :math:`\max(3, \log_2(N_{\rm cpu}))`) max_top (int): The maximum number of top layers to use when setting up the field. (default: 10) coords (str): The kind of coordinate system to use. (default: cat.coords) rng (RandomState): If desired, a numpy.random.RandomState instance to use for random number generation. (default: None) logger (Logger): A logger file if desired. (default: None) """ def __init__(self, cat, *, min_size=0, max_size=None, split_method='mean', brute=False, min_top=None, max_top=10, coords=None, rng=None, logger=None): if logger: if cat.name != '': logger.info('Building GField from cat %s',cat.name) else: logger.info('Building GField') self._cat = weakref.ref(cat) self.ntot = cat.ntot self.min_size = float(min_size) if not brute else 0. self.max_size = float(max_size) if max_size is not None else np.inf self.split_method = split_method self._sm = _parse_split_method(split_method) self.brute = bool(brute) self.min_top, self.max_top = self._determine_top(min_top, max_top) self.coords = coords if coords is not None else cat.coords self._coords = coord_enum(self.coords) # These are the C++-layer enums seed = 0 if rng is None else int(rng.random() * 2**63) zx = cat.z if cat.z is not None else np.array([]) wpx = cat.wpos if cat.wpos is not None else np.array([]) if self._coords == _treecorr.Flat: self.data = _treecorr.GFieldFlat(cat.x, cat.y, zx, cat.g1, cat.g2, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) elif self._coords == _treecorr.Sphere: self.data = _treecorr.GFieldSphere(cat.x, cat.y, zx, cat.g1, cat.g2, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) else: self.data = _treecorr.GFieldThreeD(cat.x, cat.y, zx, cat.g1, cat.g2, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) if logger: logger.debug('Finished building GField (%s)',self.coords)
[docs]class TField(Field): r"""This class stores the values of a trefoil (spin-3) field in a tree structure from which it is efficient to compute correlation functions. A TField is typically created from a Catalog object using >>> tfield = cat.getTField(min_size, max_size, b) Parameters: cat (Catalog): The catalog from which to make the field. min_size (float): The minimum radius cell required (usually min_sep). (default: 0) max_size (float): The maximum radius cell required (usually max_sep). (default: None) split_method (str): Which split method to use ('mean', 'median', 'middle', or 'random'). (default: 'mean') brute (bool): Whether to force traversal to the leaves for this field. (default: False) min_top (int): The minimum number of top layers to use when setting up the field. (default: :math:`\max(3, \log_2(N_{\rm cpu}))`) max_top (int): The maximum number of top layers to use when setting up the field. (default: 10) coords (str): The kind of coordinate system to use. (default: cat.coords) rng (RandomState): If desired, a numpy.random.RandomState instance to use for random number generation. (default: None) logger (Logger): A logger file if desired. (default: None) """ def __init__(self, cat, *, min_size=0, max_size=None, split_method='mean', brute=False, min_top=None, max_top=10, coords=None, rng=None, logger=None): if logger: if cat.name != '': logger.info('Building TField from cat %s',cat.name) else: logger.info('Building TField') self._cat = weakref.ref(cat) self.ntot = cat.ntot self.min_size = float(min_size) if not brute else 0. self.max_size = float(max_size) if max_size is not None else np.inf self.split_method = split_method self._sm = _parse_split_method(split_method) self.brute = bool(brute) self.min_top, self.max_top = self._determine_top(min_top, max_top) self.coords = coords if coords is not None else cat.coords self._coords = coord_enum(self.coords) # These are the C++-layer enums seed = 0 if rng is None else int(rng.random_sample() * 2**63) zx = cat.z if cat.z is not None else np.array([]) wpx = cat.wpos if cat.wpos is not None else np.array([]) if self._coords == _treecorr.Flat: self.data = _treecorr.TFieldFlat(cat.x, cat.y, zx, cat.t1, cat.t2, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) elif self._coords == _treecorr.Sphere: self.data = _treecorr.TFieldSphere(cat.x, cat.y, zx, cat.t1, cat.t2, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) else: self.data = _treecorr.TFieldThreeD(cat.x, cat.y, zx, cat.t1, cat.t2, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) if logger: logger.debug('Finished building TField (%s)',self.coords)
[docs]class QField(Field): r"""This class stores the values of a quatrefoil (spin-4) field in a tree structure from which it is efficient to compute correlation functions. A QField is typically created from a Catalog object using >>> qfield = cat.getQField(min_size, max_size, b) Parameters: cat (Catalog): The catalog from which to make the field. min_size (float): The minimum radius cell required (usually min_sep). (default: 0) max_size (float): The maximum radius cell required (usually max_sep). (default: None) split_method (str): Which split method to use ('mean', 'median', 'middle', or 'random'). (default: 'mean') brute (bool): Whether to force traversal to the leaves for this field. (default: False) min_top (int): The minimum number of top layers to use when setting up the field. (default: :math:`\max(3, \log_2(N_{\rm cpu}))`) max_top (int): The maximum number of top layers to use when setting up the field. (default: 10) coords (str): The kind of coordinate system to use. (default: cat.coords) rng (RandomState): If desired, a numpy.random.RandomState instance to use for random number generation. (default: None) logger (Logger): A logger file if desired. (default: None) """ def __init__(self, cat, *, min_size=0, max_size=None, split_method='mean', brute=False, min_top=None, max_top=10, coords=None, rng=None, logger=None): if logger: if cat.name != '': logger.info('Building QField from cat %s',cat.name) else: logger.info('Building QField') self._cat = weakref.ref(cat) self.ntot = cat.ntot self.min_size = float(min_size) if not brute else 0. self.max_size = float(max_size) if max_size is not None else np.inf self.split_method = split_method self._sm = _parse_split_method(split_method) self.brute = bool(brute) self.min_top, self.max_top = self._determine_top(min_top, max_top) self.coords = coords if coords is not None else cat.coords self._coords = coord_enum(self.coords) # These are the C++-layer enums seed = 0 if rng is None else int(rng.random_sample() * 2**63) zx = cat.z if cat.z is not None else np.array([]) wpx = cat.wpos if cat.wpos is not None else np.array([]) if self._coords == _treecorr.Flat: self.data = _treecorr.QFieldFlat(cat.x, cat.y, zx, cat.q1, cat.q2, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) elif self._coords == _treecorr.Sphere: self.data = _treecorr.QFieldSphere(cat.x, cat.y, zx, cat.q1, cat.q2, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) else: self.data = _treecorr.QFieldThreeD(cat.x, cat.y, zx, cat.q1, cat.q2, cat.w, wpx, self.min_size, self.max_size, self._sm, seed, self.brute, self.min_top, self.max_top) if logger: logger.debug('Finished building QField (%s)',self.coords)