Source code for pixell.utils

import numpy as np, scipy.ndimage, os, errno, scipy.optimize, time, datetime, warnings, re, sys
try: xrange
except: xrange = range
try: basestring
except: basestring = str

degree = np.pi/180
arcmin = degree/60
arcsec = arcmin/60
fwhm   = 1.0/(8*np.log(2))**0.5
T_cmb = 2.72548 # +/- 0.00057
c  = 299792458.0
h  = 6.62606957e-34
k  = 1.3806488e-23
e  = 1.60217662e-19
G  = 6.67430e-11
sb = 5.670374419e-8
AU = 149597870700.0
minute = 60
hour   = 60*minute
day    = 24*hour
yr     = 365.2422*day
ly     = c*yr
pc     = AU/arcsec
Jy     = 1e-26
yr2days = yr/day
day2sec = day/1.0

# Particle masses
m_e     = 9.1093837015e-31 # Electron mass, kg
m_p     = 1.6726219237e-27 # Proton mass
m_n     = 1.6749274980e-27 # Neutron mass

# Cross sections and rates
sigma_T = 6.6524587158e-29 # Thomson scattering cross section, m²
sigma_sb = 5.670374419e-8  # Stefan-Boltzmann constant

# Solar system constants. Nice to have, unlikely to clash with anything, and
# don't take up much space.
R_sun     = 695700e3 ; M_sun     = 1.9885e30 ; r_sun     =   29e3*ly ; L_sun = 3.827e26
R_mercury = 2439.5e3 ; M_mercury = 0.330e24  ; r_mercury =   57.9e9
R_venus   = 6052e3   ; M_venus   = 4.87e24   ; r_venus   =  108.2e9
R_earth   = 6378.1e3 ; M_earth   = 5.9722e24 ; r_earth   =  149.6e9
R_moon    = 1737.5e3 ; M_moon    = 0.073e24  ; r_moon    =    0.384e9
R_mars    = 3396e3   ; M_mars    = 0.642e24  ; r_mars    =  227.9e9
R_jupiter = 71492e3  ; M_jupiter = 1898e24   ; r_jupiter =  778.6e9
R_saturn  = 60268e3  ; M_saturn  = 568e24    ; r_saturn  = 1433.5e9
R_uranus  = 25559e3  ; M_uranus  = 86.8e24   ; r_uranus  = 2872.5e9
R_neptune = 24764e3  ; M_neptune = 102e24    ; r_neptune = 4495.1e9
R_pluto   = 1185e3   ; M_pluto   = 0.0146e24 ; r_pluto   = 5906.4e9

# These are like degree, arcmin and arcsec, but turn any lists
# they touch into arrays.
a    = np.array(1.0)
adeg = np.array(degree)
amin = np.array(arcmin)
asec = np.array(arcsec)

def l2ang(l):
    """Compute the angular scale roughly corresponding to a given multipole.
    Based on matching the number of alm degrees of freedom with map degrees
    of freedom."""
    return (4*np.pi)**0.5/(l+1)

def ang2l(ang):
    """Compute the multipole roughly corresponding to a given angular scale.
    Based on matching the number of alm degrees of freedom with map degrees
    of freedom."""
    return (4*np.pi)**0.5/ang-1

def D(f, eps=1e-10):
    """Clever derivative operator for function f(x) from Ivan Yashchuck.
    Accurate to second order in eps. Only calls f(x) once to evaluate the
    derivative, but f must accept complex arguments. Only works for real x.
    Example usage: D(lambda x: x**4)(1) => 4.0"""
    def Df(x):
        return f(x+eps*1j).imag / eps
    return Df
def lines(file_or_fname):
    """Iterates over lines in a file, which can be specified either as
    a filename or as a file object."""
    if isinstance(file_or_fname, basestring):
        with open(file_or_fname, "r") as file:
            for line in file:
                yield line
    else:
        for line in file_or_fname:
            yield line

def touch(fname):
    with open(fname, "a"):
        os.utime(fname)

def listsplit(seq, elem):
    """Analogue of str.split for lists.
    listsplit([1,2,3,4,5,6,7],4) -> [[1,2,3],[5,6,7]]."""
    # Sadly, numpy arrays misbehave, and must be treated specially
    def iseq(e1, e2): return np.all(e1 == e2)
    inds   = [i for i, v in enumerate(seq) if iseq(v, elem)]
    ranges = zip([0]+[i+1 for i in inds], inds+[len(seq)])
    return [seq[a:b] for a, b in ranges]

def streq(x, s):
    """Check if x is the string s. This used to be simply "x is s", but that
    now causes a warning. One can't just do "x == s", as that causes a numpy
    warning and will fail in the future."""
    return isinstance(x, basestring) and x == s

def find(array, vals, default=None):
    """Return the indices of each value of vals in the given array."""
    if np.asarray(vals).size == 0: return []
    array = np.asarray(array)
    order = np.argsort(array)
    cands = np.minimum(np.searchsorted(array, vals, sorter=order), len(array)-1)
    res   = order[cands]
    bad   = array[res] != vals
    if np.any(bad):
        if default is None: raise ValueError("Value not found in array")
        else: res[bad] = default
    return res

def find_any(array, vals):
    """Like find, but skips missing entries."""
    res = find(array, vals, default=-1)
    return res[res >= 0]

def nearest_ind(arr, vals, sorted=False):
    """Given array arr and values vals, return the index of the entry in arr
    with value closest to each entry in vals."""
    arr = np.asarray(arr)
    if not sorted:
        order = np.argsort(arr)
        arr   = arr[order]
    inds  = np.searchsorted(arr, vals)
    # The closest one will be either arr[i-1] or arr[i]. Simply check both.
    # Cap to 1 below to handle edge case. Still correct.
    inds  = np.clip(inds, 1, len(arr)-1)
    diff1 = np.abs(arr[inds-1]-vals)
    diff2 = np.abs(arr[inds  ]-vals)
    # Entries where diff1 is smallest should point one earlier
    inds -= diff1 <= diff2
    # Undo sorting if necessary
    if not sorted:
        inds = order[inds]
    return inds
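# Illustrative usage (not part of the module): for each value, nearest_ind
# returns the index of the closest entry in arr.
# >>> nearest_ind([0.0, 1.0, 2.0, 4.0], [0.9, 3.1])
# array([1, 3])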
def contains(array, vals):
    """Given an array[n], returns a boolean res[n], which is True for any
    element in array that is also in vals, and False otherwise."""
    array = np.asarray(array)
    vals  = np.asarray(vals)
    vals  = np.sort(vals)
    inds  = np.searchsorted(vals, array)
    # If a value would be inserted after the end, it wasn't
    # present in the original array.
    inds[inds>=len(vals)] = 0
    return vals[inds] == array

def common_vals(arrs):
    """Given a list of arrays, returns their intersection.
    For example common_vals([[1,2,3,4,5],[2,4,6,8]]) -> [2,4]"""
    res = arrs[0]
    for arr in arrs[1:]:
        res = np.intersect1d(res, arr)
    return res

def common_inds(arrs):
    """Given a list of arrays, returns the indices into each of them of their
    common elements. For example
    common_inds([[1,2,3,4,5],[2,4,6,8]]) -> [[1,3],[0,1]]"""
    vals = common_vals(arrs)
    return [find(arr, vals) for arr in arrs]

def union(arrs):
    """Given a list of arrays, returns their union."""
    res = arrs[0]
    for arr in arrs[1:]:
        res = np.union1d(res, arr)
    return res

def inverse_order(order):
    """If order represents a reordering of an array, such as that returned by
    np.argsort, inverse_order(order) returns a new reordering that can be used
    to recover the old one. Example:

    a = np.array([6,102,32,20,0,91,1910])
    order = np.argsort(a)
    print(a[order]) => [0,6,20,32,91,102,1910]
    invorder = inverse_order(order)
    print(a[order][invorder]) => [6,102,32,20,0,91,1910] # same as a
    """
    invorder = np.empty(len(order), int)
    invorder[order] = np.arange(len(order))
    return invorder

def complement_inds(inds, n):
    """Given a subset of range(0,n), return the missing values.
    E.g. complement_inds([0,2,4],7) => [1,3,5,6]"""
    mask = np.ones(n, bool)
    mask[inds] = False
    return np.where(mask)[0]

def dict_apply_listfun(dict, function):
    """Applies a function that transforms one list to another with the same
    number of elements to the values in a dictionary, returning a new
    dictionary with the same keys as the input dictionary, but the values
    given by the results of the function acting on the input dictionary's
    values. I.e. if f(x) = x[::-1], then
    dict_apply_listfun({"a":1,"b":2},f) = {"a":2,"b":1}."""
    keys = dict.keys()
    vals = [dict[key] for key in keys]
    res  = function(vals)
    return {key: res[i] for i, key in enumerate(keys)}

def fallback(*args):
    for arg in args:
        if arg is not None: return arg
    return None

def unwind(a, period=2*np.pi, axes=[-1], ref=0, refmode="left", mask_nan=False):
    """Given a list of angles or other cyclic coordinates where a and a+period
    have the same physical meaning, make them continuous by removing any sudden
    jumps due to period-wrapping. I.e. [0.07,0.02,6.25,6.20] would become
    [0.07,0.02,-0.03,-0.08] with the default period of 2*pi."""
    res = rewind(a, period=period, ref=ref)
    for axis in axes:
        with flatview(res, axes=[axis]) as flat:
            if mask_nan:
                # Avoid trying to sum nans
                mask = ~np.isfinite(flat)
                bad  = flat[mask]
                flat[mask] = 0
            # step[i] = val[i+1]-val[i]
            steps = nint((flat[:,1:]-flat[:,:-1])/period)
            if refmode == "left":
                flat[:,1:] -= np.cumsum(np.round((flat[:,1:]-flat[:,:-1])/period),-1)*period
            elif refmode == "middle":
                # Use the middle element as the reference point that won't be changed
                iref = flat.shape[-1]//2
                # Values [0:iref] have offs -cumsum(steps[iref-1::-1])
                # Values [iref+1:n] have offs cumsum(steps[iref:])
                loffs = -np.cumsum(steps[:,iref-1::-1],1)[:,::-1]*period
                roffs =  np.cumsum(steps[:,iref:],1)*period
                flat[:,:iref]   -= loffs
                flat[:,iref+1:] -= roffs
            else:
                raise ValueError("Unsupported refmode '%s'" % str(refmode))
            if mask_nan:
                # Restore any nans
                flat[mask] = bad
    return res
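# Illustrative usage (not part of the module), matching the docstring example:
# >>> unwind([0.07, 0.02, 6.25, 6.20])
# array([ 0.07,  0.02, -0.03, -0.08])   (approximately)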
def rewind(a, ref=0, period=2*np.pi):
    """Given a list of angles or other cyclic coordinates, add or subtract
    multiples of the period in order to ensure that they all lie within the
    same period. The ref argument specifies the angle furthest away from the
    cut, i.e. the period cut will be at ref+period/2."""
    a = np.asanyarray(a)
    if streq(ref, "auto"):
        ref = np.sort(a.reshape(-1))[a.size//2]
    return ref + (a-ref+period/2.)%period - period/2.

def cumsplit(sizes, capacities):
    """Given a set of sizes (of files for example) and a set of capacities
    (of disks for example), returns the index of the sizes for which each new
    capacity becomes necessary, assuming sizes can be split across boundaries.
    For example cumsplit([1,1,2,0,1,3,1],[3,2,5]) -> [2,5]"""
    return np.searchsorted(np.cumsum(sizes), np.cumsum(capacities), side="right")

def mask2range(mask):
    """Convert a binary mask [True,True,False,True,...] into a set of
    ranges [:,{start,stop}]."""
    # We consider the outside of the array to be False
    mask  = np.concatenate([[False],mask,[False]]).astype(np.int8)
    # Find where we enter and exit ranges with true mask
    dmask = mask[1:]-mask[:-1]
    start = np.where(dmask>0)[0]
    stop  = np.where(dmask<0)[0]
    return np.array([start,stop]).T
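# Illustrative usage (not part of the module): each row is a half-open
# [start,stop) range of consecutive True values.
# >>> mask2range([True, True, False, True])
# array([[0, 2],
#        [3, 4]])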
def repeat_filler(d, n):
    """Form an array n elements long by repeatedly concatenating d and d[::-1]."""
    d    = np.concatenate([d,d[::-1]])
    nmul = (n+d.size-1)//d.size
    dtot = np.concatenate([d]*nmul)
    return dtot[:n]

def deslope(d, w=1, inplace=False, axis=-1, avg=np.mean):
    """Remove a slope and mean from d, matching up the beginning and end of d.
    The w parameter controls the number of samples from each end of d that is
    used to determine the value to match up."""
    if not inplace: d = np.array(d)
    with flatview(d, axes=[axis]) as dflat:
        for di in dflat:
            di -= np.arange(di.size)*(avg(di[-w:])-avg(di[:w]))/(di.size-1)+avg(di[:w])
    return d
def ctime2mjd(ctime):
    """Converts from unix time to modified julian date."""
    return np.asarray(ctime)/86400. + 40587.0

def mjd2ctime(mjd):
    """Converts from modified julian date to unix time."""
    return (np.asarray(mjd)-40587.0)*86400

def mjd2djd(mjd): return np.asarray(mjd) + 2400000.5 - 2415020
def djd2mjd(djd): return np.asarray(djd) - 2400000.5 + 2415020
def mjd2jd(mjd): return np.asarray(mjd) + 2400000.5
def jd2mjd(jd): return np.asarray(jd) - 2400000.5
def ctime2djd(ctime): return mjd2djd(ctime2mjd(ctime))
def djd2ctime(djd): return mjd2ctime(djd2mjd(djd))
def ctime2jd(ctime): return mjd2jd(ctime2mjd(ctime))
def jd2ctime(jd): return mjd2ctime(jd2mjd(jd))
def medmean(x, axis=None, frac=0.5):
    x = np.asarray(x)
    if axis is None: x = x.reshape(-1)
    else: x = np.moveaxis(x, axis, -1)
    x = np.sort(x, -1)
    i = int(x.shape[-1]*frac)//2
    return np.mean(x[...,i:-i],-1)

def maskmed(arr, mask=None, axis=-1, maskval=0):
    """Median of array along the given axis, but ignoring entries with the
    given mask value."""
    if mask is None: mask = arr != maskval
    marr = np.ma.array(arr, mask=mask==0)
    res  = np.ma.median(marr, axis=axis)
    if isinstance(res, np.ma.MaskedArray):
        res = res.filled(maskval)
    return res

def moveaxis(a, o, n): return np.moveaxis(a, o, n)
def moveaxes(a, old, new): return np.moveaxis(a, old, new)
def weighted_quantile(map, ivar, quantile, axis=-1):
    """Multidimensional weighted quantile. Takes the given quantile along the
    given axis (default last axis) of the array "map". Each element along the
    axis is given weight from the corresponding element in "ivar". This is
    based on the weighted percentile method in
    https://en.wikipedia.org/wiki/Percentile.

    Arguments:
     map:      The array to find quantiles for. Must broadcast with ivar.
     ivar:     The weight array. Must broadcast with map.
     quantile: The quantiles to evaluate.
     axis:     The axis to take the quantiles along.

    If post-broadcast map and ivar have shape A when excluding the
    quantile-axis, and quantile has shape B, then the result will have
    shape B+A."""
    map, ivar = np.broadcast_arrays(map, ivar)
    quantile  = np.asfarray(quantile)
    axis      = axis % map.ndim
    # Move axis to end
    map  = np.moveaxis(map,  axis, -1)
    ivar = np.moveaxis(ivar, axis, -1)
    # Store original shape and reshape to 2d
    ishape = map.shape[:-1]
    qshape = quantile.shape
    n      = map.shape[-1]
    map      = map .reshape(-1, n)   # [A,n]
    ivar     = ivar.reshape(-1, n)   # [A,n]
    quantile = quantile.reshape(-1)  # [B]
    # Sort
    order = np.argsort(map, -1)
    map   = np.asfarray(np.take_along_axis(map,  order, -1))
    ivar  = np.asfarray(np.take_along_axis(ivar, order, -1))
    # We don't have interp or searchsorted for this case, so do it ourselves.
    # The 0.5 part corresponds to the C=0.5 case in the method
    icum = np.cumsum(ivar, axis=-1)  # [A,n]
    ends = icum[:,-1,None]
    # Avoid division by zero for zero total weight case
    icum = (icum - 0.5*ivar)/np.where(ends>0, ends, 1)  # [A,n]
    # Find the point left of our quantile. [A,n],[B,A1]=>[B,A]
    i1   = search(icum, quantile[:,None])
    # This interpolation should maybe be factorized out into its own function,
    # maybe an improved version of np.interp.
    # 3 cases:
    # 1. i1 == 0: We're left of the leftmost point. Should just use map[...,0] without interp
    # 2. i1 == n: We're right of the rightmost point. Should just use map[...,-1] without interp
    # 3. otherwise: interp between i1-1 and i1
    linds = np.where(i1 == 0)  # [B,A]. same for other masks
    rinds = np.where(i1 == n)
    cinds = np.where((i1>0)&(i1<n))
    res   = np.zeros(i1.shape, np.result_type(map, ivar, quantile))  # [B,A]
    res[linds] = map[..., 0][linds[1:]]
    res[rinds] = map[...,-1][rinds[1:]]
    cflat = icum[cinds[1:]]      # [C,n]
    mflat = map [cinds[1:]]      # [C,n]
    qflat = quantile[cinds[:1]]  # [C]
    inds  = np.arange(len(cflat))  # [C]
    ci    = i1[cinds]              # [C]
    x     = (qflat-cflat[inds,ci-1])/(cflat[inds,ci]-cflat[inds,ci-1])  # [C]
    res[cinds] = mflat[inds,ci-1]*(1-x)+mflat[inds,ci]*x
    # Restore flattened dimensions
    res = res.reshape(qshape+ishape)
    if res.ndim == 0: res = res*1
    return res
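# Illustrative usage (not part of the module): with most of the weight on the
# last sample, the weighted median is pulled towards it. The exact value
# depends on the linear interpolation between the weighted percentile points.
# >>> weighted_quantile([1., 2., 3.], [1., 1., 10.], 0.5)
# 2.818...   (approximately)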
def weighted_median(map, ivar=1, axis=-1):
    """Compute the multidimensional weighted median. See weighted_quantile
    for details."""
    return weighted_quantile(map, ivar, 0.5, axis=axis)

def partial_flatten(a, axes=[-1], pos=0):
    """Flatten all dimensions of a except those mentioned in axes, and put the
    flattened one at the given position. Example: if a.shape is [1,2,3,4], then
    partial_flatten(a,[-1],0).shape is [6,4]."""
    # Move the selected axes first
    a = moveaxes(a, axes, range(len(axes)))
    # Flatten all the other axes
    a = a.reshape(a.shape[:len(axes)]+(-1,))
    # Move the flattened axis to the target position
    return np.moveaxis(a, -1, pos)

def partial_expand(a, shape, axes=[-1], pos=0):
    """Undo a partial flatten. Shape is the shape of the original array before
    flattening, and axes and pos should be the same as those passed to the
    flatten operation."""
    a    = np.moveaxis(a, pos, -1)
    axes = np.array(axes)%len(shape)
    rest = list(np.delete(shape, axes))
    a    = np.reshape(a, list(a.shape[:len(axes)])+rest)
    return moveaxes(a, range(len(axes)), axes)
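# Illustrative usage (not part of the module): round-tripping through
# partial_flatten and partial_expand recovers the original shape.
# >>> a = np.zeros((1,2,3,4))
# >>> f = partial_flatten(a, [-1], 0)          # shape (6,4)
# >>> partial_expand(f, a.shape, [-1], 0).shape
# (1, 2, 3, 4)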
def addaxes(a, axes):
    axes = np.array(axes,int)
    axes[axes<0] += a.ndim
    axes = np.sort(axes)[::-1]
    inds = [slice(None) for i in a.shape]
    for ax in axes: inds.insert(ax, None)
    return a[tuple(inds)]

def delaxes(a, axes):
    axes = np.array(axes,int)
    axes[axes<0] += a.ndim
    axes = np.sort(axes)[::-1]
    inds = [slice(None) for i in a.shape]
    for ax in axes: inds[ax] = 0
    return a[tuple(inds)]

class flatview:
    """Produce a read/writable flattened view of the given array, via
        with flatview(arr) as farr:
            do stuff with farr
    Changes to farr are propagated into the original array. Flattens all
    dimensions of the array except those mentioned in axes, and puts the
    flattened one at the given position."""
    def __init__(self, array, axes=[], mode="rwc", pos=0):
        self.array = array
        self.axes  = axes
        self.flat  = None
        self.mode  = mode
        self.pos   = pos
    def __enter__(self):
        self.flat = partial_flatten(self.array, self.axes, pos=self.pos)
        if "c" in self.mode:
            self.flat = np.ascontiguousarray(self.flat)
        return self.flat
    def __exit__(self, type, value, traceback):
        # Copy back out from flat into the original array, if necessary
        if "w" not in self.mode: return
        if np.shares_memory(self.array, self.flat): return
        # We need to copy back out
        self.array[:] = partial_expand(self.flat, self.array.shape, self.axes, pos=self.pos)
class nowarn:
    """Use in a with block to suppress warnings inside that block."""
    def __enter__(self):
        self.filters = list(warnings.filters)
        warnings.filterwarnings("ignore")
        return self
    def __exit__(self, type, value, traceback):
        warnings.filters = self.filters

def dedup(a):
    """Removes consecutive equal values from a 1d array, returning the result.
    The original is not modified."""
    return a[np.concatenate([[True],a[1:]!=a[:-1]])]

def interpol(a, inds, order=3, mode="nearest", mask_nan=False, cval=0.0, prefilter=True):
    """Given an array a[{x},{y}] and a list of float indices into a,
    inds[len(y),{z}], returns interpolated values at these positions
    as [{x},{z}]."""
    a    = np.asanyarray(a)
    inds = np.asanyarray(inds)
    inds_orig_nd = inds.ndim
    if inds.ndim == 1: inds = inds[:,None]
    npre = a.ndim - inds.shape[0]
    res  = np.empty(a.shape[:npre]+inds.shape[1:],dtype=a.dtype)
    fa, fr = partial_flatten(a, range(npre,a.ndim)), partial_flatten(res, range(npre, res.ndim))
    if mask_nan:
        mask = ~np.isfinite(fa)
        fa[mask] = 0
    for i in range(fa.shape[0]):
        fr[i].real = scipy.ndimage.map_coordinates(fa[i].real, inds, order=order, mode=mode, cval=cval, prefilter=prefilter)
        if np.iscomplexobj(fa[i]):
            fr[i].imag = scipy.ndimage.map_coordinates(fa[i].imag, inds, order=order, mode=mode, cval=cval, prefilter=prefilter)
    if mask_nan and np.sum(mask) > 0:
        fmask = np.empty(fr.shape,dtype=bool)
        for i in range(mask.shape[0]):
            fmask[i] = scipy.ndimage.map_coordinates(mask[i], inds, order=0, mode=mode, cval=cval, prefilter=prefilter)
        fr[fmask] = np.nan
    if inds_orig_nd == 1: res = res[...,0]
    return res
def interpol_prefilter(a, npre=None, order=3, inplace=False, mode="nearest"):
    if order < 2: return a
    a = np.asanyarray(a)
    if not inplace: a = a.copy()
    if npre is None: npre = max(0, a.ndim - 2)
    if npre < 0: npre = a.ndim + npre
    # spline_filter was looping through the enmap pixel by pixel with getitem.
    # Not using flatview got around it, but I don't understand why it happened
    # in the first place.
    for I in nditer(a.shape[:npre]):
        a[I] = scipy.ndimage.spline_filter(a[I], order=order, mode=mode)
    return a

def interp(x, xp, fp, left=None, right=None, period=None):
    """Unlike utils.interpol, this is a simple wrapper around np.interp that
    extends it to support fp[...,n] instead of just fp[n]. It does this by
    looping over the other dimensions in python, and calling np.interp for
    each entry in the pre-dimensions. So this function does not save any time
    over doing that looping manually, but it avoids typing this annoying loop
    over and over."""
    x, xp, fp = [np.asanyarray(a) for a in [x, xp, fp]]
    fp_flat = fp.reshape(-1, fp.shape[-1])
    f_flat  = np.empty((fp_flat.shape[0],)+x.shape, fp.dtype)
    for i in range(len(fp_flat)):
        f_flat[i] = np.interp(x, xp, fp_flat[i], left=left, right=right, period=period)
    f = f_flat.reshape(fp.shape[:-1]+x.shape)
    return f
def bin_multi(pix, shape, weights=None):
    """Simple multidimensional binning. Not very fast. Given pix[{coords},:]
    where coords are indices into an array with shape shape, count the number
    of hits in each pixel, returning map[shape]."""
    pix  = np.maximum(np.minimum(pix, (np.array(shape)-1)[:,None]),0)
    inds = np.ravel_multi_index(tuple(pix), tuple(shape))
    size = np.prod(shape)
    if weights is not None: weights = inds*0+weights
    return np.bincount(inds, weights=weights, minlength=size).reshape(shape)

def bincount(pix, weights=None, minlength=0):
    """Like numpy.bincount, but allows pre-dimensions, which must broadcast."""
    pix, weights = broadcast_arrays(pix, weights)
    n   = max(np.max(pix)+1, minlength)
    res = np.zeros(pix.shape[:-1]+(n,), np.float64 if weights is None else weights.dtype)
    for I in nditer(pix.shape[:-1]):
        res[I] = np.bincount(pix[I], weights=None if weights is None else weights[I], minlength=n)
    return res

def grid(box, shape, endpoint=True, axis=0, flat=False):
    """Given a bounding box[{from,to},ndim] and shape[ndim] in each direction,
    returns an [ndim,shape[0],shape[1],...] array of evenly spaced numbers.
    If endpoint is True (default), then the end point is included. Otherwise,
    the last sample is one step away from the end of the box. For one
    dimension, this is similar to linspace:
        linspace(0,1,4)     =>  [0.0000, 0.3333, 0.6667, 1.0000]
        grid([[0],[1]],[4]) => [[0.0000, 0.3333, 0.6667, 1.0000]]
    """
    n    = np.asarray(shape)
    box  = np.asfarray(box)
    off  = -1 if endpoint else 0
    inds = np.rollaxis(np.indices(n),0,len(n)+1)  # (d1,d2,d3,...,indim)
    res  = inds * (box[1]-box[0])/(n+off) + box[0]
    if flat: res = res.reshape(-1, res.shape[-1])
    return np.rollaxis(res, -1, axis)

def cumsum(a, endpoint=False, axis=None):
    """As numpy.cumsum for a 1d array a, but starts from 0. If endpoint is
    True, the result will have one more element than the input, and the last
    element will be the sum of the array. Otherwise (the default), it will
    have the same length as the array, and the last element will be the sum
    of the first n-1 elements."""
    a = np.asanyarray(a)
    if axis is None:
        a    = a.reshape(-1)
        axis = 0
    axis %= a.ndim
    cum = np.cumsum(a, axis=axis)
    if endpoint:
        ca = np.zeros(a.shape[:axis]+(a.shape[axis]+1,)+a.shape[axis+1:], cum.dtype)
        ca[(slice(None),)*axis+(slice(1,None),)] = cum
    else:
        ca = np.zeros(a.shape, cum.dtype)
        ca[(slice(None),)*axis+(slice(1,None),)] = cum[(slice(None),)*axis+(slice(0,-1),)]
    return ca
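# Illustrative usage (not part of the module): like np.cumsum, but the result
# starts at 0 instead of at the first element.
# >>> cumsum([1, 2, 3])
# array([0, 1, 3])
# >>> cumsum([1, 2, 3], endpoint=True)
# array([0, 1, 3, 6])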
def pixwin_1d(f, order=0):
    """Calculate the 1D pixel window for the dimensionless frequency f
    corresponding to a pixel spacing of 1 (so the Nyquist frequency is 0.5).
    The order argument controls the interpolation order assumed in the
    mapmaker. order = 0 corresponds to standard nearest-neighbor mapmaking.
    order = 1 corresponds to linear interpolation. For a multidimensional
    (e.g. 2d) image, the full pixel window will be the outer product of this
    pixel window along each axis."""
    if order is None:
        return f*0+1
    elif order == 0:
        return np.sinc(f)
    elif order == 1:
        return np.sinc(f)**2/(1/3*(2+np.cos(2*np.pi*f)))
    else:
        raise ValueError("Unsupported order '%s'" % str(order))
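# Illustrative sketch (not part of the module): building the 2d pixel window
# as the outer product of 1d windows along each axis, as the docstring
# describes. fy and fx are hypothetical per-axis frequency grids.
# >>> fy = np.fft.fftfreq(64)[:,None]       # frequencies along axis 0
# >>> fx = np.fft.fftfreq(64)[None,:]       # frequencies along axis 1
# >>> win2d = pixwin_1d(fy)*pixwin_1d(fx)   # shape (64,64)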
def nearest_product(n, factors, direction="below"):
    """Compute the product of positive integer powers of the specified factors
    that is nearest to n in the given direction ("below" or "above"). This is
    done using a simple, O(n) brute-force algorithm."""
    below = direction=="below"
    ni    = floor(n) if below else ceil(n)
    if 1 in factors: return ni
    nmax  = ni+1 if below else ni*min(factors)+1
    # a keeps track of all the visited multiples
    a     = np.zeros(nmax+1,dtype=bool)
    a[1]  = True
    best  = None
    for i in range(ni+1):
        if not a[i]: continue
        for f in factors:
            m = i*f
            if below:
                if m > n: continue
                else: best = m
            else:
                if m >= n and (best is None or best > m): best = m
            if m < a.size: a[m] = True
    return best

def mkdir(path):
    # It's useful to be able to do mkdir(os.path.dirname(fname)) to create the
    # directory a file should be in if it's missing. If fname has no directory
    # component, dirname returns "". This check prevents that from causing an error.
    if path == "": return
    try:
        os.makedirs(path)
    except OSError as exception:
        if exception.errno != errno.EEXIST:
            raise
def decomp_basis(basis, vec):
    return np.linalg.solve(basis.dot(basis.T), basis.dot(vec.T)).T

def find_period(d, axis=-1):
    dwork = partial_flatten(d, [axis])
    guess = find_period_fourier(dwork)
    res   = np.empty([3,len(dwork)])
    for i, (d1, g1) in enumerate(zip(dwork, guess)):
        res[:,i] = find_period_exact(d1, g1)
    periods = res[0].reshape(d.shape[:axis]+d.shape[axis:][1:])
    phases  = res[1].reshape(d.shape[:axis]+d.shape[axis:][1:])
    chisqs  = res[2].reshape(d.shape[:axis]+d.shape[axis:][1:])
    return periods, phases, chisqs

def find_period_fourier(d, axis=-1):
    """This is a simple second-order estimate of the period of the
    assumed-periodic signal d. It finds the frequency with the highest power
    using an fft, and partially compensates for nonperiodicity by taking a
    weighted mean of the position of the top."""
    d2 = partial_flatten(d, [axis])
    fd = np.fft.rfft(d2)
    ps = np.abs(fd)**2
    ps[:,0] = 0
    periods = []
    for p in ps:
        n = np.argmax(p)
        r = [int(n*0.5),int(n*1.5)+1]
        denom = np.sum(p[r[0]:r[1]])
        if denom <= 0: denom = 1
        n2 = np.sum(np.arange(r[0],r[1])*p[r[0]:r[1]])/denom
        periods.append(float(d.shape[axis])/n2)
    return np.array(periods).reshape(d.shape[:axis]+d.shape[axis:][1:])

def find_period_exact(d, guess):
    n = d.size
    # Restrict to at most 10 fiducial periods
    n = int(min(10,n/float(guess))*guess)
    off = (d.size-n)//2
    d = d[off:off+n]
    def chisq(x):
        w,phase = x
        model = interpol(d, np.arange(n)[None]%w+phase, order=1)
        return np.var(d-model)
    period,phase = scipy.optimize.fmin_powell(chisq, [guess,guess], xtol=1, disp=False)
    return period, phase+off, chisq([period,phase])/np.var(d**2)

def find_sweeps(az, tol=0.2):
    """Given an array "az" that sweeps up and down between approximately
    constant minimum and maximum values, returns an array sweeps[:,{i1,i2}],
    which gives the start and end index of each such sweep. For example, if az
    starts at 0 at sample 0, increases to 1 at sample 1000, falls to -1 at
    sample 2000, increases to 1 at sample 2500 and then falls to 0.5 at sample
    3000 where it ends, then the function will return
    [[0,1000],[1000,2000],[2000,2500],[2500,3000]]. The tol parameter
    determines how close to the extremum values of the array it will look for
    turnarounds. It shouldn't normally need to be adjusted."""
    az = np.asarray(az)
    # Find and label the areas near the turnarounds
    amin, amax = minmax(az)
    amid, aamp = (amax+amin)/2, (amax-amin)/2
    aabs = np.abs(az-amid)
    labels, nlabel = scipy.ndimage.label(aabs > aamp*(1-tol))
    # Find the extremum point in each of these
    turns  = np.array(scipy.ndimage.maximum_position(aabs, labels, np.arange(1,nlabel+1)))[:,0]
    turns  = np.unique(np.concatenate([[0],turns,[len(az)]]))
    sweeps = np.array([turns[:-1],turns[1:]]).T
    return sweeps
def equal_split(weights, nbin):
    """Split weights into nbin bins such that the total weight in each bin is
    as close to equal as possible. Returns a list of indices for each bin."""
    inds = np.argsort(weights)[::-1]
    bins = [[] for b in xrange(nbin)]
    bw   = np.zeros([nbin])
    for i in inds:
        j = np.argmin(bw)
        bins[j].append(i)
        bw[j] += weights[i]
    return bins

def range_sub(a, b, mapping=False):
    """Given a set of ranges a[:,{from,to}] and b[:,{from,to}], return a new
    set of ranges c[:,{from,to}] which corresponds to the ranges in a with
    those in b removed. This might split individual ranges into multiple ones.
    If mapping=True, two extra objects are returned. The first is a mapping
    from each output range to the position in a it comes from. The second is
    a corresponding mapping from the set of cut a and b ranges to indices into
    a and b, with b indices being encoded as -i-1. a and b are assumed to be
    internally non-overlapping.

    Example: utils.range_sub([[0,100],[200,1000]], [[1,2],[3,4],[8,999]], mapping=True)
    (array([[   0,    1],
            [   2,    3],
            [   4,    8],
            [ 999, 1000]]),
     array([0, 0, 0, 1]),
     array([ 0, -1,  1, -2,  2, -3,  3]))

    The last array can be interpreted as: Moving along the number line, we
    first encounter [0,1], which is a part of range 0 in c. We then encounter
    range 0 in b ([1,2]), before we hit [2,3], which is part of range 1 in c.
    Then comes range 1 in b ([3,4]), followed by [4,8], which is part of range
    2 in c, followed by range 2 in b ([8,999]) and finally [999,1000], which
    is part of range 3 in c.

    The same call without mapping:
    utils.range_sub([[0,100],[200,1000]], [[1,2],[3,4],[8,999]])
    array([[   0,    1],
           [   2,    3],
           [   4,    8],
           [ 999, 1000]])
    """
    def fixshape(a):
        a = np.asarray(a)
        if a.size == 0: a = np.zeros([0,2],dtype=int)
        return a
    a      = fixshape(a)
    b      = fixshape(b)
    ainds  = np.argsort(a[:,0])
    binds  = np.argsort(b[:,0])
    rainds = np.arange(len(a))[ainds]
    rbinds = np.arange(len(b))[binds]
    a      = a[ainds]
    b      = b[binds]
    ai,bi  = 0,0
    c      = []
    abmap  = []
    rmap   = []
    while ai < len(a):
        # Iterate b until it ends past the start of a
        while bi < len(b) and b[bi,1] <= a[ai,0]:
            abmap.append(-rbinds[bi]-1)
            bi += 1
        # Now handle each b until the start of b is past the end of a
        pstart = a[ai,0]
        while bi < len(b) and b[bi,0] <= a[ai,1]:
            r = (pstart,min(a[ai,1],b[bi,0]))
            if r[1]-r[0] > 0:
                abmap.append(len(c))
                rmap.append(rainds[ai])
                c.append(r)
            abmap.append(-rbinds[bi]-1)
            pstart = b[bi,1]
            bi += 1
        # Then append what remains
        r = (pstart,a[ai,1])
        if r[1] > r[0]:
            abmap.append(len(c))
            rmap.append(rainds[ai])
            c.append(r)
        else:
            # If b extended beyond the end of a, then we need to consider it
            # again for the next a, so undo the previous increment. This may
            # lead to the same b being added twice. We will handle that by
            # removing duplicates at the end.
            bi -= 1
        # And advance to the next range in a
        ai += 1
    c = np.array(c)
    # Remove duplicates if necessary
    abmap = dedup(np.array(abmap))
    rmap  = np.array(rmap)
    return (c, rmap, abmap) if mapping else c

def range_union(a, mapping=False):
    """Given a set of ranges a[:,{from,to}], return a new set where all
    overlapping ranges have been merged, where to >= from. If mapping=True,
    then the mapping from old to new ranges is also returned."""
    # We will make a single pass through a in sorted order
    a    = np.asarray(a)
    n    = len(a)
    inds = np.argsort(a[:,0])
    rmap = np.zeros(n,dtype=int)-1
    b    = []
    # i will point at the first unprocessed range
    for i in xrange(n):
        if rmap[inds[i]] >= 0: continue
        rmap[inds[i]] = len(b)
        start, end = a[inds[i]]
        # loop through every unprocessed range in range
        for j in xrange(i+1,n):
            if rmap[inds[j]] >= 0: continue
            if a[inds[j],0] > end: break
            # This range overlaps, so register it and merge
            rmap[inds[j]] = len(b)
            end = max(end, a[inds[j],1])
        b.append([start,end])
    b = np.array(b)
    if b.size == 0: b = b.reshape(0,2)
    return (b,rmap) if mapping else b

def range_normalize(a):
    """Given a set of ranges a[:,{from,to}], normalize the ranges such that
    no ranges are empty, and all ranges go in increasing order. Decreasing
    ranges are interpreted the same way as in a slice, e.g. empty."""
    a  = np.asarray(a)
    n1 = len(a)
    a  = a[a[:,1]!=a[:,0]]
    reverse = a[:,1]<a[:,0]
    a  = a[~reverse]
    n2 = len(a)
    return a

def range_cut(a, c):
    """Cut range list a at positions given by c. For example
    range_cut([[0,10],[20,100]],[0,2,7,30,200]) -> [[0,2],[2,7],[7,10],[20,30],[30,100]]."""
    return range_sub(a, np.dstack([c,c])[0])
def compress_beam(sigma, phi):
    sigma = np.asarray(sigma,dtype=float)
    c,s = np.cos(phi),np.sin(phi)
    R = np.array([[c,-s],[s,c]])
    C = np.diag(sigma**-2)
    C = R.dot(C).dot(R.T)
    return np.array([C[0,0],C[1,1],C[0,1]])

def expand_beam(irads, return_V=False):
    C = np.array([[irads[0],irads[2]],[irads[2],irads[1]]])
    E, V = np.linalg.eigh(C)
    phi = np.arctan2(V[1,0],V[0,0])
    sigma = E**-0.5
    if sigma[1] > sigma[0]:
        sigma = sigma[::-1]
        phi += np.pi/2
    phi %= np.pi
    if return_V: return sigma, phi, V
    else: return sigma, phi

def combine_beams(irads_array):
    Cs = np.array([[[ir[0],ir[2]],[ir[2],ir[1]]] for ir in irads_array])
    Ctot = np.eye(2)
    for C in Cs:
        E, V = np.linalg.eigh(C)
        B    = (V*E[None]**0.5).dot(V.T)
        Ctot = B.dot(Ctot).dot(B.T)
    return np.array([Ctot[0,0],Ctot[1,1],Ctot[0,1]])

def regularize_beam(beam, cutoff=1e-2, nl=None, normalize=False):
    """Given a beam transfer function beam[...,nl], replace small values with
    an extrapolation that has the property that the ratio of any pair of such
    regularized beams is constant in the extrapolated region."""
    beam = np.asarray(beam)
    if normalize: beam /= np.max(beam)
    # Get the length of the output beam, and the l to which both exist
    if nl is None: nl = beam.shape[-1]
    nl_both = min(nl, beam.shape[-1])
    # Build the extrapolation for the full range. We will overwrite the part
    # we want to keep unextrapolated later.
    l     = np.maximum(1,np.arange(nl))
    vcut  = np.max(beam,-1)*cutoff
    above = beam > vcut
    lcut  = np.argmin(above, -1)
    if lcut == 0: lcut = np.array(above.shape[-1]-1)
    if lcut > nl: return beam[:nl]
    obeam = vcut * (l/lcut)**(2*np.log(cutoff))
    # Get the mask for what we want to keep. This looks complicated, but that's
    # just to support arbitrary dimensionality (maybe that wasn't really necessary).
    mask  = np.zeros(obeam.shape, int)
    iflat = lcut.reshape(-1) + np.arange(lcut.size)*nl
    mask.reshape(-1)[iflat] = 1
    mask  = np.cumsum(mask,-1) < 0.5
    obeam[:nl_both] = np.where(mask[:nl_both], beam[:nl_both], obeam[:nl_both])
    return obeam
def read_lines(fname, col=0):
    """Read lines from file fname, returning them as a list of strings. If
    fname ends with :slice, then the specified slice will be applied to the
    list before returning."""
    toks = fname.split(":")
    fname, fslice = toks[0], ":".join(toks[1:])
    lines = [line.split()[col] for line in open(fname,"r") if line[0] != "#"]
    n = len(lines)
    return eval("lines"+fslice)

def loadtxt(fname):
    """As numpy.loadtxt, but allows slice syntax."""
    toks = fname.split(":")
    fname, fslice = toks[0], ":".join(toks[1:])
    a = np.loadtxt(fname)
    return eval("a"+fslice)

def atleast_3d(a):
    a = np.asanyarray(a)
    if a.ndim == 0: return a.reshape(1,1,1)
    elif a.ndim == 1: return a.reshape(1,1,-1)
    elif a.ndim == 2: return a.reshape((1,)+a.shape)
    else: return a

def atleast_Nd(a, n):
    """Prepend length-1 dimensions to array a to make it n-dimensional."""
    a = np.asanyarray(a)
    if a.ndim >= n: return a
    else: return a[(None,)*(n-a.ndim)]

def to_Nd(a, n, axis=0, return_inverse=False):
    a = np.asanyarray(a)
    if n >= a.ndim:
        # make -1 add at end instead of in front of the end
        if axis < 0: axis = a.ndim+1+axis
        res = a.reshape(a.shape[:axis]+(1,)*(n-a.ndim)+a.shape[axis:])
    else:
        if axis < 0: axis = n+axis
        res = a.reshape(a.shape[:axis]+(-1,)+a.shape[axis+1+a.ndim-n:])
    return (res, a.shape) if return_inverse else res
def preflat(a, n):
    """Flatten the first n dimensions of a. If n is negative, flatten all but
    the last -n dimensions."""
    a = np.asanyarray(a)
    if n < 0: n = a.ndim+n
    return a.reshape((-1,)+a.shape[n:])

def postflat(a, n):
    """Flatten the last n dimensions of a. If n is negative, flatten all but
    the first -n dimensions."""
    a = np.asanyarray(a)
    if n < 0: n = a.ndim+n
    return a.reshape(a.shape[:a.ndim-n]+(-1,))
def between_angles(a, range, period=2*np.pi):
    a = rewind(a, np.mean(range), period=period)
    return (a>=range[0])&(a<range[1])

def hasoff(val, off, tol=1e-6):
    """Return True if val's deviation from an integer value equals off to the
    given tolerance (default: 1e-6). Example: hasoff(17.3, 0.3) == True"""
    return np.abs((val-off+0.5)%1-0.5) < tol

def same_array(a, b):
    """Returns true if a and b are the same array."""
    return a.shape == b.shape and a.dtype == b.dtype and repr(a.data) == repr(b.data) and a.strides == b.strides

def fix_zero_strides(a):
    """Given an array a, return the same array with any zero stride along a
    length-one axis, such as those introduced by None-indexing, replaced with
    an equivalent nonzero stride."""
    # Find last non-zero stride
    good_strides = [s for s in a.strides if s != 0]
    last = good_strides[-1] if len(good_strides) > 0 else a.itemsize
    ostrides = []
    for i in range(a.ndim-1,-1,-1):
        s = a.strides[i]
        n = a.shape[i]
        if s == 0 and n == 1:
            if i == a.ndim-1: s = last
            else: s = last * a.shape[i+1]
        ostrides.append(s)
        last = s
    ostrides = tuple(ostrides[::-1])
    oarr = np.lib.stride_tricks.as_strided(a, strides=ostrides)
    return oarr
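# Illustrative usage (not part of the module): None-indexing introduces a
# zero stride, which fix_zero_strides replaces with an equivalent value.
# The exact numbers assume float64 on a typical 64-bit build.
# >>> a = np.zeros((3,4))[None]
# >>> a.strides
# (0, 32, 8)
# >>> fix_zero_strides(a).strides
# (96, 32, 8)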
def greedy_split(data, n=2, costfun=max, workfun=lambda w,x: x if w is None else x+w):
    """Given a list of elements data, return indices that would split them
    into n subsets such that cost is approximately minimized. costfun
    specifies which cost to minimize, with the default being the value of the
    data themselves. workfun specifies how to combine multiple values:
    workfun(workval,datum) => workval. costfun then operates on a list of the
    total workval for each group: cost = costfun([workval,workval,...]).

    Example:
      greedy_split(range(10)) => [[9,6,5,2,1,0],[8,7,4,3]]
      greedy_split([1,10,100]) => [[2],[1,0]]
      greedy_split("012345",costfun=lambda x:sum([xi**2 for xi in x]),
        workfun=lambda w,x:0 if x is None else int(x)+w)
        => [[5,2,1,0],[4,3]]
    """
    # Sort data based on standalone costs
    costs  = []
    nowork = workfun(None,None)
    work   = [nowork for i in xrange(n)]
    for d in data:
        work[0] = workfun(nowork,d)
        costs.append(costfun(work))
    order = np.argsort(costs)[::-1]
    # Build groups using a greedy algorithm
    groups = [[] for i in xrange(n)]
    work   = [nowork for i in xrange(n)]
    cost   = costfun(work)
    for di in order:
        d = data[di]
        # Try adding to each group
        for i in xrange(n):
            iwork = workfun(work[i],d)
            icost = costfun(work[:i]+[iwork]+work[i+1:])
            if i == 0 or icost < best[2]: best = (i,iwork,icost)
        # Add it to the best group
        i, iwork, icost = best
        groups[i].append(di)
        work[i] = iwork
        cost    = icost
    return groups, cost, work

def greedy_split_simple(data, n=2):
    """Split array "data" into n lists such that each list has approximately
    the same sum, using a greedy algorithm."""
    inds = np.argsort(data)[::-1]
    rn   = range(n)
    sums = [0 for i in rn]
    res  = [[] for i in rn]
    for i in inds:
        small = 0
        for j in rn:
            if sums[j] < sums[small]: small = j
        sums[small] += data[i]
        res[small].append(i)
    return res

def cov2corr(C):
    """Scale rows and columns of C such that its diagonal becomes one. This
    produces a correlation matrix from a covariance matrix. Returns the scaled
    matrix and the square root of the original diagonal."""
    std  = np.diag(C)**0.5
    istd = 1/std
    return np.einsum("ij,i,j->ij",C,istd,istd), std

def corr2cov(corr, std):
    """Given a matrix "corr" and an array "std", return a version of corr
    with each row and column scaled by the corresponding entry in std. This
    is the reverse of cov2corr."""
    return np.einsum("ij,i,j->ij",corr,std,std)

def eigsort(A, nmax=None, merged=False):
    """Return the eigenvalue decomposition of the real, symmetric matrix A.
    The eigenvalues will be sorted from largest to smallest. If nmax is
    specified, only the nmax largest eigenvalues (and corresponding vectors)
    will be returned. If merged is specified, E and V will not be returned
    separately. Instead, Q=VE**0.5 will be returned, such that QQ' = VEV'."""
    E,V  = np.linalg.eigh(A)
    inds = np.argsort(E)[::-1][:nmax]
    if merged: return V[:,inds]*E[inds][None]**0.5
    else: return E[inds],V[:,inds]
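# Illustrative usage (not part of the module): recovering A from the merged
# factor Q, since QQ' = VEV' = A for a symmetric matrix A.
# >>> A = np.array([[2., 1.], [1., 2.]])
# >>> Q = eigsort(A, merged=True)
# >>> np.allclose(Q.dot(Q.T), A)
# True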
def nodiag(A):
    """Returns matrix A with its diagonal set to zero."""
    A = np.array(A)
    np.fill_diagonal(A,0)
    return A

def date2ctime(dstr):
    import dateutil.parser
    d = dateutil.parser.parse(dstr, ignoretz=True, tzinfos=0)
    return time.mktime(d.timetuple())

def bounding_box(boxes):
    """Compute bounding box for a set of boxes [:,2,:], or a set of
    points [:,2]."""
    boxes = np.asarray(boxes)
    if boxes.ndim == 2:
        return np.array([np.min(boxes,0),np.max(boxes,0)])
    else:
        return np.array([np.min(boxes[:,0,:],0),np.max(boxes[:,1,:],0)])

def unpackbits(a):
    return np.unpackbits(np.atleast_1d(a).view(np.uint8)[::-1])[::-1]
def box2corners(box):
    """Given a [{from,to},:] bounding box, returns [ncorner,:] coordinates
    of all its corners."""
    box  = np.asarray(box)
    ndim = box.shape[1]
    return np.array([[box[b,bi] for bi,b in enumerate(unpackbits(i)[:ndim])] for i in range(2**ndim)])

def box2contour(box, nperedge=5):
    """Given a [{from,to},:] bounding box, returns [npoint,:] coordinates
    defining its edges. nperedge is the number of samples per edge of the box
    to use. For nperedge=2 this is equal to box2corners. nperedge can be a
    list, in which case the number indicates the number to use in each
    dimension."""
    box      = np.asarray(box)
    ndim     = box.shape[1]
    nperedge = np.zeros(ndim,int)+nperedge
    # Generate the range of each coordinate
    points = []
    for i in range(ndim):
        x = np.linspace(box[0,i],box[1,i],nperedge[i])
        for j in range(2**ndim):
            bits = unpackbits(j)[:ndim]
            if bits[i]: continue
            y = np.zeros((len(x),ndim))
            y[:] = box[bits,np.arange(ndim)]
            y[:,i] = x
            points.append(y)
    return np.concatenate(points,0)
def box_slice(a, b):
    """Given two boxes/boxarrays of shape [{from,to},dims] or
    [:,{from,to},dims], compute the bounds of the part of each b that overlaps
    with each a, relative to the corner of a. For example
    box_slice([[2,5],[10,10]],[[0,0],[5,7]]) -> [[0,0],[3,2]]."""
    a  = np.asarray(a)
    b  = np.asarray(b)
    fa = a.reshape(-1,2,a.shape[-1])
    fb = b.reshape(-1,2,b.shape[-1])
    s  = np.minimum(np.maximum(0,fb[None,:]-fa[:,None,0,None]),fa[:,None,1,None]-fa[:,None,0,None])
    return s.reshape(a.shape[:-2]+b.shape[:-2]+(2,2))

def box_area(a):
    """Compute the area of a [{from,to},ndim] box, or an array of such boxes."""
    return np.abs(np.prod(a[...,1,:]-a[...,0,:],-1))

def box_overlap(a, b):
    """Given two boxes/boxarrays, compute the overlap of each box with each
    other box, returning the area of the overlaps. If a is [2,ndim] and b is
    [2,ndim], the result will be a single number. If a is [n,2,ndim] and b is
    [2,ndim], the result will be a shape [n] array. If a is [n,2,ndim] and b
    is [m,2,ndim], the result will be [n,m] areas."""
    return box_area(box_slice(a,b))
def widen_box(box, margin=1e-3, relative=True):
    box    = np.asarray(box)
    margin = np.zeros(box.shape[1:])+margin
    if relative: margin = (box[1]-box[0])*margin
    margin = np.asarray(margin)  # Support 1d case
    margin[box[0]>box[1]] *= -1
    return np.array([box[0]-margin/2, box[1]+margin/2])

def pad_box(box, padding):
    """How I should have implemented widen_box from the beginning. Simply pads
    a box by an absolute amount. The only complication is the sign stuff that
    handles descending axes in the box."""
    box  = np.array(box, copy=True)
    sign = np.sign(box[...,1,:]-box[...,0,:])
    box[...,0,:] -= padding*sign
    box[...,1,:] += padding*sign
    return box

def unwrap_range(range, nwrap=2*np.pi):
    """Given a logically ordered range[{from,to},...] that may have been
    exposed to wrapping with period nwrap, undo the wrapping so that
    range[1] > range[0] but range[1]-range[0] is as small as possible. Also
    makes the range straddle 0 if possible. Unlike unwind and rewind, this
    function will not turn a very wide range into a small one, because it
    doesn't assume that ranges are shorter than half the sky. But it still
    shortens ranges that are longer than a whole wrapping period."""
    range = np.asanyarray(range)
    range[1] -= np.floor((range[1]-range[0])/nwrap)*nwrap
    range -= np.floor(range[1,None]/nwrap)*nwrap
    return range

def sum_by_id(a, ids, axis=0):
    ra = np.moveaxis(a, axis, 0)
    fa = ra.reshape(ra.shape[0],-1)
    fb = np.zeros((np.max(ids)+1,fa.shape[1]),fa.dtype)
    for i,id in enumerate(ids):
        fb[id] += fa[i]
    rb = fb.reshape((fb.shape[0],)+ra.shape[1:])
    return np.moveaxis(rb, 0, axis)

def pole_wrap(pos):
    """Given pos[{lat,lon},...], normalize coordinates so that lat is always
    between -pi/2 and pi/2. Coordinates outside this range are mirrored around
    the poles, and for each mirroring a phase of pi is added to lon."""
    pos = pos.copy()
    lat, lon = pos  # references to components of pos
    halforbit = np.floor((lat+np.pi/2)/np.pi).astype(int)
    front = halforbit % 2 == 0
    back  = ~front
    # Get rid of most of the looping
    lat -= np.pi*halforbit
    # Then handle the "backside" of the sky, where lat is between pi/2 and 3pi/2
    lat[back] = -lat[back]
    lon[back]+= np.pi
    return pos
def allreduce(a, comm, op=None):
    """Convenience wrapper for Allreduce that returns the result rather than
    needing an output argument."""
    a   = np.asanyarray(a)
    res = np.zeros_like(a)
    if op is None: comm.Allreduce(a, res)
    else: comm.Allreduce(a, res, op)
    return res

def reduce(a, comm, root=0, op=None):
    res = np.zeros_like(a) if comm.rank == root else None
    if op is None: comm.Reduce(a, res, root=root)
    else: comm.Reduce(a, res, op, root=root)
    return res

def allgather(a, comm):
    """Convenience wrapper for Allgather that returns the result rather than
    needing an output argument."""
    a   = np.asarray(a)
    res = np.zeros((comm.size,)+a.shape,dtype=a.dtype)
    if np.issubdtype(a.dtype, np.string_):
        comm.Allgather(a.view(dtype=np.uint8), res.view(dtype=np.uint8))
    else:
        comm.Allgather(a, res)
    return res

def allgatherv(a, comm, axis=0):
    """Perform an mpi allgatherv along the specified axis of the array a,
    returning an array with the individual process arrays concatenated along
    that dimension. For example allgatherv([[1,2]],comm) on one task and
    allgatherv([[3,4],[5,6]],comm) on another task results in
    [[1,2],[3,4],[5,6]] for both tasks."""
    a = np.asarray(a)
    # Get the dtypes of all non-empty arrays, and use this to harmonize all
    # the arrays' dtypes.
    dtypes = [dtype for dtype in comm.allgather(a.dtype if a.size > 0 else None) if dtype is not None]
    if len(dtypes) == 0: return a
    dtype = np.result_type(*dtypes)
    a = a.astype(dtype, copy=False)
    # Put the axis first, as that's what Allgatherv wants
    fa = np.moveaxis(a, axis, 0)
    # Do the same for the shapes, to figure out what the non-gather dimensions should be
    shapes = [shape[1:] for shape in comm.allgather(fa.shape) if np.prod(shape) != 0]
    # All arrays are empty, so just return what we had
    if len(shapes) == 0: return a
    # Otherwise make sure we have the right shape
    fa = fa.reshape((len(fa),)+shapes[0])
    # mpi4py doesn't handle all types. But why not just do this for everything?
    must_fix = np.issubdtype(a.dtype, np.str_) or a.dtype == bool
    if must_fix:
        fa = fa.view(dtype=np.uint8)
    ra = fa.reshape(fa.shape[0],-1) if fa.size > 0 else fa.reshape(0,np.prod(fa.shape[1:],dtype=int))
    N  = ra.shape[1]
    n  = allgather([len(ra)],comm)
    o  = cumsum(n)
    rb = np.zeros((np.sum(n),N),dtype=ra.dtype)
    comm.Allgatherv(ra, (rb, (n*N,o*N)))
    fb = rb.reshape((rb.shape[0],)+fa.shape[1:])
    # Restore original data type
    if must_fix:
        fb = fb.view(dtype=a.dtype)
    return np.moveaxis(fb, 0, axis)
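# Illustrative sketch (not part of the module): gathering differently-sized
# per-task arrays with allgatherv. Assumes mpi4py is available and the script
# is launched under mpirun.
# >>> from mpi4py import MPI
# >>> comm = MPI.COMM_WORLD
# >>> mine = np.arange(comm.rank+1)        # rank 0: [0], rank 1: [0,1], ...
# >>> full = allgatherv(mine, comm)        # same concatenation on all tasks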
def send(a, comm, dest=0, tag=0):
    """Faster version of comm.send for numpy arrays. Avoids slow pickling.
    Used with recv below."""
    a = np.asanyarray(a)
    comm.send((a.shape,a.dtype), dest=dest, tag=tag)
    comm.Send(a, dest=dest, tag=tag)

def recv(comm, source=0, tag=0):
    """Faster version of comm.recv for numpy arrays. Avoids slow pickling.
    Used with send above."""
    shape, dtype = comm.recv(source=source, tag=tag)
    res = np.empty(shape, dtype)
    comm.Recv(res, source=source, tag=tag)
    return res

def tuplify(a):
    try: return tuple(a)
    except TypeError: return (a,)

def resize_array(arr, size, axis=None, val=0):
    """Return a new array equal to arr but with the given axis reshaped to the
    given sizes. Inserted elements will be set to val."""
    arr  = np.asarray(arr)
    size = tuplify(size)
    axis = range(len(size)) if axis is None else tuplify(axis)
    axis = [a%arr.ndim for a in axis]
    oshape = np.array(arr.shape)
    oshape[np.array(axis)] = size
    res  = np.full(oshape, val, arr.dtype)
    slices = tuple([slice(0,min(s1,s2)) for s1,s2 in zip(arr.shape,res.shape)])
    res[slices] = arr[slices]
    return res
# This function does a lot of slice logic, and that actually makes it pretty
# slow when dealing with large numbers of small boxes. It's tempting to move
# the slow parts into fortran... But the way I've set things up there's no
# natural module to put that in. The slowest part is sbox_intersect, which
# deals with variable-length lists, which is also bad for fortran.
def redistribute(iarrs, iboxes, oboxes, comm, wrap=0):
    """Given the array iarrs[[{pre},{dims}]] which represents slices
    garr[...,narr,ibox[0,0]:ibox[0,1]:ibox[0,2],ibox[1,0]:ibox[1,1]:ibox[1,2],etc]
    of some larger, distributed array garr, returns a different slice of the
    global array given by obox."""
    iarrs  = [np.asanyarray(iarr) for iarr in iarrs]
    iboxes = sbox_fix(iboxes)
    oboxes = sbox_fix(oboxes)
    ndim   = iboxes[0].shape[-2]
    # mpi4py can't handle all ways of expressing the same dtype. This attempts
    # to force the dtype into an equivalent form it can handle.
    dtype    = np.dtype(np.dtype(iarrs[0].dtype).char)
    preshape = iarrs[0].shape[:-2]
    oshapes  = [tuple(sbox_size(b)) for b in oboxes]
    oarrs    = [np.zeros(preshape+oshape,dtype) for oshape in oshapes]
    presize  = np.prod(preshape,dtype=int)
    # Find out what we must send to and receive from each other task.
    # rboxes will contain slices into oarr and sboxes into iarr.
    # Due to wrapping, a single pair of boxes can have multiple intersections,
    # so we may need to send multiple arrays to each other task.
    # We handle this by flattening and concatenating into a single buffer.
    # sbox_intersect must return a list of lists of boxes
    niarrs = allgather(len(iboxes), comm)
    nimap  = [i for i,a in enumerate(niarrs) for j in range(a)]
    noarrs = allgather(len(oboxes), comm)
    nomap  = [i for i,a in enumerate(noarrs) for j in range(a)]
    def safe_div(a,b,wrap=0):
        return sbox_div(a,b,wrap=wrap) if len(a) > 0 else [np.array([[0,0,1]]*ndim)]
    # Set up receive buffer
    nrecv = np.zeros(len(niarrs), int)
    all_iboxes = allgatherv(iboxes, comm)
    rboxes = sbox_intersect(all_iboxes, oboxes, wrap=wrap)
    for i1 in range(rboxes.shape[0]):
        count = 0
        for i2 in range(rboxes.shape[1]):
            rboxes[i1,i2] = safe_div(rboxes[i1,i2], oboxes[i2])
            for box in rboxes[i1,i2]:
                count += np.prod(sbox_size(box))
        nrecv[nimap[i1]] += count*presize
    recvbuf = np.empty(np.sum(nrecv), dtype)
    # Set up send buffer
    nsend   = np.zeros(len(noarrs), int)
    sendbuf = []
    all_oboxes = allgatherv(oboxes, comm)
    sboxes = sbox_intersect(all_oboxes, iboxes, wrap=wrap)
    for i1 in range(sboxes.shape[0]):
        count = 0
        for i2 in range(sboxes.shape[1]):
            sboxes[i1,i2] = safe_div(sboxes[i1,i2], iboxes[i2])
            for box in sboxes[i1,i2]:
                count += np.prod(sbox_size(box))
                sendbuf.append(iarrs[i2][sbox2slice(box)].reshape(-1))
        nsend[nomap[i1]] += count*presize
    sendbuf = np.concatenate(sendbuf) if len(sendbuf) > 0 else np.zeros(0,dtype)
    # Perform the actual all-to-all send
    sbufinfo = (nsend,cumsum(nsend))
    rbufinfo = (nrecv,cumsum(nrecv))
    comm.Alltoallv((sendbuf, sbufinfo), (recvbuf,rbufinfo))
    # Copy out the result
    off = 0
    for i1 in range(rboxes.shape[0]):
        for i2 in range(rboxes.shape[1]):
            for rbox in rboxes[i1,i2]:
                rshape = tuple(sbox_size(rbox))
                data = recvbuf[off:off+np.prod(rshape)*presize]
                oarrs[i2][sbox2slice(rbox)] = data.reshape(preshape + rshape)
                off += data.size
    return oarrs

def sbox_intersect(a, b, wrap=0):
    """Given two Nd sboxes a,b [...,ndim,{start,end,step}] into the same array,
    compute an sbox representing their intersection. The resulting sbox will
    have positive step size. The result is a possibly empty list of sboxes -
    it is empty if there is no overlap. If wrap is specified, then it should
    be a list of length ndim of pixel wraps, each of which can be zero to
    disable wrapping in that direction."""
    # First get the intersection along each axis
    a  = sbox_fix(a)
    b  = sbox_fix(b)
    fa = a.reshape((-1,)+a.shape[-2:])
    fb = b.reshape((-1,)+b.shape[-2:])
    ndim = a.shape[-2]
    wrap = np.zeros(ndim,int)+wrap
    # Loop over all combinations
    res = np.empty((fa.shape[0],fb.shape[0]),dtype=object)
    for ai, a1 in enumerate(fa):
        for bi, b1 in enumerate(fb):
            peraxis = [sbox_intersect_1d(a1[d],b1[d],wrap=wrap[d]) for d in range(ndim)]
            # Get the outer product of these
            nper   = tuple([len(p) for p in peraxis])
            iflat  = np.arange(np.prod(nper))
            ifull  = np.array(np.unravel_index(iflat, nper)).T
            subres = [[p[i] for i,p in zip(inds,peraxis)] for inds in ifull]
            res[ai,bi] = subres
    res = res.reshape(a.shape[:-2]+b.shape[:-2])
    if res.ndim == 0: res = res.reshape(-1)[0]
    return res
def sbox_intersect_1d(a, b, wrap=0):
    """Given two 1d sboxes into the same array, compute an sbox representing
    their intersecting area. The resulting sbox will have positive step size.
    The result is a list of intersection sboxes. This can be empty if there is
    no intersection, such as between [0,n,2] and [1,n,2]. If wrap is not 0,
    then it should be an integer at which pixels repeat, so i and i+wrap would
    be equivalent. This can lead to more intersections than one would usually
    get."""
    a = sbox_fix(a)
    b = sbox_fix(b)
    if a[2] < 0: a = sbox_flip(a)
    if b[2] < 0: b = sbox_flip(b)
    segs = [(a,b)]
    if wrap:
        a, b = np.array(a), np.array(b)
        a[:2] -= a[0]//wrap*wrap
        b[:2] -= b[0]//wrap*wrap
        segs[0] = (a,b)
        if a[1] > wrap: segs.append((a-[wrap,wrap,0],b))
        if b[1] > wrap: segs.append((a,b-[wrap,wrap,0]))
    res = []
    for a,b in segs:
        if b[0] < a[0]: a,b = b,a
        step = lcm(abs(a[2]),abs(b[2]))
        # Find the first point in the intersection
        rel_inds = np.arange(b[0]-a[0],b[0]-a[0]+step,b[2])
        match = np.where(rel_inds % a[2] == 0)[0]
        if len(match) == 0: continue
        start = rel_inds[match[0]]+a[0]
        # Find the last point in the intersection
        end = (min(a[1]-a[2],b[1]-b[2])-start)//step*step+start+step
        if end <= start: continue
        res.append([start,end,step])
    return res

def sbox_div(a, b, wrap=0):
    """Find c such that arr[a] = arr[b][c]."""
    a = sbox_fix(a)
    b = sbox_fix(b)
    step  = a[...,2]//b[...,2]
    num   = (a[...,1]-a[...,0])//a[...,2]
    start = (a[...,0]-b[...,0])//b[...,2]
    end   = start + step*num
    res   = np.stack([start,end,step],-1)
    if wrap:
        wrap  = np.asarray(wrap,int)[...,None]
        swrap = wrap.copy()
        swrap[wrap==0] = 1
        res[...,:2] -= res[...,0,None]//swrap*wrap
    return res

def sbox_mul(a, b):
    """Find c such that arr[c] = arr[a][b]."""
    a = sbox_fix(a).copy()
    b = sbox_fix(b).copy()
    # It's easiest to implement this for sboxes in normal ordering.
    # So we will flip a and b as needed, and then flip back the result
    # if necessary. First compute which result entries must be flipped.
    flip = (a[...,2] < 0)^(b[...,2] < 0)
    # Then flip
    a[a[...,2]<0] = sbox_flip(a[a[...,2]<0])
    b[b[...,2]<0] = sbox_flip(b[b[...,2]<0])
    # Now that everything is in the right order, we combine
    c0 = a[...,0] + b[...,0]*a[...,2]
    c1 = np.minimum(a[...,0] + b[...,1]*a[...,2],a[...,1])
    c2 = a[...,2]*b[...,2]
    res = sbox_fix(np.stack([c0,c1,c2],-1))
    # Flip back where necessary
    res[flip] = sbox_flip(res[flip])
    return res

def sbox_flip(sbox):
    sbox = sbox_fix0(sbox)
    return np.stack([sbox[...,1]-sbox[...,2],sbox[...,0]-sbox[...,2],-sbox[...,2]],-1)

def sbox2slice(sbox):
    sbox = sbox_fix0(sbox)
    return (Ellipsis,)+tuple([slice(s[0],s[1] if s[1]>=0 else None,s[2]) for s in sbox])

def sbox_size(sbox):
    """Return the size [...,n] of an sbox [...,{start,end,step}]. The end must
    be a whole multiple of step away from start, as with the other sbox
    functions."""
    sbox = sbox_fix0(sbox)
    sbox = sbox*np.sign(sbox[...,2,None])
    return (((sbox[...,1]-sbox[...,0])-1)//sbox[...,2]).astype(int)+1

def sbox_fix0(sbox):
    try: sbox.ndim
    except AttributeError: sbox = np.asarray(sbox)
    if sbox.shape[-1] == 2:
        tmp = np.full(sbox.shape[:-1]+(3,),1,int)
        tmp[...,:2] = sbox
        sbox = tmp
    if sbox.dtype != int:
        sbox = sbox.astype(int)
    return sbox

def sbox_fix(sbox):
    # Ensure that we have a step, setting it to 1 if missing
    sbox = sbox_fix0(sbox)
    # Make sure our end point is a whole multiple of the step from the start
    sbox[...,1] = sbox[...,0] + sbox_size(sbox)*sbox[...,2]
    return sbox
def sbox_wrap(sbox, wrap=0, cap=0):
    """Given a single sbox [...,{from,to,step?}] representing a slice of an
    N-dim array, wraps and caps the sbox, returning a list of sboxes for each
    contiguous section of the slice.

    The wrap argument, which can be scalar or a length N array-like, indicates
    the wrapping length along each dimension. Boxes that extend beyond the
    wrapping length will be split into two at the wrapping position, with the
    overshooting part wrapping around to the beginning of the array. The
    special value 0 disables wrapping for that dimension.

    The cap argument, which can also be a scalar or length N array-like,
    indicates the physical length of each array dimension. The sboxes will be
    truncated to avoid accessing any data beyond this length, after wrapping
    has been taken into account.

    The function returns a list of the form [(ibox1,obox1),(ibox2,obox2)...],
    where the iboxes are sboxes representing slices into the input array (the
    array the original sbox refers to), while the oboxes represent slices into
    the output array. These sboxes can be turned into actual slices using
    sbox2slice.

    A typical example of the use of this function would be a sky map that
    wraps horizontally after 360 degrees, where one wants to support
    extracting subsets that straddle the wrapping point."""
    # This function was surprisingly complicated. If I had known it would be
    # this long I would have built it from the sbox stuff above. But at least
    # this one should have lower overhead than that would have had.
    sbox = sbox_fix(sbox)
    ndim = sbox.shape[0]
    wrap = np.zeros(ndim,int)+wrap
    cap  = np.zeros(ndim,int)+cap
    dim_boxes = []
    for d, w in enumerate(wrap):
        ibox = sbox[d]
        ilen = sbox_size(ibox)
        c    = cap[d]
        # Things will be less redundant if we ensure that a has a positive stride
        flip = ibox[2] < 0
        if flip: ibox = sbox_flip(ibox)
        if w:
            # move starting point to first positive loop
            ibox[:2] -= ibox[0]//w*w
            boxes_1d = []
            i = 0
            while ibox[1] > 0:
                npre = max((-ibox[0])//ibox[2],0)
                # ibox slice assuming all of the logical ibox is available
                isub = sbox_fix([ibox[0]+npre*ibox[2],min(ibox[1],w),ibox[2]])
                nsub = sbox_size(isub)
                # the physical array may be smaller than the logical one
                if c:
                    isub = sbox_fix([ibox[0]+npre*ibox[2],min(ibox[1],c),ibox[2]])
                    ncap = sbox_size(isub)
                else:
                    ncap = nsub
                if not flip: osub = [i, i+ncap, 1]
                else: osub = [ilen-1-i, ilen-1-(i+ncap), -1]
                # accept this slice unless it doesn't overlap with anything
                if ncap > 0: boxes_1d.append((list(isub),osub))
                i += nsub
                ibox[:2] -= w
        else:
            # No wrapping, but may want to cap. In this case we will have both
            # upwards and downwards capping. Find the number of samples to
            # crop on each side.
            if c:
                npre  = max((-ibox[0])//ibox[2],0)
                npost = max((ibox[1]-ibox[2]-(c-1))//ibox[2],0)
            else:
                npre, npost = 0, 0
            # Don't produce a slice if it would be empty
            if npre + npost < ilen:
                isub = [ibox[0]+npre*ibox[2], ibox[1]-npost*ibox[2], ibox[2]]
                if not flip: osub = [npre, ilen-npost, 1]
                else: osub = [ilen-1-npre, npost-1, -1]
                boxes_1d = [(isub,osub)]
            else:
                boxes_1d = []
        dim_boxes.append(boxes_1d)
    # Now create the outer product of all the individual dimensions' box sets
    nper  = tuple([len(p) for p in dim_boxes])
    iflat = np.arange(np.prod(nper))
    ifull = np.array(np.unravel_index(iflat, nper)).T
    res   = [[[p[i][io] for i,p in zip(inds,dim_boxes)] for io in [0,1]] for inds in ifull]
    return res
[docs]def gcd(a, b): """Greatest common divisor of a and b""" return gcd(b, a % b) if b else a
[docs]def lcm(a, b): """Least common multiple of a and b""" return a*b//gcd(a,b)
[docs]def uncat(a, lens): """Undo a concatenation operation. If a = np.concatenate(b) and lens = [len(x) for x in b], then uncat(a,lens) returns b.""" cum = cumsum(lens, endpoint=True) return [a[cum[i]:cum[i+1]] for i in xrange(len(lens))]
[docs]def ang2rect(angs, zenith=False, axis=0): """Convert a set of angles [{phi,theta},...] to cartesian coordinates [{x,y,z},...]. If zenith is True, the theta angle will be taken to go from 0 to pi, and measure the angle from the z axis. If zenith is False, then theta goes from -pi/2 to pi/2, and measures the angle up from the xy plane.""" angs = np.asanyarray(angs) phi, theta = np.moveaxis(angs, axis, 0) ct, st, cp, sp = np.cos(theta), np.sin(theta), np.cos(phi), np.sin(phi) if zenith: res = np.array([st*cp,st*sp,ct]) else: res = np.array([ct*cp,ct*sp,st]) return np.moveaxis(res, 0, axis)
[docs]def rect2ang(rect, zenith=False, axis=0, return_r=False): """The inverse of ang2rect.""" x,y,z = np.moveaxis(rect, axis, 0) r = (x**2+y**2)**0.5 phi = np.arctan2(y,x) if zenith: theta = np.arctan2(r,z) else: theta = np.arctan2(z,r) ang = np.moveaxis(np.array([phi,theta]), 0, axis) return (ang,r) if return_r else ang
[docs]def angdist(a, b, zenith=False, axis=0): """Compute the angular distance between a[{ra,dec},...] and b[{ra,dec},...] using a Vincenty formula that's stable both for small and large angular separations. a and b must broadcast correctly.""" a = np.moveaxis(np.asarray(a), axis, 0) b = np.moveaxis(np.asarray(b), axis, 0) dra = a[0]-b[0] sin_dra = np.sin(dra) cos_dra = np.cos(dra) del dra cos, sin = (np.cos,np.sin) if not zenith else (np.sin, np.cos) a_sin_dec = sin(a[1]) a_cos_dec = cos(a[1]) b_sin_dec = sin(b[1]) b_cos_dec = cos(b[1]) y = ((b_cos_dec*sin_dra)**2 + (a_cos_dec*b_sin_dec-a_sin_dec*b_cos_dec*cos_dra)**2)**0.5 del sin_dra x = a_sin_dec*b_sin_dec + a_cos_dec*b_cos_dec*cos_dra del a_sin_dec, a_cos_dec, b_sin_dec, b_cos_dec, a, b return np.arctan2(y,x)
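# A quick example: the separation between two points given as [ra,dec] in
# radians comes out in radians, so dividing by the module's degree constant
# gives degrees.
#
#   a = np.array([0.0, 0.0])
#   b = np.array([1.0*degree, 0.0])
#   angdist(a, b)/degree    # -> 1.0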
[docs]def vec_angdist(v1, v2, axis=0): """Use Kahan's version of Heron's formula to compute a stable angular distance between two vectors v1 and v2, which don't have to be unit vectors. See https://scicomp.stackexchange.com/a/27694""" v1 = np.asanyarray(v1) v2 = np.asanyarray(v2) a = np.sum(v1**2,axis)**0.5 b = np.sum(v2**2,axis)**0.5 c = np.sum((v1-v2)**2,axis)**0.5 mu = np.where(b>=c, c-(a-b), b-(a-c)) ang= 2*np.arctan(((((a-b)+c)*mu)/((a+(b+c))*((a-c)+b)))**0.5) return ang
[docs]def rotmatrix(ang, raxis, axis=-1, dtype=None): """Construct a 3d rotation matrix representing a rotation of ang radians around the specified rotation axis raxis, which can be "x", "y", "z" or 0, 1, 2. If ang is a scalar, the result will be [3,3]. Otherwise, it will be ang.shape[:axis] + (3,3) + ang.shape[axis:]. Negative axis is interpreted as ang.ndim+1+axis, such that the (3,3) part ends at the end for axis=-1""" ang = np.asarray(ang) c, s = np.cos(ang), np.sin(ang) if axis < 0: axis = ang.ndim+1+axis if dtype is None: dtype = np.float64 R = np.zeros(ang.shape[:axis] + (3,3) + ang.shape[axis:], dtype) # Slice tuples to let us assign things directly into the position of the # output matrix we want a = (slice(None),)*axis b = (slice(None),)*(ang.ndim-axis) if raxis == 0 or raxis == "x" or raxis == "X": R[a+(0,0)+b]= 1 R[a+(1,1)+b]= c; R[a+(1,2)+b]=-s R[a+(2,1)+b]= s; R[a+(2,2)+b]= c elif raxis == 1 or raxis == "y" or raxis == "Y": R[a+(0,0)+b]= c; R[a+(0,2)+b]= s R[a+(1,1)+b]= 1 R[a+(2,0)+b]=-s; R[a+(2,2)+b]= c elif raxis == 2 or raxis == "z" or raxis == "Z": R[a+(0,0)+b]= c; R[a+(0,1)+b]=-s R[a+(1,0)+b]= s; R[a+(1,1)+b]= c R[a+(2,2)+b]=1 else: raise ValueError("Rotation axis %s not recognized" % raxis) return R
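# For instance, a 90-degree rotation about the z axis maps the x axis onto
# the y axis:
#
#   Rz = rotmatrix(90*degree, "z")
#   np.allclose(Rz.dot([1,0,0]), [0,1,0])   # -> True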
[docs]def label_unique(a, axes=(), rtol=1e-5, atol=1e-8): """Given an array of values, return an array of labels such that all entries in the array with the same label will have approximately the same value. Labels count contiguously from 0 and up. axes specifies which axes make up the subarray that should be compared for equality. For scalars, use axes=().""" a = np.asarray(a) axes = [i % a.ndim for i in axes] rest = [s for i,s in enumerate(a.shape) if i not in axes] # First reshape into a doubly-flattened 2d array [nelem,ndim] fa = partial_flatten(a, axes, 0) fa = fa.reshape(np.prod(rest),-1) # Can't use lexsort, as it has no tolerance. This # is O(N^2) instead of O(NlogN) id = 0 ids = np.zeros(len(fa),dtype=int)-1 for i,v in enumerate(fa): if ids[i] >= 0: continue match = np.all(np.isclose(v,fa,rtol=rtol,atol=atol),-1) ids[match] = id id += 1 return ids.reshape(rest)
[docs]def transpose_inds(inds, nrow, ncol): """Given a set of flattened indices into an array of shape (nrow,ncol), return the indices of the corresponding elements in a transposed array.""" row_major = inds row, col = row_major//ncol, row_major%ncol return col*nrow + row
[docs]def rescale(a, range=[0,1]): """Rescale a such that min(a),max(a) -> range[0],range[1]""" mi, ma = np.min(a), np.max(a) return (a-mi)/(ma-mi)*(range[1]-range[0])+range[0]
[docs]def split_by_group(a, start, end): """Split string a into non-group and group sections, where a group is defined as a set of characters from a start character to a corresponding end character.""" res, ind, n = [], 0, 0 new = True for c in a: if new: res.append("") new = False i = start.find(c) if n == 0: if i >= 0: # Start of new group res.append("") ind = i n += 1 else: if start[ind] == c: n += 1 elif end[ind] == c: n-= 1 if n == 0: new = True res[-1] += c return res
[docs]def split_outside(a, sep, start="([{", end=")]}"): """Split string a at occurrences of separator sep, except when it occurs inside matching groups of start and end characters.""" segments = split_by_group(a, start, end) res = [""] for seg in segments: if len(seg) == 0: continue if seg[0] in start: res[-1] += seg else: toks = seg.split(sep) res[-1] += toks[0] res += toks[1:] return res
[docs]def find_equal_groups(a, tol=0): """Given a[nsamp,...], return groups[ngroup][{ind,ind,ind,...}] of indices into a for which all the values along the remaining axes of a are the same. find_equal_groups([[0,1],[1,2],[0,1]]) -> [[0,2],[1]].""" def calc_diff(a1,a2): if a1.dtype.char in 'SU': return a1 != a2 else: return a1-a2 a = np.asarray(a) if a.ndim == 1: a = a[:,None] n = len(a) inds = np.argsort(a[:,0]) done = np.full(n, False, dtype=bool) res = [] for i in xrange(n): if done[i]: continue xi = inds[i] res.append([xi]) done[i] = True for j in xrange(i+1,n): if done[j]: continue xj = inds[j] if calc_diff(a[xj,0], a[xi,0]) > tol: # Current group is done break if np.sum(calc_diff(a[xj],a[xi])**2) <= tol**2: # Close enough res[-1].append(xj) done[j] = True return res
[docs]def find_equal_groups_fast(vals): """Group 1d array vals[n] into equal groups. Returns uvals, order, edges Using these, group #i is made up of the values with index order[edges[i]:edges[i+1]], and all these elements correspond to value uvals[i]. Accomplishes the same basic task as find_equal_groups, but 1. Only works on 1d arrays 2. Only works with exact equality, with no support for approximate equality 3. Returns 3 numpy arrays instead of a list of lists. """ order = np.argsort(vals, kind="stable") uvals, edges = np.unique(vals[order], return_index=True) edges = np.concatenate([edges,[len(vals)]]) return uvals, order, edges
[docs]def label_multi(valss): """Given the argument valss[:][n], which is a list of 1d arrays of the same length n but potentially different data types, return a single 1d array labels[n] of integers such that unique labels correspond to unique value combinations in valss. More precisely, valss[:][i] == valss[:][j] if and only if labels[i] == labels[j]. The purpose of this is to go from having a heterogeneous label like (1, "foo", 1.24) to having a single integer as the label. Example: label_multi([[0,0,1,1,2],["a","b","b","b","b"]]) → [0,1,2,2,3]""" oinds = 0 for vals in valss: # remap arbitrary values in vals to integers in inds uvals, inds = np.unique(vals, return_inverse=True) # accumulate in mixed-radix fashion, using the current number of # unique values as the base so different combinations can't collide oinds = oinds*len(uvals) + inds # At this point oinds has unique indices, but there could be gaps. # Remove those oinds = np.unique(oinds, return_inverse=True)[1] return oinds
[docs]def pathsplit(path): """Like os.path.split, but for all components, not just the last one. Why did I have to write this function? It should have been in os already!""" # This takes care of all OS-dependent path stuff. Afterwards we can safely split by / path = os.path.normpath(path) # This is to handle the common special case of a path starting with / if path.startswith("/"): return ["/"] + path.split("/")[1:] else: return path.split("/")
[docs]def minmax(a, axis=None): """Shortcut for np.array([np.min(a),np.max(a)]), since I do this a lot.""" return np.array([np.min(a, axis=axis),np.max(a, axis=axis)])
[docs]def broadcast_shape(*shapes, at=0): """Return the shape resulting from broadcasting arrays with the given shapes. "at" controls how new axes are added. at=0 adds them at the beginning, which matches how numpy broadcasting works. at=1 would add them after the first element, etc. -1 adds them at the end.""" # Output should have this length ndim = max([len(shape) for shape in shapes]) # Output shape starting point oshape = [1 for i in range(ndim)] for shape in shapes: # Start by inserting 1s as needed my_at = at if at >= 0 else len(shape)+1+at shape_padded = shape[:my_at] + (1,)*(ndim-len(shape)) + shape[my_at:] for i in range(ndim): if oshape[i] != shape_padded[i] and shape_padded[i] != 1: if oshape[i] == 1: oshape[i] = shape_padded[i] else: raise ValueError("operands could not be broadcast together with shapes " + " ".join([str(shape) for shape in shapes])) return tuple(oshape)
[docs]def broadcast_arrays(*arrays, npre=0, npost=0, at=0): """Like np.broadcast_arrays, but allows arrays to be None, in which case they are just passed through as None without affecting the rest of the broadcasting. The argument npre specifies the number of dimensions at the beginning of the arrays to exempt from broadcasting; npost does the same for dimensions at the end. Both can be either an integer or a list of integers. """ npre = np.broadcast_to(npre, len(arrays)) npost = np.broadcast_to(npost, len(arrays)) narr = len(arrays) arrays = list(arrays) warrs, wshapes = [], [] for i in range(narr): if arrays[i] is None: continue arrays[i] = np.asanyarray(arrays[i]) warrs.append(arrays[i]) wshapes.append(arrays[i].shape[npre[i]:arrays[i].ndim-npost[i]]) # Find broadcasting shape oshape = broadcast_shape(*wshapes, at=at) # Broadcast and insert into output array res = [None for a in arrays] for i, (n, m, arr) in enumerate(zip(npre, npost, arrays)): if arr is not None: ninsert = len(oshape)-(arr.ndim-n-m) my_at = n+at if at >= 0 else arr.ndim+1+at-m res[i] = np.broadcast_to(arr[(slice(None),)*my_at+(None,)*ninsert], arr.shape[:n]+oshape+arr.shape[arr.ndim-m:]) return res
[docs]def point_in_polygon(points, polys): """Given a points[...,2] and a set of polys[...,nvertex,2], return inside[...]. points[...,0] and polys[...,0,0] must broadcast correctly. Examples: utils.point_in_polygon([0.5,0.5],[[0,0],[0,1],[1,1],[1,0]]) -> True utils.point_in_polygon([[0.5,0.5],[2,1]],[[0,0],[0,1],[1,1],[1,0]]) -> [True, False] """ # Make sure we have arrays, and that they have a floating point data type points = np.asarray(points)+0.0 polys = np.asarray(polys) +0.0 verts = polys - points[...,None,:] ncross = np.zeros(verts.shape[:-2], dtype=np.int32) # For each vertex, check if it crosses y=0 by computing the x # position of that crossing, and seeing if that x is within the # poly's bounds. for i in range(verts.shape[-2]): x1, y1 = verts[...,i-1,:].T x2, y2 = verts[...,i,:].T with nowarn(): x = -y1*(x2-x1)/(y2-y1) + x1 ncross += ((y1*y2 < 0) & (x > 0)).T return ncross.T % 2 == 1
[docs]def poly_edge_dist(points, polygons): """Given points [...,2] and a set of polygons [...,nvertex,2], return dists[...], which represents the distance of the points from the edges of the corresponding polygons. This means that the interior of the polygon will not be 0. points[...,0] and polys[...,0,0] must broadcast correctly.""" points = np.asarray(points) polygons = np.asarray(polygons) nvert = polygons.shape[-2] p = ang2rect(points,axis=-1) vertices = ang2rect(polygons,axis=-1) del points, polygons dists = [] for i in range(nvert): v1 = vertices[...,i,:] v2 = vertices[...,(i+1)%nvert,:] vz = np.cross(v1,v2) vz /= np.sum(vz**2,-1)[...,None]**0.5 # Find out if the point is inside our line segment or not vx = v1 vy = np.cross(vz,vx) vy /= np.sum(vy**2,-1)[...,None]**0.5 pang = np.arctan2(np.sum( p*vy,-1),np.sum( p*vx,-1)) ang2 = np.arctan2(np.sum(v2*vy,-1),np.sum(v2*vx,-1)) between = (pang >= 0) & (pang < ang2) # If we are inside, the distance will simply be the distance # from the line segment, which is the distance from vz minus pi/2. # If we are outside, then use the distance from the edge of the line segment. dist_between = np.abs(np.arccos(np.clip(np.sum(p*vz,-1),-1,1))-np.pi/2) dist_outside = np.minimum( np.arccos(np.clip(np.sum(p*v1,-1),-1,1)), np.arccos(np.clip(np.sum(p*v2,-1),-1,1)) ) dist = np.where(between, dist_between, dist_outside) del v1, v2, vx, vy, vz, pang, ang2, between dists.append(dist) dists = np.min(dists,0) return dists
[docs]def block_mean_filter(a, width): """Perform a binwise smoothing of a, where all samples in each bin of the given width are replaced by the mean of the samples in that bin.""" a = np.array(a) if a.shape[-1] < width: a[:] = np.mean(a,-1)[...,None] else: width = int(width) nblock = (a.shape[-1]+width-1)//width apad = np.concatenate([a,a[...,-2::-1]],-1) work = apad[...,:width*nblock] work = work.reshape(work.shape[:-1]+(nblock,width)) work[:]= np.mean(work,-1)[...,None] work = work.reshape(work.shape[:-2]+(-1,)) a[:] = work[...,:a.shape[-1]] return a
[docs]def block_reduce(a, bsize, axis=-1, off=0, op=np.mean, inclusive=True): """Replace each block of length bsize along the given axis of a with an aggregate value given by the operation op. op must accept op(array, axis), just like np.sum or np.mean. a need not have a whole number of blocks. In that case, the last block will have fewer than bsize samples in it. If off is specified, it gives an offset from the start of the array for the start of the first block; anything before that will be treated as an incomplete block, just like anything left over at the end. Pass the same value of off to block_expand to undo this.""" if bsize == 1: return a a = np.asarray(a) axis %= a.ndim # Split the array into the first part, the whole blocks, and the remainder nwhole = (a.shape[axis]-off)//bsize pre, mid, tail = np.split(a, [off,off+nwhole*bsize], axis) # Average and merge these parts = [] if pre.size > 0 and inclusive: parts.append(np.expand_dims(op(pre, axis),axis)) if mid.size > 0: parts.append(op(mid.reshape(mid.shape[:axis]+(nwhole,bsize)+mid.shape[axis+1:]),axis+1)) if tail.size > 0 and inclusive: parts.append(np.expand_dims(op(tail,axis),axis)) return np.concatenate(parts, axis)
[docs]def block_expand(a, bsize, osize, axis=-1, off=0, op="nearest", inclusive=True): """The opposite of block_reduce. Where block_reduce averages (by default) this function duplicates (by default) to recover the original shape. If op="linear", then linear interpolation will be done instead of duplication. NOTE: Currently axis and off are not supported for linear interpolation, which will always be done along the last axis.""" a = np.asanyarray(a) nwhole = (osize-off)//bsize nrest = osize-off-nwhole*bsize axis %= a.ndim if op == "nearest": if inclusive: pre, mid, tail = np.split(a, [off>0,(off>0)+nwhole], axis) parts = [] if pre.size > 0: parts.append(np.repeat(pre, off, axis)) if mid.size > 0: parts.append(np.repeat(mid, bsize, axis)) if tail.size> 0: parts.append(np.repeat(tail,nrest, axis)) return np.concatenate(parts, axis) else: parts = [ np.zeros(a.shape[:axis]+(off,) +a.shape[axis+1:], a.dtype), np.repeat(a, bsize, axis), np.zeros(a.shape[:axis]+(nrest,)+a.shape[axis+1:], a.dtype), ] return np.concatenate(parts, axis) elif op == "linear": # TODO: This part doesn't support off or axis yet. # Index relative to block centers. For bsize samples in a block, # the intervals have size 1/bsize, and the first sample is offset # by half an interval. Hence sample #i is at (i+0.5)/bsize-0.5 find = (np.arange(nwhole*bsize)+0.5)/bsize - 0.5 if nrest != 0: find = np.concatenate([find, nwhole + (np.arange(nrest)+0.5)/nrest-0.5]) i1 = np.floor(find).astype(int) i2 = i1+1 x2 = find % 1 x1 = 1 - x2 i1 = np.maximum(i1, 0) i2 = np.minimum(i2, a.shape[-1]-1) return a[...,i1]*x1 + a[...,i2]*x2 else: raise ValueError("Unrecognized operation '%s'" % op)
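# A round-trip sketch for the block_reduce/block_expand pair. The last,
# incomplete block is averaged and expanded just like the whole ones:
#
#   a  = np.arange(10.)
#   ab = block_reduce(a, 4)             # means of blocks 0:4, 4:8, 8:10
#   a2 = block_expand(ab, 4, a.size)    # each mean duplicated back out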
[docs]def ctime2date(timestamp, tzone=0, fmt="%Y-%m-%d"): return datetime.datetime.utcfromtimestamp(timestamp+tzone*3600).strftime(fmt)
[docs]def tofinite(arr, val=0): """Return arr with all non-finite values replaced with val.""" arr = np.asanyarray(arr).copy() if arr.ndim == 0: if ~np.isfinite(arr): arr = val else: arr[~np.isfinite(arr)] = val return arr
[docs]def parse_ints(s): return parse_numbers(s, int)
[docs]def parse_floats(s): return parse_numbers(s, float)
[docs]def parse_numbers(s, dtype=None): res = [] for word in s.split(","): # Parse as float here; any requested dtype is applied at the end toks = [float(w) for w in word.split(":")] if ":" not in word: res.append(toks[:1]) else: start, stop = toks[:2] step = toks[2] if len(toks) > 2 else 1 res.append(np.arange(start,stop,step)) res = np.concatenate(res) if dtype is not None: res = res.astype(dtype) return res
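# Examples of the range syntax these parsers accept:
#
#   parse_ints("1,3,5:8")      # -> array([1, 3, 5, 6, 7])
#   parse_floats("0:1:0.25")   # -> array([0., 0.25, 0.5, 0.75])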
[docs]def parse_box(desc): """Given a string of the form from:to,from:to,from:to,... returns an array [{from,to},:]""" return np.array([[float(word) for word in pair.split(":")] for pair in desc.split(",")]).T
[docs]def triangle_wave(x, period=1): """Return a triangle wave with amplitude 1 and the given period.""" # This order (rather than x/period%1) gave smaller errors x = x % period / period * 4 m1 = x < 1 m2 = (x < 3) ^ m1 m3 = x >= 3 res = x.copy() res[m1] = x[m1] res[m2] = 2-x[m2] res[m3] = x[m3]-4 return res
[docs]def calc_beam_area(beam_profile): """Calculate the beam area in steradians given a beam profile[{r,b},npoint]. r is in radians, b should have a peak of 1.""" from scipy import integrate r, b = beam_profile return integrate.simps(2*np.pi*r*b,r)
[docs]def planck(f, T=T_cmb): """Return the Planck spectrum at the frequency f and temperature T in Jy/sr""" # Was 2*h*f**3, but writing it out like this is more robust to people sending # in huge integers for f, which causes overflow if this function is numba-ized return 2*h*f*f*f/c**2/(np.exp(h*f/(k*T))-1) * 1e26
blackbody = planck
[docs]def iplanck_T(f, I): """The inverse of planck with respect to temperature""" return h*f/k/np.log(1+1/(I/1e26*c**2/(2*h*f**3)))
[docs]def dplanck(f, T=T_cmb): """The derivative of the planck spectrum with respect to temperature, evaluated at frequencies f and temperature T, in units of Jy/sr/K.""" # A blackbody has intensity I = 2hf**3/c**2/(exp(hf/kT)-1) = V/(exp(x)-1) # with V = 2hf**3/c**2, x = hf/kT. # dI/dx = -V/(exp(x)-1)**2 * exp(x) # dI/dT = dI/dx * dx/dT # = 2hf**3/c**2/(exp(x)-1)**2*exp(x) * hf/k / T**2 # = 2*h**2*f**4/c**2/k/T**2 * exp(x)/(exp(x)-1)**2 # = 2*x**4 * k**3*T**2/(h**2*c**2) * exp(x)/(exp(x)-1)**2 # = .... /(4*sinh(x/2)**2) x = h*f/(k*T) dIdT = 2*x**4 * k**3*T**2/(h**2*c**2) / (4*np.sinh(x/2)**2) * 1e26 return dIdT
[docs]def graybody(f, T=10, beta=1): """Return a graybody spectrum at the frequency f and temperature T in Jy/sr""" return 2*h*f**(3+beta)/c**2/(np.exp(h*f/(k*T))-1) * 1e26
[docs]def tsz_spectrum(f, T=T_cmb): """The increase in flux due to tsz in Jy/sr per unit of y. This is just the first order approximation, but it's good enough for realistic values of y, i.e. y << 1""" x = h*f/(k*T) ex = np.exp(x) return 2*h*f**3/c**2 * (x*ex)/(ex-1)**2 * (x*(ex+1)/(ex-1)-4) * 1e26
# Helper functions for conversion from peak amplitude in cmb maps to flux
[docs]def flux_factor(beam_area, freq, T0=T_cmb): """Compute the factor A that when multiplied with a linearized temperature increment dT around T0 (in K) at the given frequency freq in Hz and integrated over the given beam_area in steradians, produces the corresponding flux = A*dT. This is useful for converting between point source amplitudes and point source fluxes. For uK to mJy use flux_factor(beam_area, freq)/1e3 """ return dplanck(freq, T0)*beam_area
[docs]def noise_flux_factor(beam_area, freq, T0=T_cmb): """Compute the factor A that converts from white noise level in K sqrt(steradian) to uncertainty in Jy for the given beam area in steradians and frequency in Hz. This assumes white noise and a gaussian beam, so that the area of the real-space squared beam is just half that of the normal beam area. For uK arcmin to mJy, use noise_flux_factor(beam_area, freq)*arcmin/1e3 """ squared_beam_area = beam_area/2 return dplanck(freq, T0)*beam_area/squared_beam_area**0.5
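# A worked example, assuming a gaussian beam: a 1 arcmin fwhm beam has solid
# angle 2*pi*sigma**2 with sigma = 1*arcmin*fwhm (using the module's fwhm
# constant), so a 100 uK peak at 150 GHz corresponds to a flux of roughly
#
#   barea    = 2*np.pi*(1*arcmin*fwhm)**2
#   flux_mJy = flux_factor(barea, 150e9)/1e3 * 100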
# Cluster physics
[docs]def gnfw(x, xc, alpha, beta, gamma): return (x/xc)**gamma*(1+(x/xc)**alpha)**((beta-gamma)/alpha)
[docs]def tsz_profile_raw(x, xc=0.497, alpha=1.0, beta=-4.65, gamma=-0.3): """Dimensionless radial (3d) cluster thermal pressure profile from arxiv:1109.3711. That article used a different definition of beta, beta' = 4.35 such that beta=gamma-alpha*beta'. I've translated it to follow the standard gnfw formula here. The numbers correspond to z=0, and M200 = 1e14 solar masses. They change slightly with mass and significantly with distance. But the further away they are, the smaller they get and the less the shape matters, so these should be good defaults. The full dimensions are this number times P0*G*M200*200*rho_cr(z)*f_b/(2*R200) where P0=18.1 at z=0 and M200=1e14. To get the dimensionful electron pressure, further scale by (2+2*Xh)/(3+5*Xh), where Xh=0.76 is the hydrogen fraction. But if one is working in units of y, then the dimensionless version is enough. x = r/R200. That is, it is the distance from the cluster center in units of the radius inside which the mean density is 200x as high as the critical density rho_c. """ return gnfw(x, xc=xc, alpha=alpha, beta=beta, gamma=gamma)
_tsz_profile_los_cache = {}
[docs]def tsz_profile_los(x, xc=0.497, alpha=1.0, beta=-4.65, gamma=-0.3, zmax=1e5, npoint=100, x1=1e-8, x2=1e4, _a=8, cache=None): """Fast, highly accurate approximate version of tsz_profile_los_exact. Interpolates the exact function in log-log space, and caches the interpolator. With the default settings, it's accurate to better than 1e-5 up to at least x = 10000, and building the interpolator takes about 25 ms. After that, each evaluation takes 50-100 ns per data point. This makes it about 10000x faster than tsz_profile_los_exact. See tsz_profile_raw for the units.""" from scipy import interpolate # Cache the fit parameters. if cache is None: global _tsz_profile_los_cache else: _tsz_profile_los_cache = {} key = (xc, alpha, beta, gamma, zmax, npoint, _a, x1, x2) if key not in _tsz_profile_los_cache: xp = np.linspace(np.log(x1),np.log(x2),npoint) yp = np.log(tsz_profile_los_exact(np.exp(xp), xc=xc, alpha=alpha, beta=beta, gamma=gamma, zmax=zmax, _a=_a)) _tsz_profile_los_cache[key] = (interpolate.interp1d(xp, yp, "cubic"), x1, x2, yp[0], yp[-1], (yp[-2]-yp[-1])/(xp[-2]-xp[-1])) spline, xmin, xmax, vleft, vright, slope = _tsz_profile_los_cache[key] # Split into 3 cases: x<xmin, x inside and x > xmax. x = np.asfarray(x) left = x<xmin right = x>xmax inside= (~left) & (~right) return np.piecewise(x, [inside, left, right], [ lambda x: np.exp(spline(np.log(x))), lambda x: np.exp(vleft), lambda x: np.exp(vright + (np.log(x)-np.log(xmax))*slope), ])
[docs]def tsz_profile_los_exact(x, xc=0.497, alpha=1.0, beta=-4.65, gamma=-0.3, zmax=1e5, _a=8): """Line-of-sight integral of the cluster_pressure_profile. See tsz_profile_raw for the meaning of the arguments. Slow due to the use of quad and the manual looping this requires. Takes about 1 ms per data point. The argument _a controls a change of variable used to improve the speed and accuracy of the integral, and should not be necessary to change from the default value of 8. See tsz_profile_raw for the units and how to scale it to something physical. Without scaling, the profile has a peak of about 0.5 and a FWHM of about 0.12 with the default parameters. Instead of using this function directly, consider using tsz_profile_los instead. It's 10000x faster and more than accurate enough. """ from scipy.integrate import quad x = np.asarray(x) xflat = x.reshape(-1) # We have int f(x) dx, but would be easier to integrate # int y**a f(y) dy. So we want y**a dy = dx => 1/(a+1)*y**(a+1) = x # => y = (x*(a+1))**(1/(a+1)) def yfun(x): return (x*(_a+1))**(1/(_a+1)) def xfun(y): return y**(_a+1)/(_a+1) res = 2*np.array([quad(lambda y: y**_a*tsz_profile_raw((xfun(y)**2+x1**2)**0.5, xc=xc, alpha=alpha, beta=beta, gamma=gamma), 0, yfun(zmax))[0] for x1 in xflat]) res = res.reshape(x.shape) return res
[docs]def tsz_tform(r200=1*arcmin, l=None, lmax=40000, xc=0.497, alpha=1.0, beta=-4.65, gamma=-0.3, zmax=1e5): """Return the radial spherical harmonic coefficients b(l) of the tSZ profile with the parameters xc, alpha, beta, gamma. r200 controls the angular size of the profile on the sky: it is the cluster's angular R200 size, in radians (default=1 arcmin). If l (which can be multidimensional) is specified, the tsz coefficients will be evaluated at these ls. Otherwise l = np.arange(lmax+1) will be used. The 2d-but-radially-symmetric fourier integral and cuspy nature of the tSZ profile are both handled via a fast hankel transform. """ from scipy import interpolate lvals, bvals = profile_to_tform_hankel(lambda r: tsz_profile_los(r/r200, xc=xc, alpha=alpha, beta=beta, gamma=gamma, zmax=zmax)) if l is None: l = np.arange(lmax+1) bout = interpolate.interp1d(np.log(lvals), bvals, "cubic")(np.log(np.maximum(l,np.min(lvals)))) return bout
### Binning ####
[docs]def edges2bins(edges): res = np.zeros((edges.size-1,2),int) res[:,0] = edges[:-1] res[:,1] = edges[1:] return res
[docs]def bins2edges(bins): return np.concatenate([bins[:,0],bins[-1,1:]])
[docs]def linbin(n, nbin=None, nmin=None, bsize=None): """Given a number of points to bin and the number of approximately equal-sized bins to generate, returns [nbin_out,{from,to}]. nbin_out may be smaller than nbin. The nmin argument specifies the minimum number of points per bin, but it is not implemented yet. nbin defaults to the square root of n if not specified.""" if bsize is not None: if nbin is None: nbin = ceil(n/bsize) edges = np.arange(nbin+1)*bsize else: if nbin is None: nbin = nint(n**0.5) edges = np.arange(nbin+1)*n//nbin return np.vstack((edges[:-1],edges[1:])).T
[docs]def expbin(n, nbin=None, nmin=8, nmax=0): """Given a number of points to bin and the number of exponentially spaced bins to generate, returns [nbin_out,{from,to}]. nbin_out may be smaller than nbin. The nmin argument specifies the minimum number of points per bin. nbin defaults to n**0.5""" if not nbin: nbin = int(np.round(n**0.5)) tmp = np.array(np.exp(np.arange(nbin+1)*np.log(n+1)/nbin)-1,dtype=int) fixed = [tmp[0]] i = 0 while i < nbin: for j in range(i+1,nbin+1): if tmp[j]-tmp[i] >= nmin: fixed.append(tmp[j]) i = j # Optionally split too large bins if nmax: tmp = [fixed[0]] for v in fixed[1:]: dv = v-tmp[-1] nsplit = (dv+nmax-1)//nmax tmp += [tmp[-1]+dv*(i+1)//nsplit for i in range(nsplit)] fixed = tmp tmp = np.array(fixed) tmp[-1] = n return np.vstack((tmp[:-1],tmp[1:])).T
[docs]def bin_data(bins, d, op=np.mean): """Bin the data d into the specified bins along the last dimension. The result has shape d.shape[:-1] + (nbin,).""" nbin = bins.shape[0] dflat = d.reshape(-1,d.shape[-1]) dbin = np.zeros([dflat.shape[0], nbin]) for bi, b in enumerate(bins): dbin[:,bi] = op(dflat[:,b[0]:b[1]],1) return dbin.reshape(d.shape[:-1]+(nbin,))
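# Putting the binning helpers together: bin a 1d spectrum into 10 roughly
# equal linear bins and take the mean in each.
#
#   ps   = np.random.standard_normal(1000)**2
#   bins = linbin(ps.size, nbin=10)    # [10,{from,to}]
#   bps  = bin_data(bins, ps)          # 10 bin means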
[docs]def bin_expand(bins, bdata): res = np.zeros(bdata.shape[:-1]+(bins[-1,1],),bdata.dtype) for bi, b in enumerate(bins): res[...,b[0]:b[1]] = bdata[...,bi] return res
[docs]def is_int_valued(a): return a%1 == 0
#### Matrix operations that don't need fortran #### # Don't do matmul - it's better expressed with einsum
[docs]def solve(A, b, axes=[-2,-1], masked=False): """Solve the linear system Ax=b along the specified axes for A, and axes[0] for b. If masked is True, then entries where A00 along the given axes is zero will be skipped.""" A,b = np.asanyarray(A), np.asanyarray(b) baxes = axes if A.ndim == b.ndim else [axes[0]%A.ndim] fA = partial_flatten(A, axes) fb = partial_flatten(b, baxes) if masked: mask = fA[...,0,0] != 0 fb[~mask] = 0 fb[mask] = np.linalg.solve(fA[mask],fb[mask]) else: fb = np.linalg.solve(fA,fb) return partial_expand(fb, b.shape, baxes)
[docs]def eigpow(A, e, axes=[-2,-1], rlim=None, alim=None): """Compute the e'th power of the matrix A (or the last two axes of A for higher-dimensional A) by exponentiating the eigenvalues. A should be real and symmetric. When e is not a positive integer, negative eigenvalues could result in a complex result. To avoid this, negative eigenvalues are set to zero in this case. Also, when e is not positive, tiny eigenvalues dominated by numerical errors can be blown up enough to drown out the well-measured ones. To avoid this, eigenvalues smaller than 1e-13 for float64 or 1e-4 for float32 of the largest one (rlim), or with an absolute value less than 2e-304 for float64 or 1e-34 for float32 (alim) are set to zero for negative e. Set alim and rlim to 0 to disable this behavior. """ # This function basically does # E,V = np.linalg.eigh(A) # E **= e # return (V*E).dot(V.T) # All the complicated stuff is there to support axes and tolerances. if axes[0]%A.ndim != A.ndim-2 or axes[1]%A.ndim != A.ndim-1: fa = partial_flatten(A, axes) fa = eigpow(fa, e, rlim=rlim, alim=alim) return partial_expand(fa, A.shape, axes) else: E, V = np.linalg.eigh(A) if rlim is None: rlim = np.finfo(E.dtype).resolution*100 if alim is None: alim = np.finfo(E.dtype).tiny*1e4 mask = np.full(E.shape, False, bool) if not is_int_valued(e): mask |= E < 0 if e < 0: aE = np.abs(E) if A.ndim > 2: mask |= (aE < np.max(aE,1)[:,None]*rlim) | (aE < alim) else: mask |= (aE < np.max(aE)*rlim) | (aE < alim) E[~mask] **= e E[mask] = 0 if A.ndim > 2: res = np.einsum("...ij,...kj->...ik",V*E[...,None,:],V) else: res = V.dot(E[:,None]*V.T) return res
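# For example, the inverse square root of a symmetric positive-definite
# matrix, as used when whitening correlated data:
#
#   C     = np.array([[2.,1.],[1.,2.]])
#   isqrt = eigpow(C, -0.5)
#   np.allclose(isqrt.dot(C).dot(isqrt), np.eye(2))   # -> True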
[docs]def build_conditional(ps, inds, axes=[0,1]): """Given some covariance matrix ps[n,n] describing a set of n Gaussian distributed variables, and a set of indices inds[m] specifying which of these variables are already known, return matrices A[n-m,m], cov[n-m,n-m] such that the conditional distribution for the unknown variables is x_unknown ~ normal(A x_known, cov). If ps has more than 2 dimensions, then the axes argument indicates which dimensions contain the matrix. Example: C = np.array([[10,2,1],[2,8,1],[1,1,5]]) vknown = np.linalg.cholesky(C[:1,:1]).dot(np.random.standard_normal(1)) A, cov = build_conditional(C, [0]) vrest = A.dot(vknown) + np.linalg.cholesky(cov).dot(np.random.standard_normal(2)) vtot = np.concatenate([vknown,vrest]) should have the same distribution as a sample drawn directly from the full C. """ ps = np.asarray(ps) # Make the matrix parts the last axes, so we have [:,ncomp,ncomp] C = partial_flatten(ps, axes) # Define masks for what is known and unknown known = np.full(C.shape[1],False,bool) known[inds] = True unknown = ~known # Hack: Handle masked arrays where some elements are all-zero. def inv(A): good = ~np.all(np.einsum("aii->ai", A)==0,-1) res = A*0 res[good] = np.linalg.inv(A[good]) return res # Build the parameters for the conditional distribution Ci = inv(C) Ciuk = Ci[:,unknown,:][:,:,known] Ciuu = Ci[:,unknown,:][:,:,unknown] Ciuui = inv(Ciuu) A = -np.matmul(Ciuui, Ciuk) # Expand back to original shape A = partial_expand(A, ps.shape, axes) cov = partial_expand(Ciuui, ps.shape, axes) return A, cov
[docs]def nint(a): """Return a rounded to the nearest integer, as an integer.""" return np.round(a).astype(int)
[docs]def ceil(a): """Return a rounded to the next integer, as an integer.""" return np.ceil(a).astype(int)
[docs]def floor(a): """Return a rounded to the previous integer, as an integer.""" return np.floor(a).astype(int)
format_regex = r"%(\([a-zA-Z]\w*\)|\(\d+\))?([ +0#-]*)(\d*|\*)(\.\d+|\.\*)?(ll|[lhqL])?(.)"
[docs]def format_to_glob(format): """Given a printf format, construct a glob pattern that will match its outputs. However, since globs are not very powerful, the resulting glob will be much more permissive than the input format, and you will probably want to filter the results further.""" # This matches a pretty general printf format def subfun(m): name, flags, width, prec, size, type = m.groups() if type == '%': return '%' else: return '*' return re.sub(format_regex, subfun, format)
[docs]def format_to_regex(format): """Given a printf format, construct a regex that will match its outputs.""" ireg = r"([^%]*)"+format_regex+r"([^%]*)" def subfun(m): pre, name, flags, width, prec, size, type, post = m.groups() opre = re.escape(pre) opost = re.escape(post) open = r"(?P<"+name[1:-1]+">" if name is not None else "(" # Expand variable widths iwidth = 0 if width is None or width == '*' or width == '' else int(width) iprec = 0 if prec is None or prec == '*' else int(prec[1:]) if type == '%': return opre + '%' + opost if type == 's': if "-" in flags: return opre + open + ".*) *" + opost else: return opre + r" *" + open + ".*)" + opost else: # Numeric type if "+" in flags: omid = r"[+-]" elif " " in flags: omid = r"[ -]" else: omid = r"-?" if "-" in flags: prepad = "" postpad = " *" else: prepad = r"0*" if "0" in flags else r" *" postpad = "" if type in ['d','i','u'] or type in ['f','F'] and prec == '0': num = r"\d+" elif type == 'o': num = r"[0-7]+" elif type == 'x': num = r"[0-9a-f]+" elif type == 'X': num = r"[0-9A-F]+" elif type == 'f': num = r"\d+\.\d*" elif type == 'e': num = r"\d+\.\d*e[+-]\d+" elif type == 'E': num = r"\d+\.\d*E[+-]\d+" elif type == 'g': num = r"(\d+(\.\d*)?)|(\d+\.\d*e[+-]\d+)" elif type == 'G': num = r"(\d+(\.\d*)?)|(\d+\.\d*E[+-]\d+)" else: raise NotImplementedError("Format character '%s'" % type) omid = prepad + open + omid + num + r")" + postpad return opre + omid + opost return re.sub(ireg, subfun, format)
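# For instance, a simple zero-padded integer format:
#
#   regex = format_to_regex("map%03d.fits")   # -> map0*(-?\d+)\.fits
#   re.match(regex, "map012.fits").group(1)   # -> '12'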
# Not sure if this belongs here...
[docs]class Printer: def __init__(self, level=1, prefix=""): self.level = level self.prefix = prefix
[docs] def write(self, desc, level, exact=False, newline=True, prepend=""): if level == self.level or not exact and level <= self.level: sys.stderr.write(prepend + self.prefix + desc + ("\n" if newline else ""))
[docs] def push(self, desc): return Printer(self.level, self.prefix + desc)
[docs] def time(self, desc, level, exact=False, newline=True): class PrintTimer: def __init__(self, printer): self.printer = printer def __enter__(self): self.time = time.time() def __exit__(self, type, value, traceback): self.printer.write(desc, level, exact=exact, newline=newline, prepend="%6.2f " % (time.time()-self.time)) return PrintTimer(self)
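# A small usage sketch: a printer with verbosity 2 that prefixes its output,
# and a timed block. Here do_work is a hypothetical stand-in for real work.
#
#   P = Printer(level=2, prefix="myprog: ")
#   P.write("starting", 1)
#   with P.time("heavy step", 1):
#       do_work()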
[docs]def ndigit(num): """Returns the number of digits in non-negative number num""" with nowarn(): return np.int32(np.floor(np.log10(np.maximum(num,1))))+1
[docs]def contains_any(a, bs): """Returns true if any of the strings in list bs are found in the string a""" for b in bs: if b in a: return True return False
[docs]def build_legendre(x, nmax): x = np.asarray(x) vmin, vmax = minmax(x) x = (x-vmin)*(2.0/(vmax-vmin))-1 res = np.zeros((nmax,)+x.shape) if nmax > 0: res[0] = 1 if nmax > 1: res[1] = x for i in range(1, nmax-1): res[i+1] = ((2*i+1)*x*res[i] - i*res[i-1])/(i+1) return res
[docs]def build_cossin(x, nmax): x = np.asarray(x) res = np.zeros((nmax,)+x.shape, x.dtype) if nmax > 0: res[0] = np.sin(x) if nmax > 1: res[1] = np.cos(x) if nmax > 2: res[2] = 2*res[0]*res[1] if nmax > 3: res[3] = res[1]**2-res[0]**2 for i in range(3,nmax): if i % 2 == 0: res[i] = res[i-2]*res[1] + res[i-1]*res[0] if i % 2 == 1: res[i] = res[i-2]*res[1] - res[i-3]*res[0] return res
[docs]def load_ascii_table(fname, desc, sep=None, dsep=None): """Load an ascii table with heterogeneous columns. fname: Path to file desc: whitespace-separated list of name:typechar pairs, or | for columns that are to be ignored. desc must cover every column present in the file""" dtype = [] j = 0 for i, tok in enumerate(desc.split(dsep)): if ":" not in tok: j += 1 dtype.append(("sep%d"%j,"U%d"%len(tok))) else: name, typ = tok.split(":") dtype.append((name,typ)) return np.loadtxt(fname, dtype=dtype, delimiter=sep)
[docs]def count_variable_basis(bases): """Counts from 0 and up through a variable-basis number, where each digit has a different basis. For example, count_variable_basis([2,3]) would yield [0,0], [0,1], [0,2], [1,0], [1,1], [1,2].""" N = bases n = len(bases) I = [0 for i in range(n)] yield I while True: for i in range(n-1,-1,-1): I[i] += 1 if I[i] < N[i]: break else: for j in range(i,n): I[j] = 0 else: break yield I
[docs]def list_combination_iter(ilist): """Given a list of lists of values, yields every combination of one value from each list.""" for I in count_variable_basis([len(v) for v in ilist]): yield [v[i] for v,i in zip(ilist,I)]
class _SliceEval: def __getitem__(self, sel): if isinstance(sel, slice): return (sel,) else: return sel sliceeval = _SliceEval()
[docs]def expand_slice(sel, n, nowrap=False): """Expands defaults and negatives in a slice to their implied values. After this, all entries of the slice are guaranteed to be present in their final form. Note, doing this twice may result in odd results, so don't send the result of this into functions that expect an unexpanded slice. Might be replaceable with slice.indices().""" step = sel.step or 1 def cycle(i,n): if nowrap: return i else: return min(i,n) if i >= 0 else n+i def default(a, val): return a if a is not None else val if step == 0: raise ValueError("slice step cannot be zero") if step > 0: return slice(cycle(default(sel.start,0),n),cycle(default(sel.stop,n),n),step) else: return slice(cycle(default(sel.start,n-1), n), cycle(sel.stop,n) if sel.stop is not None else -1, step)
[docs]def split_slice(sel, ndims): """Splits a numpy-compatible slice "sel" into sub-slices sub[:], such that a[sel] = a[sub[0]][:,sub[1]][:,:,sub[2]][...]. This is useful when implementing arrays with heterogeneous indices. Ndims indicates the number of indices to allocate to each split, starting from the left. Also expands all ellipsis.""" if not isinstance(sel,tuple): sel = (sel,) # We know the total number of dimensions involved, so we can expand ellipsis # What the heck? "in" operator is apparently broken for lists that # contain numpy arrays. parts = listsplit(sel, Ellipsis) if len(parts) > 1: # Only the rightmost ellipsis has any effect left, right = sum(parts[:-1],()), parts[-1] nfree = sum(ndims) - sum([i is not None for i in (left+right)]) sel = left + tuple([slice(None) for i in range(nfree)]) + right return split_slice_simple(sel, ndims)
[docs]def split_slice_simple(sel, ndims): """Helper function for split_slice. Splits a slice in the absence of ellipsis.""" res = [[] for n in ndims] notNone = [v is not None for v in sel] subs = np.concatenate([[0],cumsplit(notNone, ndims)]) for i, r in enumerate(res): r += sel[subs[i]:subs[i+1]] if subs[i+1] < len(sel): raise IndexError("Too many indices") return [tuple(v) for v in res]
class _get_slice_class: def __getitem__(self, a): return a get_slice = _get_slice_class()
[docs]def parse_slice(desc): if desc is None: return None else: return eval("get_slice" + desc)
[docs]def slice_downgrade(d, s, axis=-1): """Slice array d along the specified axis using the slice s, but interpret the step part of the slice as downgrading rather than skipping.""" a = np.moveaxis(d, axis, 0) step = s.step or 1 a = a[s.start:s.stop:-1 if step < 0 else 1] step = abs(step) # Handle the whole blocks first a2 = a[:len(a)//step*step] a2 = np.mean(a2.reshape((len(a2)//step,step)+a2.shape[1:]),1) # Then append the incomplete block if len(a2)*step != len(a): rest = a[len(a2)*step:] a2 = np.concatenate([a2,[np.mean(rest,0)]],0) return np.moveaxis(a2, 0, axis)
[docs]def outer_stack(arrays): """Example. outer_stack([[1,2,3],[10,20]]) -> [[[1,1],[2,2],[3,3]],[[10,20],[10,20],[10,20]]]""" res = np.empty([len(arrays)]+[len(a) for a in arrays], arrays[0].dtype) for i, array in enumerate(arrays): res[i] = array[(None,)*i + (slice(None),) + (None,)*(len(arrays)-i-1)] return res
[docs]def tform_to_profile(bl, theta, normalize=False): """Given the transform b(l) of a beam, evaluate its real space angular profile at the given radii theta.""" bl = np.asarray(bl) l = np.arange(bl.size) x = np.cos(theta) a = bl*(2*l+1)/(4*np.pi) profile = np.polynomial.legendre.legval(x,a) if normalize: profile /= np.sum(a) return profile
# Compatibility beam_transform_to_profile = tform_to_profile
[docs]class RadialFourierTransform: def __init__(self, lrange=None, rrange=None, n=512, pad=256): """Construct an object for transforming between radially symmetric profiles in real-space and fourier space using a fast Hankel transform. Aside from being fast, this is also good for representing both cuspy and very extended profiles due to the logarithmically spaced sample points the fast Hankel transform uses. A cost of this is that the user can't freely choose the sample points. Instead one passes the multipole range or radial range of interest as well as the number of points to use. The function currently assumes two dimensions with flat geometry. That means the function is only approximate for spherical geometries, and will only be accurate up to a few degrees in these cases. Arguments: * lrange = [lmin, lmax]: The multipole range to use. Defaults to [0.1, 1e7] if no rrange is given. * rrange = [rmin, rmax]: The radius range to use if lrange is not specified, in radians. Example values: [1e-7,10]. Since we don't use spherical geometry r is not limited to 2 pi. * n: The number of logarithmically equi-spaced points to use in the given range. Default: 512. The Hankel transform usually doesn't need many points for good accuracy, and can suffer if too many points are used. * pad: How many extra points to pad by on each side of the range. Padding is useful to get good accuracy in a Hankel transform. The transforms this function does will return padded output, which can be unpadded using the unpad method. Default: 256 """ if lrange is None and rrange is None: lrange = [0.1, 1e7] if lrange is None: lrange = [1/rrange[1], 1/rrange[0]] logl1, logl2 = np.log(lrange) logl0 = (logl2+logl1)/2 self.dlog = (logl2-logl1)/n i0 = (n+1)/2+pad self.l = np.exp(logl0 + (np.arange(1,n+2*pad+1)-i0)*self.dlog) self.r = 1/self.l[::-1] self.pad = pad
[docs] def real2harm(self, rprof): """Perform a forward (real -> harmonic) transform, taking us from the provided real-space radial profile rprof(r) to a harmonic-space profile lprof(l). rprof can take two forms: 1. A function rprof(r) that can be called to evaluate the profile at arbitrary points. 2. An array rprof[self.r] that provides the profile evaluated at the points given by this object's .r member. The transform is done along the last axis of the profile. Returns lprof[self.l]. This includes padding, which can be removed using self.unpad""" import scipy.fft try: rprof = rprof(self.r) except TypeError: pass lprof = 2*np.pi*scipy.fft.fht(rprof*self.r, self.dlog, 0)/self.l return lprof
[docs] def harm2real(self, lprof): """Perform a backward (harmonic -> real) transform, taking us from the provided harmonic-space radial profile lprof(l) to a real-space profile rprof(r). lprof can take two forms: 1. A function lprof(l) that can be called to evaluate the profile at arbitrary points. 2. An array lprof[self.l] that provides the profile evaluated at the points given by this object's .l member. The transform is done along the last axis of the profile. Returns rprof[self.r]. This includes padding, which can be removed using self.unpad""" import scipy.fft try: lprof = lprof(self.l) except TypeError: pass rprof = scipy.fft.ifht(lprof/(2*np.pi)*self.l, self.dlog, 0)/self.r return rprof
[docs] def unpad(self, *arrs): """Remove the padding from arrays used by this object. The values in the padded areas of the output of the transform have unreliable values, but they're not cropped automatically to allow for round-trip transforms. Example: r = unpad(r_padded) r, l, vals = unpad(r_padded, l_padded, vals_padded)""" if self.pad == 0: res = arrs else: res = tuple([arr[...,self.pad:-self.pad] for arr in arrs]) return res[0] if len(arrs) == 1 else res
[docs] def lind(self, l): return (np.log(l)-np.log(self.l[0]))/self.dlog
[docs] def rind(self, r): return (np.log(r)-np.log(self.r[0]))/self.dlog
[docs]def profile_to_tform_hankel(profile_fun, lmin=0.1, lmax=1e7, n=512, pad=256): """Transform a radial profile given by the function profile_fun(r) to spherical harmonic coefficients b(l) using a Hankel transform. This approach is good at handling cuspy distributions due to using logarithmically spaced points. n points from lmin to lmax will be used. Returns l, bl. l will not be equi-spaced, so you may want to interpolate the results. Note that unlike other similar functions in this module and the curvedsky module, this function uses the flat sky approximation, so it should only be used for profiles up to a few degrees in size.""" rht = RadialFourierTransform(lrange=[lmin,lmax], n=n, pad=pad) lprof = rht.real2harm(profile_fun) return rht.unpad(rht.l, lprof)
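# Round-trip sketch: transform a gaussian radial profile to harmonic space
# and back with RadialFourierTransform. The recovered profile is evaluated
# at the object's own sample points rht.r.
#
#   rht   = RadialFourierTransform()
#   lprof = rht.real2harm(lambda r: np.exp(-0.5*(r/(10*arcmin))**2))
#   rprof = rht.harm2real(lprof)
#   r, rp = rht.unpad(rht.r, rprof)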
[docs]def fix_dtype_mpi4py(dtype): """Work around mpi4py bug, where it refuses to accept dtypes with endian info""" return np.dtype(np.dtype(dtype).char)
[docs]def native_dtype(dtype): """Return the native version of dtype. E.g. if the input is big-endian float32, returns plain float32""" return np.dtype(np.dtype(dtype).char)
[docs]def decode_array_if_necessary(arr): """Given an arbitrary numpy array arr, decode it if it is of type S and we're in a version of python that doesn't like that""" try: # Check if we're in python 3 np.array(["a"],"S")[0] in "a" return arr except TypeError: # Yes, we need to decode if arr.dtype.type is np.bytes_: return np.char.decode(arr) else: return arr
[docs]def encode_array_if_necessary(arr): """Given an arbitrary numpy array arr, encode it if it is of type S and we're in a version of python that doesn't like that""" arr = np.asarray(arr) try: # Check if we're in python 3 np.array(["a"],"S")[0] in "a" return arr except TypeError: # Yes, we need to encode if arr.dtype.type is np.str_: return np.char.encode(arr) else: return arr
### These functions deal with the conversion between decimal and sexagesimal ###
[docs]def to_sexa(x): """Given a number in decimal degrees x, returns (sign,deg,min,sec). Given these, x can be reconstructed as sign*(deg+min/60+sec/3600). """ # Handle both scalars and vectors efficiently. We need to do it like this # because the vector stuff is 30x slower than the scalar implementation for # single numbers. This construction only has a factor 2 slowdown. try: len(x) x = np.asanyarray(x) sign = np.where(x < 0, -1, 1)*1 ifun = np.int32 except TypeError: sign = -1 if x < 0 else 1 ifun = int x = x*sign deg = ifun(x) x = (x-deg)*60 min = ifun(x) sec = (x-min)*60 return (sign, deg, min, sec)
[docs]def from_sexa(sign, deg, min, sec): """Reconstruct a decimal number from the sexagesimal representation.""" return sign*(deg+min/60+sec/3600)
[docs]def format_sexa(x, fmt="%(deg)+03d:%(min)02d:%(sec)06.2f"): sign, deg, min, sec = to_sexa(x) return fmt % {"deg": sign*deg, "min": min, "sec": sec}
[docs]def jname(ra, dec, fmt="J%(ra_H)02d%(ra_M)02d%(ra_S)02d%(dec_d)+02d%(dec_m)02d%(dec_s)02d", tag=None, sep=" "): """Build a systematic object name for the given ra/dec in degrees. The format is specified using the format string fmt. The default format string is 'J%(ra_H)02d%(ra_M)02d%(ra_S)02d%(dec_d)+02d%(dec_m)02d%(dec_s)02d'. This is not fully compliant with the IAU specification, but it's what is used in ACT. Formatting uses standard python string interpolation. The available variables are ra: right ascension in decimal degrees dec: declination in decimal degrees ra_d, ra_m, ra_s: sexagesimal degrees, arcmins and arcsecs of right ascensions dec_d, dec_m, dec_s: sexagesimal degrees, arcmins and arcsecs of declination ra_H, ra_M, ra_S: hours, minutes and seconds of right ascension dec_H, dec_M, dec_S: hours, minutes and seconds of declination (doesn't make much sense) tag is prefixed to the format, with sep as the separator. This lets one prefix the survey name without needing to rewrite the whole format string. """ rad = to_sexa(ra%360) rah = to_sexa(ra/15%24) ded = to_sexa(dec) deh = to_sexa(dec/15) prefix = tag + sep if tag is not None else "" return prefix + fmt % { "ra": ra, "dec": dec, "ra_d" :rad[0]*rad[1], "ra_m" : rad[2], "ra_s" : rad[3], "ra_H" :rah[0]*rah[1], "ra_M" : rah[2], "ra_S" : rah[3], "dec_d":ded[0]*ded[1], "dec_m": ded[2], "dec_s": ded[3], "dec_H":deh[0]*deh[1], "dec_M": deh[2], "dec_S": deh[3]}
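# With the default format, e.g.
#
#   jname(180.0, -30.0)              # -> 'J120000-300000'
#   jname(180.0, -30.0, tag="ACT")   # -> 'ACT J120000-300000'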
[docs]def ang2chord(ang): """Converts from the angle between two points on a circle to the length of the chord between them""" return 2*np.sin(ang/2)
[docs]def chord2ang(chord): """Inverse of ang2chord.""" return 2*np.arcsin(chord/2)
[docs]def crossmatch(pos1, pos2, rmax, mode="closest", coords="auto"): """Find close matches between positions given by pos1[:,ndim] and pos2[:,ndim], up to a maximum distance of rmax (in the same units as the positions). The argument "coords" controls how the coordinates are interpreted. If it is "cartesian", then they are assumed to be cartesian coordinates. If it is "radec" or "phitheta", then the coordinates are assumed to be angles in radians, which will be transformed to cartesian coordinates internally before being used. "radec" is equator-based while "phitheta" is zenith-based. The default, "auto", will assume "radec" if ndim == 2, and "cartesian" otherwise. It's possible that multiple objects from the catalogs are within rmax of each other. The "mode" argument controls how this is handled. mode == "all": Returns a list of pairs of indices into the two lists, one for each pair of objects that are close enough to each other, regardless of the presence of any other matches. Any given object can be mentioned multiple times in this list. mode == "closest": Like "all", but only the closest time an index appears in a pair is kept, the others are discarded. mode == "first": Like "all", but only the first time an index appears in a pair is kept, the others are discarded. This can be useful if some objects should be given higher priority than others. For example, one could sort pos1 and pos2 by brightness and then use mode == "first" to prefer bright objects in the match.""" from scipy import spatial pos1 = np.asarray(pos1); n1 = len(pos1) pos2 = np.asarray(pos2); n2 = len(pos2) assert pos1.ndim == 2, "crossmatch: pos1 must be [npoint,ndim], but was %s" % str(pos1.shape) assert pos2.ndim == 2, "crossmatch: pos2 must be [npoint,ndim], but was %s" % str(pos2.shape) assert pos1.shape[1] == pos2.shape[1], "crossmatch: pos1's shape %s is incompatible with pos2's shape %s" % (str(pos1.shape), str(pos2.shape)) # Normalize the coordinates if coords == "auto": coords = "radec" if pos1.shape[1] == 2 else "cartesian" if coords == "radec": trans = lambda pos: ang2rect(pos, zenith=False, axis=1) reff = ang2chord(rmax) elif coords == "phitheta": trans = lambda pos: ang2rect(pos, zenith=True, axis=1) reff = ang2chord(rmax) elif coords == "cartesian": trans = lambda pos: pos reff = rmax else: raise ValueError("crossmatch: Unrecognized value for coords: %s" % (str(coords))) pos1 = trans(pos1) pos2 = trans(pos2) # Start by generating the full list tree1 = spatial.cKDTree(pos1) tree2 = spatial.cKDTree(pos2) matches = tree1.query_ball_tree(tree2, r=reff) pairs = [(i1,i2) for i1, group in enumerate(matches) for i2 in group] if mode == "all": return pairs else: if mode == "first": # "first" mode only keeps the first group an object appears in. So the pairs # are already in the right order. pass elif mode == "closest": parr = np.array(pairs,int).reshape(-1,2) d2 = np.sum((pos1[parr[:,0]]-pos2[parr[:,1]])**2,1) order = np.argsort(d2) pairs = [pairs[i] for i in order] else: raise ValueError("crossmatch: Unrecognized mode: %s" % (str(mode))) # Filter out all but the first mention of each done1 = np.zeros(n1, bool) done2 = np.zeros(n2, bool) opairs= [] for i1, i2 in pairs: if done1[i1] or done2[i2]: continue done1[i1] = done2[i2] = True opairs.append((i1,i2)) return opairs
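# Example: match a two-object catalog against a one-object catalog with
# positions in [ra,dec] radians. Only the first object lies within rmax.
#
#   cat1 = np.array([[0.0, 0.0], [1.0*degree, 0.0]])
#   cat2 = np.array([[0.1*arcmin, 0.0]])
#   crossmatch(cat1, cat2, rmax=1*arcmin)   # -> [(0, 0)]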
[docs]def real_dtype(dtype): """Return the closest real (non-complex) dtype for the given dtype""" # A bit ugly, but actually quite fast return np.zeros(1, dtype).real.dtype
[docs]def complex_dtype(dtype): """Return the closest complex dtype for the given dtype""" return np.result_type(dtype, 0j)
[docs]def ascomplex(arr): arr = np.asanyarray(arr) return arr.astype(complex_dtype(arr.dtype))
# Conjugate gradients
[docs]def default_M(x): return np.copy(x)
[docs]def default_dot(a,b): return a.dot(np.conj(b))
[docs]class CG: """A simple preconditioned conjugate gradients solver. Solves the equation system Ax=b. This improves on the one in scipy in several ways. It allows one to specify one's own dot product operator, which is necessary for handling distributed degrees of freedom, where each mpi task only stores parts of the full solution. It is also reentrant, meaning that one can do nested CG if necessary. """ def __init__(self, A, b, x0=None, M=default_M, dot=default_dot): """Initialize a solver for the system Ax=b, with a starting guess of x0 (0 if not provided). Vectors b and x0 must provide addition and multiplication, as well as the .copy() method, such as provided by numpy arrays. The preconditioner is given by M. A and M must be functors acting on vectors and returning vectors. The dot product may be manually specified using the dot argument. This is useful for MPI-parallelization, for example.""" # Init parameters self.A = A self.b = b # not necessary to store this. Delete? self.M = M self.dot = dot if x0 is None: self.x = b*0 self.r = b else: self.x = x0.copy() self.r = b-self.A(self.x) # Internal work variables n = b.size z = self.M(self.r) self.rz = self.dot(self.r, z) self.rz0 = float(self.rz) self.p = z self.i = 0 self.err = np.inf
[docs] def step(self): """Take a single step in the iteration. Results in .x, .i and .err being updated. To solve the system, call step() in a loop until you are satisfied with the accuracy. The result can then be read off from .x.""" # Full vectors: p, Ap, x, r, z. Ap and z not in memory at the # same time. Total memory cost: 4 vectors + 1 temporary = 5 vectors Ap = self.A(self.p) alpha = self.rz/self.dot(self.p, Ap) self.x += alpha*self.p self.r -= alpha*Ap del Ap z = self.M(self.r) next_rz = self.dot(self.r, z) self.err = next_rz/self.rz0 beta = next_rz/self.rz self.rz = next_rz self.p = z + beta*self.p self.i += 1
[docs] def save(self, fname): """Save the volatile internal parameters to hdf file fname. Useful for later restoring cg iteration""" import h5py with h5py.File(fname, "w") as hfile: for key in ["i","rz","rz0","x","r","p","err"]: hfile[key] = getattr(self, key)
[docs] def load(self, fname): """Load the volatile internal parameters from the hdf file fname. Useful for restoring a saved cg state, after first initializing the object normally.""" import h5py with h5py.File(fname, "r") as hfile: for key in ["i","rz","rz0","x","r","p","err"]: setattr(self, key, hfile[key][()])
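# Typical use of CG: iterate until the relative error is small enough. Here
# the matrix is applied through a closure, but any linear operator works.
#
#   Amat   = np.array([[4.,1.],[1.,3.]])
#   b      = np.array([1.,2.])
#   solver = CG(lambda x: Amat.dot(x), b)
#   while solver.err > 1e-8:
#       solver.step()
#   x = solver.x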
[docs]class Minres: """A simple Minres solver. Solves the equation system Ax=b.""" def __init__(self, A, b, x0=None, dot=default_dot): """Initialize a solver for the system Ax=b, with a starting guess of x0 (0 if not provided). Vectors b and x0 must provide addition and multiplication, as well as the .copy() method, such as provided by numpy arrays. A must be a functor acting on vectors and returning vectors. The dot product may be manually specified using the dot argument. This is useful for MPI-parallelization, for example.""" # Init parameters self.A = A self.dot = dot if x0 is None: self.x = b*0 self.r = b*1 else: self.x = x0.copy() self.r = b-self.A(self.x) # Internal work variables z = self.A(self.r) self.rz = self.dot(self.r,z) self.rz0= self.rz self.p = self.r.copy() self.q = z self.i = 0 self.err= 1 self.abserr = self.rz/len(self.x)
    def step(self):
        """Take a single step in the iteration. Results in .x, .i and .err
        being updated. To solve the system, call step() in a loop until you
        are satisfied with the accuracy. The result can then be read off
        from .x."""
        # Vectors: x, r, z, p, q. All in use at the same time.
        # So memory cost = 5 vectors + 1 temporary = 6 vectors
        alpha = self.rz/self.dot(self.q, self.q)
        self.x += alpha*self.p
        self.r -= alpha*self.q
        z       = self.A(self.r)
        next_rz = self.dot(self.r, z)
        beta    = next_rz/self.rz
        self.rz = next_rz
        self.q *= beta; self.q += z; del z
        self.p *= beta; self.p += self.r
        self.i += 1
        # Estimate of variance of Ax-b relative to starting point
        self.err = self.rz/self.rz0
        # Estimate of variance of Ax-b
        self.abserr = self.rz/len(self.x)
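# Example usage (illustrative, not from the original source): the interface
# mirrors CG above, just without a preconditioner.
#
#   solver = Minres(lambda x: A.dot(x), b)   # A, b as in the CG example
#   while solver.err > 1e-10:
#       solver.step()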
def nditer(shape):
    """Iterate over all multi-dimensional indices of an array with the given
    shape, in row-major order, yielding each index as a tuple."""
    ndim = len(shape)
    I    = [0]*ndim
    while True:
        yield tuple(I)
        for dim in range(ndim-1,-1,-1):
            I[dim] += 1
            if I[dim] < shape[dim]: break
            I[dim] = 0
        else:
            break
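# A quick illustration (not from the original source) of the iteration order,
# which has the last index varying fastest, like np.ndindex:
#
#   >>> list(nditer((2,3)))
#   [(0, 0), (0, 1), (0, 2), (1, 0), (1, 1), (1, 2)]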
def first_importable(*args):
    """Given a list of module names, return the name of the first one that
    can be imported, or None if none of them can."""
    import importlib
    for arg in args:
        try:
            importlib.import_module(arg)
            return arg
        except ModuleNotFoundError:
            continue
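# For example (illustrative; what is importable depends on the environment):
#
#   first_importable("pyfftw", "numpy")  # -> "pyfftw" if installed, else "numpy"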
def glob(desc):
    """Like glob.glob, but with nullglob turned off: if the pattern matches
    nothing, the pattern itself is returned instead of an empty list. This is
    useful for not silently throwing away arguments with spelling mistakes."""
    import glob as g
    res = g.glob(desc)
    if len(res) == 0: return [desc]
    else:             return res
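# For example (illustrative):
#
#   glob("*.fits")  # -> matching filenames, or ["*.fits"] if nothing matches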
def cache_get(cache, key, op):
    """Return cache[key], computing it as op() and storing it first if it
    isn't there already. If cache is None, caching is skipped and op() is
    simply called."""
    # Test against None rather than truthiness, so that an initially
    # empty cache dictionary can be populated
    if cache is None: return op()
    if key not in cache:
        cache[key] = op()
    return cache[key]
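# Example usage (illustrative; the key and workload are made up): memoizing
# an expensive computation in a plain dictionary.
#
#   cache = {}
#   val = cache_get(cache, "big_sum", lambda: sum(range(10**7)))  # computed
#   val = cache_get(cache, "big_sum", lambda: sum(range(10**7)))  # from cache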
def replace(istr, ipat, repl):
    """Like str.replace, but raises KeyError if the pattern was not found,
    instead of silently returning the string unchanged."""
    ostr = istr.replace(ipat, repl)
    if ostr == istr: raise KeyError("Pattern not found")
    return ostr
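# For example (illustrative):
#
#   >>> replace("map_split1.fits", "split1", "split2")
#   'map_split2.fits'
#   >>> replace("map_split1.fits", "splitX", "split2")  # raises KeyError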
# I used to do stuff like a[~np.isfinite(a)] = 0, but this should have
# lower overhead and be faster
def remove_nan(a):
    """Sets nans and infs to 0 in an array in-place. Should have no memory
    overhead. Also returns the array for convenience."""
    return np.nan_to_num(a, copy=False, nan=0, posinf=0, neginf=0)
def without_nan(a):
    """Returns a copy of a with nans and infs set to 0. The original array
    is not modified."""
    return np.nan_to_num(a, copy=True, nan=0, posinf=0, neginf=0)
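# For example (illustrative):
#
#   a = np.array([1.0, np.nan, np.inf])
#   remove_nan(a)         # a is now [1., 0., 0.], modified in-place
#   b = without_nan(a)    # b is a clean copy; a itself is untouched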
# Why doesn't scipy have this?
def primes(n):
    """Simple prime factorization of the positive integer n. Uses the brute
    force algorithm, but it's quite fast even for huge numbers."""
    i = 2
    factors = []
    while i * i <= n:
        if n % i:
            i += 1
        else:
            n //= i
            factors.append(i)
    if n > 1:
        factors.append(n)
    return factors
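# For example (illustrative):
#
#   >>> primes(360)
#   [2, 2, 2, 3, 3, 5]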
def res2nside(res):
    """Return the healpix nside that corresponds roughly to the given
    resolution in radians, based on matching the pixel area."""
    return (np.pi/3)**0.5/res
def nside2res(nside):
    """Return the approximate resolution in radians of a healpix map with
    the given nside, based on matching the pixel area."""
    return (np.pi/3)**0.5/nside
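# For example (illustrative): a healpix map with nside=512 has pixel area
# pi/(3*512**2) sr, so its resolution is the square root of that,
# (pi/3)**0.5/512 ~ 2.00e-3 rad, or about 6.87 arcmin:
#
#   nside2res(512)/arcmin  # ~ 6.87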
def split_esc(string, delim, esc='\\'):
    """Split string by the delimiter except when escaped by the given escape
    character, which defaults to backslash. Consumes one level of escapes.
    Yields the tokens one by one as an iterator."""
    if len(delim) != 1: raise ValueError("delimiter must be one character")
    if len(esc)   != 1: raise ValueError("escape character must be one character")
    if len(string) == 0:
        yield ""
    inesc = False
    ostr  = ""
    for c in string:
        if inesc:
            # An escaped character is added literally; an escaped escape
            # character is simply consumed
            if c != esc: ostr += c
            inesc = False
        elif c == esc:
            inesc = True
        elif c == delim:
            yield ostr
            ostr = ""
        else:
            ostr += c
    if len(ostr) > 0:
        yield ostr
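# For example (illustrative):
#
#   >>> list(split_esc(r"a,b\,c", ","))
#   ['a', 'b,c']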
def getenv(name, default=None):
    """Return the value of the named environment variable, or default if
    it's not set."""
    try: return os.environ[name]
    except KeyError: return default
def setenv(name, value, keep=False):
    """Set the named environment variable to the given value. If keep==False
    (the default), existing values are overwritten. If the value is None,
    then it's deleted from the environment. If keep==True, then this function
    does nothing if the variable already has a value."""
    if   name in os.environ and keep: return
    elif name in os.environ and value is None: del os.environ[name]
    elif value is not None: os.environ[name] = str(value)
def zip2(*args):
    """Variant of python's zip that calls next() the same number of times on
    all arguments. This means that it doesn't give up immediately after
    getting the first StopIteration exception, but continues on until the end
    of the row. This can be useful for iterators that want to do cleanup
    after the last yield."""
    done = False
    while not done:
        res = []
        for arg in args:
            try:
                res.append(next(arg))
            except StopIteration:
                done = True
        if not done:
            yield tuple(res)
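# Example (illustrative, not from the original source) of the difference from
# plain zip: with equally long iterators, zip2 also exhausts the remaining
# ones, so their cleanup runs during the loop instead of waiting for garbage
# collection.
#
#   def gen(seq, name):
#       try:
#           for x in seq: yield x
#       finally:
#           print(name, "done")
#   a, b = gen([1, 2], "a"), gen([3, 4], "b")
#   list(zip(a, b))   # prints "a done"; "b done" waits until b is collected
#   a, b = gen([1, 2], "a"), gen([3, 4], "b")
#   list(zip2(a, b))  # prints both "a done" and "b done" during the loop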
def call_help(fun, *args, **kwargs):
    """Call fun(*args, **kwargs), first printing a one-line summary of each
    argument. Useful for debugging."""
    for ai, arg in enumerate(args):
        print("arg %d %s" % (ai, arg_help(arg)))
    for name, arg in kwargs.items():
        print("kwarg %s %s" % (name, arg_help(arg)))
    return fun(*args, **kwargs)
def arg_help(arg):
    """Return a compact string describing arg: shape, dtype, strides and
    contiguity for numpy arrays, otherwise just its value."""
    if isinstance(arg, np.ndarray):
        return "np.ndarray %s %s %s %s" % (str(arg.shape), str(arg.dtype),
            str(arg.strides), "contig" if arg.flags["C_CONTIGUOUS"] else "noncontig")
    else:
        return "value %s" % (str(arg))
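# Example usage (illustrative; the exact strides depend on dtype and layout):
#
#   call_help(np.dot, np.zeros((2, 3)), np.zeros(3))
#   # prints something like
#   #   arg 0 np.ndarray (2, 3) float64 (24, 8) contig
#   #   arg 1 np.ndarray (3,) float64 (8,) contig
#   # before returning np.dot's result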