# Source code for breads.utils

import itertools
import os
from copy import copy

import astropy.coordinates
import astropy.io.fits as fits
import astropy.units as u
import numpy as np
import pandas as pd
from astropy.time import Time
from astroquery.simbad import Simbad
from py.path import local
from scipy.interpolate import InterpolatedUnivariateSpline
from scipy.interpolate import interp1d
from scipy.optimize import lsq_linear
from scipy.signal import correlate2d
from scipy.stats import median_abs_deviation



[docs]
def filter_spec_with_spline(wvs, spec,specerr=None,x_nodes=None,M_spline=None):
    """ Split a 1D spectrum into high-pass and low-pass parts using a linear spline fit.

    The spline model is fitted to ``spec`` with a noise-weighted linear least-squares
    (``scipy.optimize.lsq_linear``), using only the samples where ``spec/specerr`` is
    finite. The fitted model is the low-pass spectrum, the residual is the high-pass one.

    Parameters
    ----------
    wvs : np.ndarray
        Sampling of the spectrum. Only used to build the spline model when ``M_spline`` is None.
    spec : np.ndarray
        1D spectrum to filter.
    specerr : np.ndarray, optional
        Uncertainties of ``spec`` used to weight the fit. Defaults to an array of ones.
    x_nodes : np.ndarray, optional
        Spline nodes handed to ``get_spline_model`` when ``M_spline`` is None.
    M_spline : np.ndarray, optional
        Precomputed linear spline model with one row per sample of ``spec``.

    Returns
    -------
    HPF_spec : np.ndarray
        Fit residuals (same shape as ``spec``, NaN where the input was not usable).
    LPF_spec : np.ndarray
        Best-fit spline model (same shape as ``spec``, NaN where the input was not usable).
    """
    sigma = np.ones(spec.shape) if specerr is None else specerr
    design = get_spline_model(x_nodes, wvs, spline_degree=3) if M_spline is None else M_spline

    # Work in noise-normalised units so that lsq_linear performs a weighted fit.
    weighted_spec = spec/sigma
    usable = np.flatnonzero(np.isfinite(weighted_spec))
    weighted_design = (design/sigma[:,None])[usable,:]
    weighted_spec = weighted_spec[usable]

    coefficients = lsq_linear(weighted_design,weighted_spec).x
    weighted_model = np.dot(weighted_design, coefficients)
    weighted_residuals = weighted_spec - weighted_model

    # Undo the noise normalisation and put the results back on the input sampling.
    LPF_spec = np.full(spec.shape, np.nan)
    HPF_spec = np.full(spec.shape, np.nan)
    LPF_spec[usable] = weighted_model*sigma[usable]
    HPF_spec[usable] = weighted_residuals*sigma[usable]

    return HPF_spec,LPF_spec



[docs]
def find_closest_leftnright_elements(v1, v2):
    """ Find the closest elements in v1 to the left and right of each element in v2.

    The lookup relies on ``np.searchsorted`` (default ``side='left'``), so the non-NaN
    values of ``v1`` must be sorted in ascending order. When an element of ``v2`` is equal
    to an element of ``v1``, that element is returned as the right neighbour and the
    previous one as the left neighbour.

    Parameters
    ----------
    v1 : np.ndarray
        The array to search within (may contain NaNs, which are ignored).
    v2 : np.ndarray
        The array with values to find bounds for (may contain NaNs).

    Returns
    -------
    v_left : np.ndarray
        Closest elements in v1 to the left of each element in v2.
        NaN where v2 is NaN or where no element of v1 lies to the left.
    v_right: np.ndarray
        Closest elements in v1 to the right of each element in v2.
        NaN where v2 is NaN or where no element of v1 lies to the right.
    """
    v1 = np.asarray(v1)
    v2 = np.asarray(v2)

    # Only the finite part of v1 can be searched.
    v1_valid = v1[~np.isnan(v1)]

    v_left = np.full_like(v2, np.nan, dtype=np.float64)
    v_right = np.full_like(v2, np.nan, dtype=np.float64)

    # Nothing to search in: every bound is undefined (previously raised an IndexError).
    if v1_valid.size == 0:
        return v_left, v_right

    # Insertion index of each v2 element in the sorted, valid v1 array.
    indices = np.searchsorted(v1_valid, v2)

    valid_v2_mask = ~np.isnan(v2)
    # A left neighbour exists unless the value sorts before every v1 element,
    # a right neighbour exists unless it sorts after every v1 element.
    has_left = valid_v2_mask & (indices > 0)
    has_right = valid_v2_mask & (indices < v1_valid.size)

    v_left[has_left] = v1_valid[indices[has_left] - 1]
    v_right[has_right] = v1_valid[indices[has_right]]

    return v_left, v_right



[docs]
def _trim_posterior_branch(seg_x, seg_cum, rising):
    """ Restrict one side of the ranked cumulative posterior to a usable part for inversion.

    ``rising`` is True for the branch left of the mode (cumulative expected to increase
    towards the mode) and False for the branch right of it. If the cumulative reverses
    direction, only the samples on the outer side of the first reversal, or with a
    cumulative value at least as high as at the reversal, are kept.
    """
    # Forward differences, padded with a trailing zero to keep the input length.
    steps = np.append(np.diff(seg_cum), 0)
    reversals = np.where(steps < 0)[0] if rising else np.where(steps > 0)[0]
    if reversals.size == 0:
        # Monotonic branch: nothing to trim.
        return seg_x, seg_cum
    first = reversals[0]
    if rising:
        keep = (seg_x <= seg_x[first]) | (seg_cum >= seg_cum[first])
    else:
        keep = (seg_x >= seg_x[first]) | (seg_cum >= seg_cum[first])
    return seg_x[keep], seg_cum[keep]


def get_err_from_posterior(x, posterior):
    """ Return the mode, and the left and right errors of a distribution. The errors are defined with a 68% confidence level.

    The posterior samples are ranked by increasing value and cumulated, so that each
    sample holds the normalised sum of all posterior values not larger than its own.
    The bounds are the positions, on each side of the mode, where this quantity equals
    1-0.6827 (linear interpolation).

    Parameters
    ----------
    x : np.ndarray
        Sampling of the 1D posterior
    posterior : np.ndarray
        Posterior array, same length as ``x``

    Returns
    -------
        Mode, left error, right error. When the mode sits on the first (last) sample,
        or the requested level is out of the interpolation range, the left (right)
        bound falls back to ``x[0]`` (``x[-1]``).

    """
    level = 1-0.6827

    ranking = np.argsort(posterior)
    cum_posterior = np.zeros(np.shape(posterior))
    cum_posterior[ranking] = np.cumsum(posterior[ranking])
    cum_posterior = cum_posterior/np.max(cum_posterior)
    # The largest cumulative value belongs to the largest posterior value, i.e. the mode.
    argmax_post = np.argmax(cum_posterior)

    # Left bound
    stop = min(argmax_post+1, len(x))
    left_x = x[0:stop]
    if len(left_x) < 2:
        lx = x[0]
    else:
        seg_x, seg_cum = _trim_posterior_branch(left_x, cum_posterior[0:stop], rising=True)
        lf = interp1d(seg_cum,seg_x,bounds_error=False,fill_value=x[0])
        lx = lf(level)

    # Right bound
    right_x = x[argmax_post::]
    if len(right_x) < 2:
        rx = x[-1]
    else:
        seg_x, seg_cum = _trim_posterior_branch(right_x, cum_posterior[argmax_post::], rising=False)
        rf = interp1d(seg_cum,seg_x,bounds_error=False,fill_value=x[-1])
        rx = rf(level)

    return x[argmax_post],x[argmax_post]-lx,rx-x[argmax_post]


def _task_findbadpix(paras):
    """

    Parameters
    ----------
    paras

    Returns
    -------

    """

    data_arr,noise_arr,badpix_arr,med_spec,M_spline,threshold = paras
    new_data_arr = np.array(copy(data_arr), '<f4')#.byteswap().newbyteorder()
    new_badpix_arr = copy(badpix_arr)
    res = np.zeros(data_arr.shape) + np.nan
    for k in range(data_arr.shape[1]):
        where_data_finite = np.where(np.isfinite(med_spec)*np.isfinite(badpix_arr[:,k])*np.isfinite(data_arr[:,k])*np.isfinite(noise_arr[:,k])*(noise_arr[:,k]!=0))
        if np.size(where_data_finite[0]) == 0:
            res[:,k] = np.nan
            continue
        d = data_arr[where_data_finite[0],k]
        d_err = noise_arr[where_data_finite[0],k]

        M = M_spline[where_data_finite[0],:]*med_spec[where_data_finite[0],None]

        validpara = np.where(np.nansum(M>np.nanmax(M)*1e-6,axis=0)!=0)
        M = M[:,validpara[0]]

        # bounds_min = [0, ]* M.shape[1]
        bounds_min = [-np.inf, ]* M.shape[1]
        bounds_max = [np.inf, ] * M.shape[1]
        p = lsq_linear(M/d_err[:,None],d/d_err,bounds=(bounds_min, bounds_max)).x
        # p,chi2,rank,s = np.linalg.lstsq(M/d_err[:,None],d/d_err,rcond=None)
        m = np.dot(M,p)
        res[where_data_finite[0],k] = d-m

        # where_bad = np.where((np.abs(res[:,k])>3*np.nanstd(res[:,k])) | np.isnan(res[:,k]))
        meddev=median_abs_deviation(res[where_data_finite[0],k])
        where_bad = np.where((np.abs(res[:,k])>threshold*meddev) | np.isnan(res[:,k]))
        new_badpix_arr[where_bad[0],k] = np.nan
        where_bad = np.where(np.isnan(np.correlate(new_badpix_arr[:,k] ,np.ones(2),mode="same")))
        new_badpix_arr[where_bad[0],k] = np.nan
        new_data_arr[where_bad[0],k] = np.nan

        # print(np.nanmedian(d))
        # if np.nanmedian(d)>0.5e-10:
        #     plt.figure(1)
        #     plt.plot(d,label="d")
        #     # m0 = med_spec[where_data_finite[0],None]
        #     # plt.plot(m0/np.nansum(m0)*np.nansum(d),label="m0")
        #     # plt.plot(m,label="m")
        #     # plt.plot(d_err,label="err")
        #     plt.plot(d-m,label="res")
        #     plt.plot(d/d*threshold*meddev,label="threshold")
        #     plt.plot(new_data_arr[where_data_finite[0],k],label="new d",linestyle="--")
        #     plt.legend()
        #     plt.figure(2)
        #     plt.plot(new_badpix_arr[where_data_finite[0],k],label="bad pix",linestyle="-")
        #     plt.show()

        new_data_arr[:,k] = np.array(pd.DataFrame(new_data_arr[:,k]).interpolate(method="linear").fillna(method="bfill").fillna(method="ffill"))[:, 0]

    return new_data_arr,new_badpix_arr,res

def _remove_edges(paras):
    """

    Parameters
    ----------
    paras

    Returns
    -------

    """

    slices,nan_mask_boxsize = paras
    cp_slices = copy(slices)
    if nan_mask_boxsize != 0:
        for slice in cp_slices:
            slice[np.where(slice==0)] = np.nan
            slice[np.where(np.isnan(correlate2d(slice,np.ones((nan_mask_boxsize,nan_mask_boxsize)),mode="same")))] = np.nan
        cp_slices[:,0:nan_mask_boxsize//2,:] = np.nan
        cp_slices[:,-nan_mask_boxsize//2+1::,:] = np.nan
        cp_slices[:,:,0:nan_mask_boxsize//2] = np.nan
        cp_slices[:,:,-nan_mask_boxsize//2+1::] = np.nan
    return cp_slices


[docs]
def corrected_wavelengths(data, off0, off1, center_data):
    """ Apply a linear correction (offset and stretch) to the wavelengths of a data object.

    Parameters
    ----------
    data
        Object exposing ``read_wavelengths``, which is cast to float and interpreted in microns.
    off0
        Constant wavelength offset, interpreted in angstroms.
    off1
        Dimensionless linear term of the correction.
    center_data : bool
        If True, the linear term is applied to the wavelengths relative to their mean
        (``wavs + (wavs - mean(wavs)) * off1``), otherwise to the wavelengths themselves
        (``wavs * (1 + off1)``).

    Returns
    -------
    wavs
        Corrected wavelengths as an astropy quantity.

    """

    wavs = data.read_wavelengths.astype(float) * u.micron
    offset = off0 * u.angstrom
    if not center_data:
        return wavs * (1 + off1) + offset
    return wavs + (wavs - np.mean(wavs)) * off1 + offset



[docs]
def mask_bleeding(data, threshold=1.05, per=(5, 95), mask_region = (5, 6, 2), edge=5):
    """ Mask the spaxels near the star row whose continuum is raised at the ends of the spectrum.

    The star is located at the maximum of the median image of ``data.data``. For every
    spaxel within ``width_mask_y`` rows of the star and outside the column range
    ``[star_x - region_mask_x_left, star_x + region_mask_x_right]``, the whole spectrum
    is flagged in ``data.bad_pixels`` (set to NaN) if either

    - fewer than a fifth of its samples are valid, or
    - the larger of the mean continuum over its first/last ``edge`` valid samples
      exceeds ``threshold`` times the median continuum.

    Parameters
    ----------
    data
        Object with 3D arrays ``data``, ``continuum`` and ``bad_pixels`` indexed as
        ``[wavelength, y, x]``. ``bad_pixels`` is modified in place.
    threshold : float
        Maximum allowed ratio between the continuum at the ends of the spectrum and its median.
    per
        Unused, kept for backward compatibility.
    mask_region : tuple
        ``(width_mask_y, region_mask_x_left, region_mask_x_right)`` in pixels.
    edge : int
        Number of valid samples averaged at each end of the spectrum.

    Returns
    -------
    None

    """

    nz, ny, nx = data.data.shape
    width_mask_y, region_mask_x_left, region_mask_x_right = mask_region
    img_median = np.nanmedian(data.data, axis=0)
    star_y, star_x = np.unravel_index(np.nanargmax(img_median), img_median.shape)

    rows = [i for i in range(ny) if star_y - width_mask_y <= i <= star_y + width_mask_y]
    cols = [j for j in range(nx) if j < star_x - region_mask_x_left or j > star_x + region_mask_x_right]

    for i in rows:
        for j in cols:
            masked_continuum = data.continuum[:, i, j] * data.bad_pixels[:, i, j]
            valid_continuum = masked_continuum[~np.isnan(masked_continuum)]
            # Brightest of the two ends of the continuum (NaN if the spaxel is fully masked,
            # in which case the comparison below is False).
            high_end = np.nanmax([np.nanmean(valid_continuum[:edge]), np.nanmean(valid_continuum[-edge:])])

            n_valid = np.count_nonzero(~np.isnan(data.data[:, i, j] * data.bad_pixels[:, i, j]))
            too_few_samples = n_valid < nz / 5
            raised_ends = high_end / np.nanmedian(masked_continuum) > threshold

            if too_few_samples or raised_ends:
                data.bad_pixels[:, i, j] = np.nan


[docs]
def _chunk_bounds(n_items, chunk_size):
    """ Split range(n_items) into (start, stop) pairs of ``chunk_size`` items; the last chunk takes the remainder."""
    chunk_size = max(1, chunk_size)
    n_chunks = max(1, n_items//chunk_size)
    bounds = [(k*chunk_size, (k+1)*chunk_size) for k in range(n_chunks-1)]
    bounds.append(((n_chunks-1)*chunk_size, n_items))
    return bounds


def findbadpix(cube, noisecube=None, badpixcube=None,chunks=20,mypool=None,med_spec=None,nan_mask_boxsize=3,threshold=3):
    """ Identify bad pixels in a spectral cube by fitting each spaxel with a spline-modulated reference spectrum.

    The bad pixel map is first extended spatially (see _remove_edges()), then each spaxel
    is fitted and its outliers flagged and interpolated (see _task_findbadpix()).

    Parameters
    ----------
    cube : np.ndarray
        Data cube indexed as ``[wavelength, y, x]``.
    noisecube : np.ndarray, optional
        Noise cube with the same shape as ``cube``. Defaults to ones.
    badpixcube : np.ndarray, optional
        Bad pixel cube (NaN for bad pixels) with the same shape as ``cube``. Defaults to ones.
    chunks : int
        Number of intervals between the spline nodes along the wavelength axis
        (``chunks+1`` nodes are used).
    mypool : multiprocessing.Pool, optional
        Pool used to parallelize the computation. If None, everything runs sequentially.
    med_spec : np.ndarray, optional
        Reference spectrum. Defaults to the spatial median of ``cube`` at each wavelength.
    nan_mask_boxsize : int
        Box size passed to _remove_edges().
    threshold : float
        Outlier threshold in units of the median absolute deviation of the residuals.

    Returns
    -------
    new_badpixcube : np.ndarray
        Updated bad pixel cube.
    new_cube : np.ndarray
        Data cube with the flagged samples interpolated.
    res : np.ndarray
        Residuals of the fit (NaN where no fit was performed).

    """

    if noisecube is None:
        noisecube = np.ones(cube.shape)
    if badpixcube is None:
        badpixcube = np.ones(cube.shape)

    new_cube = copy(cube)
    new_badpixcube = copy(badpixcube)
    new_badpixcube[np.where(np.isnan(cube)*np.isnan(noisecube))] = np.nan
    nz,ny,nx = cube.shape
    res = np.zeros(cube.shape) + np.nan

    x = np.arange(nz)
    x_knots = x[np.linspace(0,nz-1,chunks+1,endpoint=True).astype(int)]
    M_spline = get_spline_model(x_knots,x,spline_degree=3)

    if med_spec is None:
        # NOTE(review): a copy of the cube with its non-positive values masked used to be
        # built here but was never used; the median of the raw cube is kept to preserve
        # the existing behaviour. Confirm which one was intended.
        med_spec = np.nanmedian(cube,axis=(1,2))
    new_badpixcube[np.where(cube==0)] = np.nan

    # Step 1: spatial extension of the bad pixel map, one wavelength slice at a time.
    if mypool is None:
        new_badpixcube = _remove_edges((new_badpixcube,nan_mask_boxsize))
    else:
        numthreads = mypool._processes
        # _chunk_bounds guards against a zero chunk size when nz < 3*numthreads.
        wvs_bounds = _chunk_bounds(nz, nz//(3*numthreads))
        slices_list = [new_badpixcube[start:stop] for start,stop in wvs_bounds]

        outputs_list = mypool.map(_remove_edges, zip(slices_list,itertools.repeat(nan_mask_boxsize)))
        for (start,stop), out in zip(wvs_bounds,outputs_list):
            new_badpixcube[start:stop,:,:] = out

    # Step 2: outlier detection, one spaxel at a time.
    if mypool is None:
        data_list = np.reshape(new_cube,(nz,nx*ny))
        noise_list = np.reshape(noisecube,(nz,nx*ny))
        badpix_list = np.reshape(new_badpixcube,(nz,nx*ny))
        out_data,out_badpix,out_res = _task_findbadpix((data_list,noise_list,badpix_list,med_spec,M_spline,threshold))
        new_cube = np.reshape(out_data,(nz,ny,nx))
        new_badpixcube = np.reshape(out_badpix,(nz,ny,nx))
        res = np.reshape(out_res,(nz,ny,nx))
    else:
        numthreads = mypool._processes
        # Only the spaxels with at least one finite value in the input bad pixel cube are processed.
        row_valid_pix,col_valid_pix = np.where(np.nansum(np.isfinite(badpixcube),axis=0)!=0)
        N_valid_pix = np.size(row_valid_pix)
        pix_bounds = _chunk_bounds(N_valid_pix, N_valid_pix//(3*numthreads))

        row_indices_list = []
        col_indices_list = []
        data_list = []
        noise_list = []
        badpix_list = []
        for start,stop in pix_bounds:
            _row_valid_pix = row_valid_pix[start:stop]
            _col_valid_pix = col_valid_pix[start:stop]

            row_indices_list.append(_row_valid_pix)
            col_indices_list.append(_col_valid_pix)

            data_list.append(cube[:,_row_valid_pix,_col_valid_pix])
            noise_list.append(noisecube[:,_row_valid_pix,_col_valid_pix])
            badpix_list.append(new_badpixcube[:,_row_valid_pix,_col_valid_pix])

        outputs_list = mypool.map(_task_findbadpix, zip(data_list,noise_list,badpix_list,
                                                               itertools.repeat(med_spec),
                                                               itertools.repeat(M_spline),
                                                                itertools.repeat(threshold)))
        for row_indices,col_indices,out in zip(row_indices_list,col_indices_list,outputs_list):
            out_data,out_badpix,out_res = out
            new_cube[:,row_indices,col_indices] = out_data
            new_badpixcube[:,row_indices,col_indices] = out_badpix
            res[:,row_indices,col_indices] = out_res

    return new_badpixcube, new_cube, res





[docs]
def broaden(wvs,spectrum,R,mppool=None,kernel=None):
    """
    Broaden a spectrum to instrument resolution assuming a gaussian line spread function.

    Args:
        wvs: Wavelength vector (ndarray).
        spectrum: Spectrum vector (ndarray).
        R: Resolution of the instrument as lambda/(delta lambda) with delta lambda the FWHM of the line spread function.
            If scalar, the resolution is assumed to be independent of wavelength.
            Or the resolution can be specified at each wavelength if R is a vector of the same size as wvs.
        mppool: Multiprocessing pool to parallelize the code. If None (default), no parallelization is applied.
            E.g. mppool = mp.Pool(processes=10) # 10 is the number processes
        kernel: Optional custom line spread function, called as kernel((wvs - wvs_curr) / wvs_curr).
            If None (default), a gaussian defined by R is used.

    Returns
        Broadened spectrum
    """
    if mppool is None:
        # Each wavelength processed sequentially
        return _task_broaden((np.arange(np.size(spectrum)).astype(int),wvs,spectrum,R,kernel))

    conv_spectrum = np.zeros(spectrum.shape)

    # Divide the spectrum into chunks of 100 samples to be parallelized; the last chunk
    # takes the remainder. At least one chunk is always created so that spectra shorter
    # than chunk_size do not produce negative indices.
    chunk_size=100
    N_samples = np.size(spectrum)
    N_chunks = max(1, N_samples//chunk_size)
    indices_list = [np.arange(k*chunk_size,(k+1)*chunk_size).astype(int) for k in range(N_chunks-1)]
    indices_list.append(np.arange((N_chunks-1)*chunk_size,N_samples).astype(int))
    # Start parallelization
    outputs_list = mppool.map(_task_broaden, zip(indices_list,
                                                           itertools.repeat(wvs),
                                                           itertools.repeat(spectrum),
                                                           itertools.repeat(R),
                                                           itertools.repeat(kernel)))
    # Retrieve results
    for indices,out in zip(indices_list,outputs_list):
        conv_spectrum[indices] = out

    return conv_spectrum



[docs]
def clean_nans(arr, set_to="median", allowed_range=None, continuum=None):
    """ Replace, in place, the NaNs (and optionally the out-of-range values) of an array.

    Parameters
    ----------
    arr : np.ndarray
        Float array to clean. It is modified in place.
    set_to : str or float
        Replacement value. ``"median"`` uses the median of the non-NaN values of ``arr``,
        ``"continuum"`` uses the value of ``continuum`` at the same position, and a
        number is used as is. Outside of the ``"continuum"`` mode, the replacement is
        done with ``np.nan_to_num``, which also replaces infinities by large finite numbers.
    allowed_range : tuple, optional
        ``(min, max)``; values outside of this range are replaced like NaNs.
    continuum : np.ndarray, optional
        Array with as many elements as ``arr``; required when ``set_to="continuum"``.

    Returns
    -------
    None

    Raises
    ------
    ValueError
        If ``set_to="continuum"`` and no continuum is given.

    """
    if isinstance(set_to, str) and set_to == "continuum":
        if continuum is None:
            raise ValueError('set_to="continuum" requires the continuum argument')
        replacement = np.reshape(continuum, arr.shape)
        to_replace = np.isnan(arr)
        if allowed_range is not None:
            min_v, max_v = allowed_range
            # Comparisons with NaN are False, so NaNs are only picked up by the mask above.
            to_replace |= (arr > max_v) | (arr < min_v)
        arr[to_replace] = replacement[to_replace]
        return

    if isinstance(set_to, str) and set_to == "median":
        set_to = np.nanmedian(arr)
    np.nan_to_num(arr, copy = False, nan=set_to)
    if allowed_range is not None:
        min_v, max_v = allowed_range
        arr[arr > max_v] = set_to
        arr[arr < min_v] = set_to




def _task_broaden(paras):
    """ Perform the spectrum broadening for broaden().
    """
    indices, wvs, spectrum, R,kernel = paras

    if type(R) is np.ndarray:
        Rvec = R
    else:
        Rvec = np.zeros(wvs.shape) + R # Resolution is assumed constant

    conv_spectrum = np.zeros(np.size(indices))
    dwvs = wvs[1::] - wvs[0:(np.size(wvs) - 1)]
    dwvs = np.append(dwvs,dwvs[-1])    # Size of each wavelength bin
    for l, k in enumerate(indices):
        FWHM = wvs[k] / Rvec[k] # Full width at half maximum of the LSF at current wavelength
        sig = FWHM / (2 * np.sqrt(2 * np.log(2))) # standard deviation of the LSF (1D gaussian)
        w = int(np.round(sig / dwvs[k] * 10.)) # Number of bins on each side defining the spec window

        # Extract a smaller a small window around the current wavelength
        stamp_spec = spectrum[np.max([0, k - w]):np.min([np.size(spectrum), k + w])]
        stamp_wvs = wvs[np.max([0, k - w]):np.min([np.size(wvs), k + w])]
        stamp_dwvs = dwvs[np.max([0, k - w]):np.min([np.size(wvs), k + w])]

        if kernel is None:
            gausskernel = 1 / (np.sqrt(2 * np.pi) * sig) * np.exp(-0.5 * (stamp_wvs - wvs[k]) ** 2 / sig ** 2)
        else:
            gausskernel = kernel((stamp_wvs - wvs[k])/wvs[k])
        gausskernel[np.where(np.isnan(stamp_spec))] = np.nan
        conv_spectrum[l] = np.nansum(gausskernel*stamp_spec*stamp_dwvs) / np.nansum(gausskernel*stamp_dwvs)

    return conv_spectrum


[docs]
def file_directory(file):
    """ Return the directory containing a file.

    Parameters
    ----------
    file
        Path of the file; it is wrapped in ``py.path.local`` before being processed.

    Returns
    -------
    str
        Directory part of the path, as given by ``os.path.dirname``.

    """

    file_path = local(file)
    return os.path.dirname(file_path)



[docs]
def LPFvsHPF(myvec, cutoff):
    """ Split a vector into low-pass and high-pass components with a Fourier filter.

    The NaNs of the input are first replaced by a running median of the vector. The
    vector is then concatenated with its mirror image before the Fourier transform,
    and every Fourier mode with an index of ``cutoff`` or more (and the corresponding
    negative frequencies) is set to zero to build the low-pass component.

    Parameters
    ----------
    myvec : np.ndarray
        1D vector to filter (may contain NaNs). It is not modified.
    cutoff : int
        Index of the first Fourier mode removed from the low-pass component. It is used
        as a slice index and therefore has to be an integer.

    Returns
    -------
    LPF_myvec : np.ndarray
        Low-pass filtered vector, NaN where the input was NaN.
    HPF_myvec : np.ndarray
        High-pass filtered vector (input minus low-pass), NaN where the input was NaN.

    """
    myvec_cp = copy(myvec)
    # Handling NaNs: they are replaced by a running median of the mirrored vector.
    wherenans = np.where(np.isnan(myvec_cp))
    window = int(round(np.size(myvec_cp)/(cutoff/2.)/2.))
    # .bfill()/.ffill() replace the deprecated fillna(method=...) form.
    mirrored = pd.DataFrame(np.concatenate([myvec_cp, myvec_cp[::-1]], axis=0))
    filled = mirrored.interpolate(method="linear").bfill().ffill()
    smoothed = filled.rolling(window=window, center=True).median().interpolate(method="linear").bfill().ffill()
    myvec_cp_lpf = np.array(smoothed)[0:np.size(myvec), 0]
    myvec_cp[wherenans] = myvec_cp_lpf[wherenans]

    # Fourier filtering of the mirrored vector.
    fftmyvec = np.fft.fft(np.concatenate([myvec_cp, myvec_cp[::-1]], axis=0))
    LPF_fftmyvec = copy(fftmyvec)
    LPF_fftmyvec[cutoff:(2*np.size(myvec_cp)-cutoff+1)] = 0
    LPF_myvec = np.real(np.fft.ifft(LPF_fftmyvec))[0:np.size(myvec_cp)]
    HPF_myvec = myvec_cp - LPF_myvec

    # The samples that were NaN in the input stay NaN in the outputs.
    LPF_myvec[wherenans] = np.nan
    HPF_myvec[wherenans] = np.nan

    return LPF_myvec,HPF_myvec



[docs]
def gaussian2D(nx, ny, mu_x, mu_y, sig_x, sig_y, A):
    """ Two Dimensional Gaussian for getting PSF for different wavelength slices

    Parameters
    ----------
    nx : int
        Size of the first axis of the output.
    ny : int
        Size of the second axis of the output.
    mu_x, mu_y
        Position of the peak along the first and second axis (in pixels).
    sig_x, sig_y
        Standard deviation along the first and second axis (in pixels).
    A
        Amplitude of the peak.

    Returns
    -------
    gauss : np.ndarray
        Array of shape (nx, ny).

    """

    # Pixel indices along each axis, both of shape (nx, ny).
    x_vals, y_vals = np.indices((nx, ny))
    exponent_x = -((x_vals - mu_x) ** 2) / (2 * sig_x * sig_x)
    exponent_y = -((y_vals - mu_y) ** 2) / (2 * sig_y * sig_y)
    return A * np.exp(exponent_x) * np.exp(exponent_y)



[docs]
def get_spline_model(x_knots, x_samples, spline_degree=3):
    """ Compute a spline based linear model.
    If Y = [y1, y2, ...] are the values of the function at the location of the node [x1,x2,...].
    np.dot(M,Y) is the interpolated spline corresponding to the sampling of the x-axis (x_samples)

    Only the samples strictly inside the range of a set of nodes are modelled by it: the
    rows of samples located on the first/last node, or outside of the nodes, are zero.

    Args:
        x_knots: List of nodes for the spline interpolation as np.ndarray in the same units as x_samples.
            x_knots can also be a list of ndarrays/list to model discontinous functions;
            the sets of nodes do not need to have the same length.
        x_samples: Vector of x values (np.ndarray). ie, the sampling of the data.
        spline_degree: Degree of the spline interpolation (default: 3).
            For each set of nodes, if np.size(nodes) <= spline_degree, then np.size(nodes)-1 is used.

    Returns:
        M: Matrix of size (D,N) with D the size of x_samples and N the total number of nodes.
            If there is a single node in total, M is a column of ones.
    """
    if isinstance(x_knots[0], (list, np.ndarray)):
        x_knots_list = x_knots
    else:
        x_knots_list = [x_knots]

    # Counting the nodes set by set also works when the sets have different lengths.
    n_nodes_total = sum(np.size(nodes) for nodes in x_knots_list)
    if n_nodes_total <= 1:
        return np.ones((np.size(x_samples),1))

    M_list = []
    for nodes in x_knots_list:
        n_nodes = np.size(nodes)
        # A spline of degree k needs at least k+1 nodes.
        degree = min(spline_degree, n_nodes-1)

        M = np.zeros((np.size(x_samples), n_nodes))
        first_node,last_node = np.min(nodes),np.max(nodes)
        inbounds = np.where((first_node<x_samples)&(x_samples<last_node))
        _x = x_samples[inbounds]

        # Each column is the spline interpolating a unit value at one node and zero at the others.
        for node_id in range(n_nodes):
            unit_vec = np.zeros(n_nodes)
            unit_vec[node_id] = 1
            spl = InterpolatedUnivariateSpline(nodes, unit_vec, k=degree, ext=0)
            M[inbounds[0], node_id] = spl(_x)
        M_list.append(M)
    return np.concatenate(M_list, axis=1)



[docs]
def broaden_kernel(wvs,spectrum,kernel):
    """ Broaden a spectrum to instrument resolution assuming a custom kernel.

    The output at each wavelength is the sum over all samples of
    kernel((wvs - wvs_curr) / wvs_curr) * spectrum * bin width. The result is not
    normalised by the integral of the kernel, and NaNs of the spectrum are ignored.

    Args:
        wvs: Wavelength vector (ndarray).
        spectrum: Spectrum vector (ndarray). It is not modified.
        kernel: custom broadening kernel as a function kernel((wvs - wvs_curr) / wvs_curr)

    Returns
        Broadened spectrum
    """
    flux = copy(spectrum)

    # Size of each wavelength bin (the last bin reuses the width of the previous one).
    bin_widths = np.diff(wvs)
    bin_widths = np.append(bin_widths, bin_widths[-1])

    # Invalid samples get a null flux and a null width so that they do not contribute.
    nan_positions = np.where(np.isnan(flux))
    flux[nan_positions] = 0
    bin_widths[nan_positions] = 0

    # Row i holds the relative offsets of every wavelength with respect to wvs[i].
    relative_offsets = (wvs[None, :] - wvs[:, None]) / wvs[:, None]
    kernel_mat = kernel(relative_offsets)
    return np.dot(kernel_mat, flux * bin_widths)



[docs]
def open_psg_allmol(filename,l0,l1):
    """ Open psg model for all molecules

    Reads the 'Wave/freq' column and the H2O, CO2, CH4, CO, O3, N2O and O2 columns of a
    FITS table, and returns them restricted to the wavelengths strictly between l0 and l1.

    Args:
        filename: Path of the FITS file, read with astropy.io.fits.getdata.
        l0: Lower bound of the wavelength range (same units as the 'Wave/freq' column).
        l1: Upper bound of the wavelength range (same units as the 'Wave/freq' column).

    Returns
        wavelengths, (h2o, co2, ch4, co, o3, n2o, o2)

    Notes:
        - O3 messes up in PSG at lam<550nm and high resolution bc computationally expensive,
          so don't use it if l1<550.
        - Rayleigh scattering is not used: it fails at NIR wavelengths and absorbs into a
          continuum fit anyhow.
    """
    table = fits.getdata(filename)

    x = table['Wave/freq']
    molecule_columns = [table[name] for name in ('H2O', 'CO2', 'CH4', 'CO', 'O3', 'N2O', 'O2')]

    # Delete non unique points (they still pop up at very high resolutions).
    idelete = np.where(np.diff(x) < .0001)[0]
    x = np.delete(x,idelete)
    molecule_columns = [np.delete(column,idelete) for column in molecule_columns]

    isub = np.where((x > l0) & (x < l1))[0]
    return x[isub], tuple(column[isub] for column in molecule_columns)




[docs]
def scale_psg(psg_tuple, airmass, pwv):
    """ Combine the PSG spectra of the individual molecules into a single scaled model.

    Parameters
    ----------
    psg_tuple : (tuple) of loaded psg spectral components from "open_psg_allmol" fxn,
        ordered as (h2o, co2, ch4, co, o3, n2o, o2)
    airmass: (float) airmass of final spectrum applied to all molecules spectra
    pwv: (float) extra scaling for h2o spectrum to account for changes in the precipitable water vapor

    Returns
    -------
    model : h2o**(airmass + pwv) multiplied by the product of the other molecules raised to the airmass
    """
    h2o, co2, ch4, co, o3, n2o, o2 = psg_tuple

    # Water gets the extra pwv exponent, all the other species only scale with the airmass.
    water_term = h2o**(airmass + pwv)
    other_species = co2 * ch4 * co * o3 * n2o * o2
    return water_term * other_species**airmass




[docs]
def rotate_coordinates(x, y, angle, flipx=False):
    """ Rotate a set of 2D coordinates, optionally flipping the x-axis first.

    The transformation is x' = cos(angle)*x + sin(angle)*y and
    y' = -sin(angle)*x + cos(angle)*y.

    Parameters
    ----------
    x
        x coordinates (scalar or array-like).
    y
        y coordinates, with as many elements as ``x``.
    angle
        Rotation angle in degrees.
    flipx : bool
        If True, the sign of ``x`` is inverted before the rotation.

    Returns
    -------
    rotated_x, rotated_y
        Rotated coordinates, both with the shape of ``x``.

    """
    output_shape = np.array(x).shape
    flat_x = np.array(x).ravel()
    flat_y = np.array(y).ravel()
    if flipx:
        flat_x = -flat_x

    theta = np.radians(angle)
    cos_theta, sin_theta = np.cos(theta), np.sin(theta)
    rotation = np.array([[cos_theta, sin_theta],
                         [-sin_theta, cos_theta]])

    # One matrix product rotates all the points at once: rows are x and y.
    new_x, new_y = np.dot(rotation, np.array([flat_x, flat_y]))
    return np.reshape(new_x,output_shape), np.reshape(new_y,output_shape)




[docs]
def propagate_coordinates_at_epoch(targetname, date, verbose=True):
    """Get coordinates at an epoch for some target, taking into account proper motions.

    Retrieves the SIMBAD coordinates, applies proper motion, returns the result as an
    astropy coordinates object

    Parameters
    ----------
    targetname : str
        Target name, resolvable by SIMBAD
    date : str, or astropy.time.Time
        Epoch of observation, in a format understandable by astropy.time.Time, e.g. "YYYY-MM-DD"
    verbose : bool
        Print more verbose text output?

    Returns
    -------
    an astropy.coordinates.SkyCoord for the computed position

    Raises
    ------
    ValueError
        If the SIMBAD query returns no result for ``targetname``.

    """

    # Use a private query object so that the extra fields are not accumulated on the
    # module-level Simbad instance shared by the whole process.
    simbad_query = Simbad()
    simbad_query.add_votable_fields("ra",  # Right ascension
                                    "dec",  # Declination
                                    "pmra",  # Proper motion in RA
                                    "pmdec",  # Proper motion in Dec.
                                    "plx_value")  # Parallax

    if verbose:
        print(f"Retrieving SIMBAD coordinates for {targetname}")

    result_table = simbad_query.query_object(targetname)

    if result_table is None:
        raise ValueError(f"{targetname} not found in SIMBAD database. Try with another target name recognized by SIMBAD.")

    # Get the coordinates, proper motion and parallax from the first row of the result table
    ra = result_table["ra"][0]
    dec = result_table["dec"][0]
    pm_ra = result_table["pmra"][0]
    pm_dec = result_table["pmdec"][0]
    plx = result_table["plx_value"][0]

    # Create a SkyCoord object with the coordinates and proper motion
    target_coord_j2000 = astropy.coordinates.SkyCoord(ra, dec, unit=(u.deg, u.deg),
                                                      pm_ra_cosdec=pm_ra * u.mas / u.year,
                                                      pm_dec=pm_dec * u.mas / u.year,
                                                      distance=astropy.coordinates.Distance(parallax=plx * u.mas),
                                                      frame='icrs', obstime='J2000.0')
    # Convert the desired date to an astropy Time object
    t = Time(date)

    # Calculate the updated SkyCoord object for the desired date
    host_coord_at_date = target_coord_j2000.apply_space_motion(new_obstime=t)

    if verbose:
        print(f"Coordinates at J2000:  {target_coord_j2000.icrs.to_string('hmsdms')}")
        print(f"Coordinates at {date}:  {host_coord_at_date.icrs.to_string('hmsdms')}")

    return host_coord_at_date



[docs]
@u.quantity_input(comp_sep=u.arcsec, comp_pa=u.deg)
def companion_relative_to_absolute_position(star_name, comp_name, comp_sep, comp_pa, obs_date, verbose=True):
    """ Compute absolute ICRS coordinates of a substellar companion at a given date

    The host star coordinates are obtained from propagate_coordinates_at_epoch() at the
    requested date. The separation and position angle are converted into offsets
    (comp_sep*sin(comp_pa) in longitude, comp_sep*cos(comp_pa) in latitude) in the sky
    offset frame centered on the star, which are then transformed to ICRS. With
    ``verbose``, the results and a crosscheck are printed, in a format suitable to enter
    into APT.

    Parameters
    ----------
    star_name : str
        Star name, resolvable by SIMBAD
    comp_name : str
        Companion name, for display
    comp_sep : astropy.units.Quantity
        Separation of the companion relative to the host, for instance in arcseconds
    comp_pa : astropy.units.Quantity
        Position angle of the companion relative to North, for instance in degrees east of north
    obs_date : str or astropy.time.Time
        Observation epoch, in a format understandable by astropy.time
    verbose : bool
        Be more verbose in output?

    Returns
    -------
    planet_coord : astropy.coordinates.SkyCoord
        Computed absolute ICRS coordinates of the companion at the specified epoch
    """

    if verbose:
        print("**HOST STAR:**")
    star_coord = propagate_coordinates_at_epoch(star_name, date=obs_date, verbose=verbose)
    if verbose:
        print(f'Proper motion  pm_ra_cosdec: {star_coord.pm_ra_cosdec:.3f}\tpm_dec: {star_coord.pm_dec:.3f}'  )
        print(f'Parallax : {1000/star_coord.distance.to_value(u.pc):.3f} mas'  )

    # Convert from (sep, pa) to (dRA, dDec)
    pa_rad = np.deg2rad(comp_pa)
    d_dec = comp_sep * np.cos(pa_rad)
    d_ra = comp_sep * np.sin(pa_rad)

    # Place the companion at those offsets in the frame centered on the star, then go back to ICRS
    offset_frame = astropy.coordinates.SkyOffsetFrame(origin=star_coord)
    companion_offset = astropy.coordinates.SkyCoord(lon=d_ra, lat=d_dec, frame=offset_frame)
    planet_coord = companion_offset.transform_to(astropy.coordinates.ICRS)

    if not verbose:
        return planet_coord

    print("\n**COMPANION:**")
    print(f"{comp_name} has r={comp_sep}, pa={comp_pa}, which is (dDec,dR.A.) = {d_dec:.3f}, {d_ra:.3f}")
    print(f"{comp_name} ICRS coords at {obs_date}: "+planet_coord.to_string('hmsdms'))
    print("")
    print(f"        Crosscheck PA: {star_coord.position_angle(planet_coord).to(u.deg):.3f}  should equal {comp_pa}")
    print(f"        Crosscheck sep: {star_coord.separation(planet_coord).to(u.arcsec):.6f}  should equal {comp_sep} ")
    print(f"        if the above are not equal then something went wrong in this calculation. ")
    print("")

    print('**COMPANION ABSOLUTE POINTING INFO FOR APT:**')
    print(f'\tName:\t\t\t{comp_name}')
    print(f'\tICRS coordinates:\t{planet_coord.to_string("hmsdms", sep=" ")}')
    print(f'\tEpoch:\t\t\t{astropy.time.Time(obs_date).jyear:.2f}')
    print(f'\tProper Motion:\t\tRA: {star_coord.pm_ra_cosdec:.3f}\tDec: {star_coord.pm_dec:.3f}')
    print(f'\tAnnual Parallax:\t{1/star_coord.distance.to_value(u.pc):.4f} arcsec')
    return planet_coord




[docs]
def pixgauss2d(p, shape, hdfactor=10, xhdgrid=None, yhdgrid=None):
    """ Pixelated 2D gaussian model on top of a constant background.

    The gaussian is evaluated on a grid ``hdfactor`` times finer than the pixels and
    averaged over each pixel.

    Parameters
    ----------
    p : sequence
        ``(A, xA, yA, w, bkg)``: normalisation of the gaussian (multiplied by
        1/(2*pi*w**2)), x and y position of its center in pixels, standard deviation
        in pixels, and constant background.
    shape : tuple
        ``(ny, nx)`` shape of the output image.
    hdfactor : int
        Oversampling factor of the fine grid. Ignored when both grids are provided, in
        which case it is derived from the shape of ``xhdgrid``.
    xhdgrid, yhdgrid : np.ndarray, optional
        Precomputed x and y coordinates of the fine grid, of shape
        ``(hdfactor*ny, hdfactor*nx)``. Computed when either of them is None.

    Returns
    -------
    np.ndarray
        Model image of shape ``(ny, nx)``.
    """
    A, xA, yA, w, bkg = p
    ny, nx = shape
    if xhdgrid is None or yhdgrid is None:
        # The builtin float replaces np.float, which was removed in NumPy 1.24.
        xhdgrid, yhdgrid = np.meshgrid(np.arange(hdfactor * nx).astype(float) / hdfactor,
                                       np.arange(hdfactor * ny).astype(float) / hdfactor)
    else:
        hdfactor = xhdgrid.shape[0] // ny
    gaussA_hd = A / (2 * np.pi * w ** 2) * np.exp(
        -0.5 * ((xA - xhdgrid) ** 2 + (yA - yhdgrid) ** 2) / w ** 2)
    # Average the hdfactor x hdfactor fine samples belonging to each pixel.
    gaussA = np.nanmean(np.reshape(gaussA_hd, (ny, hdfactor, nx, hdfactor)), axis=(1, 3))
    return gaussA + bkg




[docs]
def nonlin_lnprior_func(nonlin_paras, nonlin_paras_mins,nonlin_paras_maxs):
    """ Flat log-prior with hard bounds, for emcee.

    Returns -infinity as soon as one parameter is strictly below its minimum
    (nonlin_paras_mins) or strictly above its maximum (nonlin_paras_maxs), and 0 otherwise.
    """
    bounded_paras = zip(nonlin_paras, nonlin_paras_mins, nonlin_paras_maxs)
    if any(value > upper or value < lower for value, lower, upper in bounded_paras):
        return -np.inf
    return 0