Source code for seda.chi2_fit

import numpy as np
import time
import os
import astropy.units as u
import pickle
import copy
from spectres import spectres
from tqdm.auto import tqdm
from astropy.io import ascii
from astropy.table import vstack
from lmfit import Minimizer, minimize, Parameters, report_fit # model fit for non-linear least-squares problems
from sys import exit
from . import utils
from . import models


[docs]def chi2(my_chi2):
	'''
	Description:
	------------
		Minimize the chi-square statistic to find the best model fits.

	Parameters:
	-----------
	- my_chi2 : return parameters from ``seda.Chi2Options``, which also includes the parameters from ``seda.InputData`` and ``seda.ModelOptions``.

	Returns:
	--------
	- '``model``\_chi2\_minimization.dat' : ascii table
		Table with the names of all model spectra fits sorted by chi square and including the information: 
		spectrum name, chi square, reduced chi square, scaling, scaling error, extinction, extinction error, 
		model free parameters, radius and error (if ``distance and ``edistance`` are provided), and
		iterations to minimize chi-square.
	- '``model``\_chi2\_minimization.pickle' : dictionary
		Dictionary with the results from the chi-square minimization, namely:
			- ``my_chi2`` input dictionary returned by ``input_parameters.Chi2Options``.
			- ``iterations_fit``: number of iterations to minimize chi-square.
			- ``Av_fit``: visual extinction (in mag) that minimizes chi-square.
			- ``eAv_fit``: visual extinction uncertainty (in mag).
			- ``scaling_fit``: scaling factor that minimizes chi-square.
			- ``escaling_fit``: scaling factor uncertainty.
			- ``chi2_wl_fit``: chi-square as a function of wavelength.
			- ``chi2_red_wl_fit``: reduced chi-square as a function of wavelength.
			- ``chi2_fit``: total chi-square.
			- ``chi2_red_fit``: total reduced chi-square.
			- ``radius``: (if ``distance`` is provided) radius (in Rjup) considering the ``scaling_fit`` and input ``distance``.
			- ``eradius``: (if ``edistance`` is provided) radius uncertainty (in Rjup).
			- ``params``: model free parameters for each model spectrum.
			- ``flux_array_model_conv_resam_scaled``: (if ``fit spectra``) input ``flux_array_model_conv_resam`` fluxes multiplied by the scaling factor ``scaling_fit``.
			- ``flux_array_model_conv_resam_scaled_fit``: (if ``fit spectra``) input ``flux_array_model_conv_resam_fit`` fluxes multiplied by the scaling factor ``scaling_fit``.
			- ``flux_residuals_spec``: (if ``fit spectra``) linear flux residual (in erg/cm2/s/A) between observed spectra and model spectra in ``fit_wl_range``.
			- ``logflux_residuals_spec``: (if ``fit spectra``) logarithm flux residual (in erg/cm2/s/A) between observed spectra and model spectra in ``fit_wl_range``.
			- ``flux_syn_array_model_scaled_fit``: (if ``fit photometry``) input ``flux_syn_array_model_fit`` fluxes multiplied by the scaling factor ``scaling_fit``.
			- ``flux_residuals_phot``: (if ``fit photometry``) linear flux residual (in erg/cm2/s/A) between observed photometry and model spectra in ``fit_phot_range``.
			- ``logflux_residuals_phot``: (if ``fit photometry``) logarithm flux residual (in erg/cm2/s/A) between observed photometry and model spectra in ``fit_phot_range``.

	Example:
	--------
	>>> import seda
	>>> 
	>>> # load input data
	>>> wl_spectra = wl_input # in um
	>>> flux_spectra = flux_input # in erg/cm^2/s/A
	>>> eflux_spectra = eflux_input # in erg/cm^2/s/A
	>>> my_data = seda.InputData(wl_spectra=wl_spectra, flux_spectra=flux_spectra, 
	>>>                          eflux_spectra=eflux_spectra)
	>>> 
	>>> # load model options
	>>> model = 'Sonora_Elf_Owl'
	>>> model_dir = ['my_path/output_700.0_800.0/', 
	>>>              'my_path/output_850.0_950.0/'] # folders to seek model spectra
	>>> params_ranges = {'Teff': [700, 900, 'logg': [4.0, 5.0]
	>>> my_model = seda.ModelOptions(model=model, model_dir=model_dir, 
	>>>                              params_ranges=params_ranges)
	>>> 
	>>> # load chi-square options
	>>> fit_wl_range = np.array([value1, value2]) # to make the fit between value1 and value2
	>>> my_chi2 = seda.Chi2FitOptions(my_data=my_data, my_model=my_model, 
	>>>                               fit_wl_range=fit_wl_range)
	>>> 
	>>> # run chi-square fit
	>>> out_chi2 = seda.chi2(my_chi2)
	    Chi square fit ran successfully

	Author: Genaro Suárez
	'''

	ini_time_chi2 = time.time() # to estimate the time elapsed running chi2
	print('\n   Running chi-square fitting...')

	# load input parameters
	# all are stored in my_chi2 but they were defined in different classes
	# from InputData
	fit_spectra = my_chi2.fit_spectra
	fit_photometry = my_chi2.fit_photometry
	wl_spectra = my_chi2.wl_spectra
	flux_spectra = my_chi2.flux_spectra
	eflux_spectra = my_chi2.eflux_spectra
	phot = my_chi2.phot
	ephot = my_chi2.ephot
	filters = my_chi2.filters
	res = my_chi2.res
	lam_res = my_chi2.lam_res
	distance = my_chi2.distance
	edistance = my_chi2.edistance
	# from ModelOptions
	model = my_chi2.model
	model_dir = my_chi2.model_dir
	wl_model = my_chi2.wl_model
	flux_model = my_chi2.flux_model
	params_ranges = my_chi2.params_ranges
	path_save_spectra_conv = my_chi2.path_save_spectra_conv
	skip_convolution = my_chi2.skip_convolution
	# from Chi2Options
	save_results = my_chi2.save_results
	scaling_free_param = my_chi2.scaling_free_param
	scaling = my_chi2.scaling
	extinction_free_param = my_chi2.extinction_free_param
	avoid_IR_excess = my_chi2.avoid_IR_excess
	IR_excess_limit = my_chi2.IR_excess_limit
	fit_wl_range = my_chi2.fit_wl_range
	model_wl_range = my_chi2.model_wl_range
	disp_wl_range = my_chi2.disp_wl_range
	N_model_spectra = my_chi2.N_model_spectra
	if (model is not None) & (model_dir is not None):
		spectra_name = my_chi2.spectra_name
		spectra_name_full = my_chi2.spectra_name_full
	if fit_spectra:
		N_spectra = my_chi2.N_spectra
		wl_spectra_min = my_chi2.wl_spectra_min
		wl_spectra_max = my_chi2.wl_spectra_max
		N_datapoints = my_chi2.N_datapoints
		wl_array_obs_fit = my_chi2.wl_array_obs_fit
		flux_array_obs_fit = my_chi2.flux_array_obs_fit
		eflux_array_obs_fit = my_chi2.eflux_array_obs_fit
		# make deepcopy of the following attributes to avoid modifying the original ones (stores in my_chi2) 
		# when updating the fluxing after applying the scaling factor
		wl_array_model_conv_resam = copy.deepcopy(my_chi2.wl_array_model_conv_resam)
		flux_array_model_conv_resam = copy.deepcopy(my_chi2.flux_array_model_conv_resam)
		wl_array_model_conv_resam_fit = copy.deepcopy(my_chi2.wl_array_model_conv_resam_fit)
		flux_array_model_conv_resam_fit = copy.deepcopy(my_chi2.flux_array_model_conv_resam_fit)
		weight_spec_fit = my_chi2.weight_spec_fit 
	if fit_photometry:
		flux_syn_array_model_fit = my_chi2.flux_syn_array_model_fit.copy() # make a copy because it will be scaled
		lambda_eff_array_model_fit = my_chi2.lambda_eff_array_model_fit
		width_eff_array_model_fit = my_chi2.width_eff_array_model_fit
		lambda_eff_SVO = my_chi2.lambda_eff_SVO
		width_eff_SVO = my_chi2.width_eff_SVO
		phot_fit = my_chi2.phot_fit
		ephot_fit = my_chi2.ephot_fit
		filters_fit = my_chi2.filters_fit
		lambda_eff_SVO_fit = my_chi2.lambda_eff_SVO_fit
		width_eff_SVO_fit = my_chi2.width_eff_SVO_fit
		weight_phot_fit = my_chi2.weight_phot_fit 

	# initialize variables to save key parameters from the fit
	scaling_fit = np.zeros(N_model_spectra) * np.nan
	escaling_fit = np.zeros(N_model_spectra) * np.nan
	Av_fit = np.zeros(N_model_spectra) * np.nan
	eAv_fit = np.zeros(N_model_spectra) * np.nan
	iterations_fit = np.zeros(N_model_spectra) * np.nan
	chi2_fit = np.zeros(N_model_spectra) * np.nan
	chi2_red_fit = np.zeros(N_model_spectra) * np.nan
	chi2_wl_fit = []
	chi2_red_wl_fit = []

	# create a tqdm progress bar
	chi2_bar = tqdm(total=N_model_spectra, desc='Minimizing chi-square')
	for i in range(N_model_spectra): # for each model spectrum
		# update the progress bar
		chi2_bar.update(1)

		# define free parameters in the fit
		params = Parameters()
		if not extinction_free_param: params.add('extinction', value=0, vary=False) # fixed parameter
		if extinction_free_param: params.add('extinction', value=0) # free parameter
		if not scaling_free_param: params.add('scaling', value=scaling, vary=False) # fixed parameter
		if scaling_free_param: params.add('scaling', value=1e-20) # free parameter

		# minimize chi square
		if fit_spectra and not fit_photometry:
			data_fit = flux_array_obs_fit[i] # all input fluxes
			edata_fit = eflux_array_obs_fit[i] # all input flux uncertainties
			model_fit = flux_array_model_conv_resam_fit[i] # model fluxes from each resampled and convolved model spectrum
			weight_fit = weight_spec_fit
		if not fit_spectra and fit_photometry:
			data_fit = [phot_fit]
			edata_fit = [ephot_fit]
			model_fit = [flux_syn_array_model_fit[i]]
			weight_fit = [weight_phot_fit]
		if fit_spectra and fit_photometry:
			data_fit = flux_array_obs_fit[i] + [phot_fit]
			edata_fit = eflux_array_obs_fit[i] + [ephot_fit]
			model_fit = flux_array_model_conv_resam_fit[i] + [flux_syn_array_model_fit[i]]
			weight_fit = weight_spec_fit + [weight_phot_fit]

		minner = Minimizer(residuals_for_chi2, params, fcn_args=(data_fit, edata_fit, model_fit, weight_fit))
		out_lmfit = minner.minimize(method='leastsq') # 'leastsq': Levenberg-Marquardt (default)

		# save parameters
		iterations_fit[i] = out_lmfit.nfev # number of function evaluations in the fit
		Av_fit[i] = out_lmfit.params['extinction'].value
		eAv_fit[i] = out_lmfit.params['extinction'].stderr # half the difference between the 15.8 and 84.2 percentiles of the PDF
		scaling_fit[i] = out_lmfit.params['scaling'].value
		escaling_fit[i] = out_lmfit.params['scaling'].stderr # half the difference between the 15.8 and 84.2 percentiles of the PDF
		chi2_fit[i] = out_lmfit.chisqr # resulting chi-square from lmfit
		chi2_red_fit[i] = out_lmfit.redchi # resulting reduced chi square from lmfit
		chi2_wl_fit.append(out_lmfit.residual**2) # chi square for each data point from lmfit
		chi2_red_wl_fit.append(out_lmfit.residual**2 / out_lmfit.nfree) # reduced chi square for each data point from lmfit

		# scale model fluxes by the value that minimizes chi2
		if fit_spectra:
			for k in range(N_spectra): # for each input observed spectrum
				flux_array_model_conv_resam[i][k] = flux_array_model_conv_resam[i][k] * scaling_fit[i]
				flux_array_model_conv_resam_fit[i][k] = flux_array_model_conv_resam_fit[i][k] * scaling_fit[i]
		if fit_photometry:
			flux_syn_array_model_fit[i] = flux_syn_array_model_fit[i] * scaling_fit[i]

	# close progress bar
	chi2_bar.close()

	# radius from the scaling factor and cloud distance
	if distance!=None: # derive radius only if a distance is provided
		distance_km = (distance*u.parsec).to(u.km) # distance in km
		radius_km = np.sqrt(scaling_fit) * distance_km # in km
		radius = radius_km.to(u.R_jup).value # in R_jup
		if edistance!=None: # obtain radius error only if a distance error is provided
			edistance_km = (edistance*u.parsec).to(u.km) # distance error in km
			eradius_km = radius_km * np.sqrt((edistance_km/distance_km)**2 + (escaling_fit/(2*scaling_fit))**2) # in km
			eradius = eradius_km.to(u.R_jup).value # in Rjup

	#+++++++++++++++++++++++++++++++++
	# output dictionary
	out_chi2 = {'my_chi2': my_chi2}
	# add more elements to the dictionary
	if (model is not None) & (model_dir is not None):
		out_chi2.update({'spectra_name_full': spectra_name_full, 'spectra_name': spectra_name})
	out_chi2.update({'N_model_spectra': N_model_spectra, 'iterations_fit': iterations_fit, 'Av_fit': Av_fit, 
		            'eAv_fit': eAv_fit, 'scaling_fit': scaling_fit, 'escaling_fit': escaling_fit, 
		            'chi2_wl_fit': chi2_wl_fit, 'chi2_red_wl_fit': chi2_red_wl_fit, 
		            'chi2_fit': chi2_fit, 'chi2_red_fit': chi2_red_fit})#, 'weight_fit': weight_fit})

	# add more output parameters depending on the input information
	if fit_spectra: # when only spectra are used in the fit
		# resampled and convolved model spectra in the input spectra wavelength ranges
#		out_chi2['wl_array_model_conv_resam'] = wl_array_model_conv_resam
		out_chi2['flux_array_model_conv_resam_scaled'] = flux_array_model_conv_resam
		# resampled and convolved model spectra within the fit ranges
#		out_chi2['wl_array_model_conv_resam_fit'] = wl_array_model_conv_resam_fit
		out_chi2['flux_array_model_conv_resam_scaled_fit'] = flux_array_model_conv_resam_fit
#		# observed fluxes within the fit ranges
#		out_chi2['wl_array_obs_fit'] = wl_array_obs_fit
#		out_chi2['flux_array_obs_fit'] = flux_array_obs_fit
#		out_chi2['eflux_array_obs_fit'] = eflux_array_obs_fit
	if fit_photometry: # when photometry is used in the fit
#		# photometric magnitudes within the wavelength range for the fit
#		out_chi2['phot_fit'] = phot_fit
#		out_chi2['ephot_fit'] = ephot_fit
#		out_chi2['filters_fit'] = filters_fit
#		# information from SVO for the selected filters
#		out_chi2['lambda_eff_SVO_fit'] = lambda_eff_SVO_fit
#		out_chi2['width_eff_SVO_fit'] = width_eff_SVO_fit
#		# information from model spectra for the selected filters
#		out_chi2['lambda_eff_array_model_fit'] = lambda_eff_array_model_fit
#		out_chi2['width_eff_array_model_fit'] = width_eff_array_model_fit
		# synthetic photometry from each model for the selected filters
		out_chi2['flux_syn_array_model_scaled_fit'] = flux_syn_array_model_fit
	if distance!=None: # when a radius was obtained
		out_chi2['radius'] = radius
		if edistance!=None:
			out_chi2['eradius'] = eradius

	# obtain residuals in linear and logarithmic-scale for fluxes in the fit range
	flux_residuals_spec = []
	logflux_residuals_spec = []
	flux_residuals_phot = []
	logflux_residuals_phot = []
	for i in range(N_model_spectra): # for each model spectrum
		flux_residuals_each = []
		logflux_residuals_each = []
		if fit_spectra:
			for k in range(N_spectra): # for each input observed spectrum
				# linear scale
				res_lin = flux_array_model_conv_resam_fit[i][k] - flux_array_obs_fit[i][k]
				flux_residuals_each.append(res_lin)
				# log scale
				mask_pos = flux_array_obs_fit[i][k]>0 # mask to avoid negative input fluxes to obtain the logarithm
				res_log = np.log10(flux_array_model_conv_resam_fit[i][k][mask_pos]) - np.log10(flux_array_obs_fit[i][k][mask_pos])
				logflux_residuals_each.append(res_log)
			# nested list with all resampled and convolved model spectra in the fit range
			flux_residuals_spec.append(flux_residuals_each)
			logflux_residuals_spec.append(logflux_residuals_each)
		if fit_photometry: 
			# linear scale
			res_lin = flux_syn_array_model_fit[i] - phot_fit
			# log scale
			mask_pos = phot_fit>0 # mask to avoid negative input fluxes to obtain the logarithm
			res_log = np.log10(flux_syn_array_model_fit[i][mask_pos]) - np.log10(phot_fit[mask_pos])
			# nested list with residuals for filters within the fit range for each model spectrum
			flux_residuals_phot.append(res_lin)
			logflux_residuals_phot.append(res_log)

	if fit_spectra:
		out_chi2['flux_residuals_spec'] = flux_residuals_spec
		out_chi2['logflux_residuals_spec'] = logflux_residuals_spec
	if fit_photometry: 
		out_chi2['flux_residuals_phot'] = flux_residuals_phot
		out_chi2['logflux_residuals_phot'] = logflux_residuals_phot

	# separate physical parameters from each model spectrum name
	if (model is not None) & (model_dir is not None):
		out_separate_params = models.separate_params(model=model, spectra_name=spectra_name)
		# add model spectra parameters to the output dictionary
		out_chi2.update(out_separate_params)

	# save some information
	if (model is not None) & (model_dir is not None):
		if save_results: # save table with model spectra sorted by chi square
			# save output dictionary as pickle
			with open(my_chi2.chi2_pickle_file, 'wb') as file:
				# serialize and write the variable to the file
				pickle.dump(out_chi2, file)
			print('      chi-square minimization results saved successfully')

			# save table with model spectra names sorted by chi square along with the parameters from each spectrum
			out_save_params = save_params(out_chi2=out_chi2)

	print('\n   Chi-square fit ran successfully')
	fin_time_chi2 = time.time()
	utils.print_time(fin_time_chi2-ini_time_chi2)

	return out_chi2

#########################
# Objective function to be minimized by ``Minimizer``.
def residuals_for_chi2(params, data, edata, model, weight):
#	'''
#	Description:
#	------------
#		Define objective function that returns the array to be minimized.
#
#	Parameters:
#	-----------
#	- params : ''lmfit.parameter.Parameters''
#		Parameters as ``Parameters()`` for fitting models to data using ``Minimizer``.
#	- data : array
#		Input data (spectra and/or photometry) for the fit.
#	- edata : array
#		Input data uncertainties for the fit.
#	- model : array
#		Model spectrum for the fit.
#	- extinction_curve : array, (0 when ``extinction_free_param=='no'``)
#		Extinction curve for wavelengths in the fit.
#	- weight: array
#		Weight given to each data point in the fit.
#
#	Returns:
#	--------
#	Objective function to be minimized by ``Minimizer``.
#
#	Author: Genaro Suárez
#	'''

	scaling = params['scaling']

	residuals = np.array([]) # initialize numpy array to save array with residual
	for i in range(len(data)): # for each input spectrum
		res = (data[i]-scaling*model[i]) / edata[i] # the square of this equation will be minimized by minner.minimize
		wnorm = weight[i]/np.mean(np.concatenate(weight)) # this keeps the overall chi2 scale consistent, but does not change the relative importance between spectra and photometry
		res = np.sqrt(wnorm)*res # multiply by weights normalized by mean(weight) so chi2 values have similar magnitude to the unweighted case
		residuals = np.concatenate([residuals, res])

	return  residuals

##########################
[docs]def save_params(out_chi2):
	'''
	Description:
	------------
		Create table with model spectra names sorted by chi square along with relevant parameters.

	Parameters:
	-----------
	- out_chi2 : dictionary
		Dictionary with the following parameters:
			- ``spectra_name`` : spectrum name
			- ``chi2_fit`` : chi-square
			- ``chi2_red_fit`` : reduced chi-square
			- ``scaling_fit`` : scaling factor 
			- ``e_scaling_fit`` : scaling factor uncertainty
			- ``Av_fit`` : extinction
			- ``eAv_fit`` : extinction uncertainty
			- ``params`` : fundamental parameters provided by ``model``.
			- ``R`` : radius, when a ``distance`` was provided.
			- ``eR`` : radius error, when ``distance`` and ``edistance`` were provided.
			- ``iterations_fit`` : iterations to minimize chi square.

	Returns:
	--------
	- ``chi2_table_file`` : ascii table
		ASCII table with input parameters sorted according to reduced chi-square.
		Table named ``chi2_table_file``, as specified in ``seda.Chi2Options``.

	Author: Genaro Suárez
	'''

	# sort index with respect to reduced chi-square
	ind = np.argsort(out_chi2['chi2_red_fit'])

	# read and sort relevant parameters from the input dictionary
	chi2 = out_chi2['chi2_fit'][ind] # chi-square as integer
	chi2_red = out_chi2['chi2_red_fit'][ind] # reduced chi-square with three decimals
	scaling_factor = out_chi2['scaling_fit'][ind]
	escaling_factor = out_chi2['escaling_fit'][ind]
	Av = out_chi2['Av_fit'][ind] # Av
	eAv = out_chi2['eAv_fit'][ind] # Av error
	iterations = out_chi2['iterations_fit'][ind] # iterations in the minimization
	if 'spectra_name' in out_chi2:
		filename = out_chi2['spectra_name'][ind] # filename
		params = out_chi2['params']  # free model paramters
		for param in params:
			params[param] = params[param][ind]
	if out_chi2['my_chi2'].distance is not None:
		R = out_chi2['radius'][ind] # radius
		eR = out_chi2['eradius'][ind] # radius error

	# make dictionary with parameters of interest
	my_dict = {} # initialize dictionary
	if 'spectra_name' in out_chi2:
		my_dict['filename'] = filename
	my_dict['chi2'] = np.round(chi2).astype(int) # chi-square as integer
	my_dict['chi2_red'] = np.round(chi2_red,3) # reduced chi-square with three decimals
	# round scaling and its error, which have scientific notation
	scaling = np.array([])
	escaling = np.array([])
	for i,scal in enumerate(scaling_factor): # for each scaling value
	    scaling = np.append(scaling, format(scaling_factor[i], '.3e')) # keep three decimals
	    escaling = np.append(escaling, format(escaling_factor[i], '.3e')) # keep three decimals
	my_dict['scaling'] = scaling # scaling
	my_dict['escaling'] = escaling # scaling error
	my_dict['Av'] = Av # Av
	my_dict['eAv'] = eAv # Av error
	if 'spectra_name' in out_chi2:
		my_dict.update(params) # free model paramters
	if out_chi2['my_chi2'].distance is not None:
		my_dict['R'] = np.round(R,3) # radius
		my_dict['eR'] = np.round(eR,3) # radius error
	my_dict['iterations'] = iterations.astype(int) # iterations in the minimization

	# save dictionary as a PrettyTable table
	table_name = out_chi2['my_chi2'].chi2_table_file
	utils.save_prettytable(my_dict=my_dict, table_name=table_name)

	return  

##########################
# number of elements in a nested list
def count_elements_nested_list(lst):
	count = 0
	for i in range(len(lst)):
		for j in range(len(lst[i])):
			count += len(lst[i][j])

	return count