diff options
author | Aaron LI <aaronly.me@outlook.com> | 2015-06-06 15:56:55 +0800 |
---|---|---|
committer | Aaron LI <aaronly.me@outlook.com> | 2015-06-06 15:56:55 +0800 |
commit | 5e6819924a832b6ab5cf860dc2adfbf14e1fd120 (patch) | |
tree | e4a6035e09fc9825322ca9b6d219196c694f9964 /astro/fitting | |
parent | b2022f919cc595464c1f650fab64563c1055ad87 (diff) | |
download | atoolbox-5e6819924a832b6ab5cf860dc2adfbf14e1fd120.tar.bz2 |
Major update to 'fit_betasbp_cut.py'.
fit_betasbp_cut.py:
* replace getopt with 'argparse'
* added 'get_parameter' to process model parameter initial value and bounds
* support read parameter bounds from input file
* added options '--s0', '--rc', '--beta', '--const' to get paramter
initial values and bounds
* renamed 'fit_beta_model' to 'fit_model', and added argument 'func' to
support other models
Diffstat (limited to 'astro/fitting')
-rwxr-xr-x | astro/fitting/fit_betasbp_cut.py | 306 |
1 files changed, 210 insertions, 96 deletions
diff --git a/astro/fitting/fit_betasbp_cut.py b/astro/fitting/fit_betasbp_cut.py index 4b530f4..4e37f91 100755 --- a/astro/fitting/fit_betasbp_cut.py +++ b/astro/fitting/fit_betasbp_cut.py @@ -11,22 +11,39 @@ # 2015/05/29 # # Changelogs: -# 2015/05/30: +# v0.4.0, 2015/06/06, Aaron LI +# * replace getopt with 'argparse' +# * added 'get_parameter' to process model parameter initial value and bounds +# * support read parameter bounds from input file +# * added options '--s0', '--rc', '--beta', '--const' to get paramter +# initial values and bounds +# * renamed 'fit_beta_model' to 'fit_model', and added argument 'func' to +# support other models +# v0.3.0, 2015/06/02, Aaron LI +# * can output chi-squared and dof values +# * can output one standard deviation errors on the parameters +# v0.2.0, 2015/05/30: # * Added option '-n' / '--no-radius' to ignore radius less than the # given value. # * Support read model initial parameter values from input file. # +# TODO: +# * to allow restrict the range of parameters / just fix it +# from __future__ import print_function, division +__version__ = "0.4.0" +__date__ = "2015/06/06" + import numpy as np -from scipy.optimize import curve_fit +from scipy.optimize import curve_fit, minimize import os import sys -import getopt import re +import argparse # modes of to cut data @@ -41,7 +58,18 @@ def beta_model(r, s0, rc, beta, c): return s0 * np.power((1.0+(r/rc)**2), 0.5-3*beta) + c -def fit_beta_model(xdata, ydata, yerrdata, p0, +def calc_chisq(func, xdata, ydata, yerrdata, *args): + """ + Calculate the chi-squared values for the given function according + to the provided data points. + """ + xdata = np.array(xdata) + ydata = np.array(ydata) + yerrdata = np.array(yerrdata) + return np.sum(((ydata - func(xdata, *args)) / yerrdata) ** 2) + + +def fit_model(func, xdata, ydata, yerrdata, p0, cutmode=CUT_POINT, cutvalue=0): """ Fit the provided data with the beta model. @@ -53,7 +81,14 @@ def fit_beta_model(xdata, ydata, yerrdata, p0, cutvalue: the cut limit Return: - [fitted_par, fitted_cov, fitted_model_value] + (popt, pcov, infodict) + popt: optimal values for the parameters + pcov: 2d array; the estimated covariance of popt + infodict: + * fvec: the function evaluated at the output parameters + * dof: degree of freedom + * chisq: chi-squared + * perr: one standard deviation errors on the parameters """ if cutmode == CUT_POINT: xdata2 = xdata[cutvalue:] @@ -66,10 +101,52 @@ def fit_beta_model(xdata, ydata, yerrdata, p0, yerrdata2 = yerrdata[ii] else: raise ValueError('Unknown cut mode: %s' % cutmode) - par_fit, cov_fit = curve_fit(beta_model, xdata2, ydata2, + popt, pcov = curve_fit(func, xdata2, ydata2, p0=p0, sigma=yerrdata2) - y_fit = beta_model(xdata, *par_fit) - return (par_fit, cov_fit, y_fit) + # the function evaluated at the output parameters + fvec = lambda x: func(x, *popt) + # degree of freedom + dof = len(xdata2) - len(popt) + # chi squared + chisq = np.sum(((ydata2 - fvec(xdata2)) / yerrdata2) ** 2) + # one standard deviation errors on the parameters + perr = np.sqrt(np.diag(pcov)) + infodict = { + 'fvec': fvec, + 'dof': dof, + 'chisq': chisq, + 'perr': perr + } + return (popt, pcov, infodict) + + +def get_parameter(pstring): + """ + Process the parameter string of the following format, and return + the initial value, lower limit, and upper limit. + "init_value" + "init_value lower upper" + "init_value,lower,upper" + If want to ignore the lower/upper limit, use 'None' (case-insensitive), + and the None is returned. + """ + parameters = pstring.replace(',', ' ').split() + if len(parameters) == 1: + init_value = float(parameters[0]) + return (init_value, None, None) + elif len(parameters) == 3: + init_value = float(parameters[0]) + if parameters[1].upper() == 'NONE': + lower_value = None + else: + lower_value = float(parameters[1]) + if parameters[2].upper() == 'NONE': + upper_value = None + else: + upper_value = float(parameters[2]) + return (init_value, lower_value, upper_value) + else: + raise ValueError('Invalid parameter format: %s' % pstring) def main(): @@ -83,44 +160,73 @@ def main(): rc_0 = 10.0 beta_0 = 0.6 c_0 = 0.0 - # debug - verbose = False - - try: - opts, args = getopt.getopt(sys.argv[1:], 'c:hi:n:o:v', - ['cut-point=', 'help', 'infile=', 'no-radius=', - 'outfile=', 'verbose']) - except getopt.GetoptError as e: - print(e, file=sys.stderr) - usage() - sys.exit(2) - - for opt, arg in opts: - if opt in ('-h', '--help'): - usage() - sys.exit(0) - elif opt in ('-v', '--verbose'): - verbose = True - elif opt in ('-i', '--infile'): - infile = arg - elif opt in ('-o', '--outfile'): - outfilename = arg - elif opt in ('-c', '--cut-point'): - cutvalue = int(arg) - cutmode = CUT_POINT - elif opt in ('-n', '--no-radius'): - cutvalue = float(arg) - cutmode = CUT_RADIUS - else: - assert False, 'unhandled option' - - if not infile: - print('ERROR: --infile required', file=sys.stderr) - sys.exit(11) - if outfilename: - outfile = open(outfilename, 'w') + # default bounds for the four parameters + s0_lower, s0_upper = None, None + rc_lower, rc_upper = None, None + beta_lower, beta_upper = None, None + c_lower, c_upper = None, None + + # parser for command line options and arguments + parser = argparse.ArgumentParser( + description="Fitting provided data with the beta model.", + epilog="Version: %s (%s)" % (__version__, __date__)) + parser.add_argument("-v", "--verbose", dest="verbose", + action="store_true", default=False, + help="show verbose/debug information") + parser.add_argument("-V", "--version", action="version", + version="%(prog)s " + "%s (%s)" % (__version__, __date__)) + parser.add_argument("-i", "--infile", + dest="infile", required=True, + help="""input data file with the following 4 or 3 columns: + [radius radius_err brightness brightness_err], + [radius brightness brightness_err]. + Note: The initial values and lower/upper limits + for the beta models can also be provided with the + following syntax: + # s0_0 = init_value, lower_limit, upper_limit + # rc_0 = init_value, lower_limit, upper_limit + # beta_0 = init_value, lower_limit, upper_limit + # c_0 = init_value, lower_limit, upper_limit""") + parser.add_argument("-o", "--outfile", dest="outfilename", + help="output file to store the fitted data") + parser.add_argument("-c", "--cut-point", + dest="cut_point", metavar="N", type=int, default=0, + help="number of inner-most data points to be ignored") + parser.add_argument("-n", "--no-radius", + dest="cut_radius", metavar="RADIUS", type=float, default=0.0, + help="ignore data points with smaller radius") + parser.add_argument("--s0", dest="s0", + metavar="init_value,lower,upper", + help="initial value and lower/upper limits for parameter s0. " + \ + "Use 'none' (case-insensitive) to ignore the limit") + parser.add_argument("--rc", dest="rc", + metavar="init_value,lower,upper", + help="initial value and lower/upper limits for parameter rc. " + \ + "Use 'none' (case-insensitive) to ignore the limit") + parser.add_argument("--beta", dest="beta", + metavar="init_value,lower,upper", + help="initial value and lower/upper limits for parameter beta. " + \ + "Use 'none' (case-insensitive) to ignore the limit") + parser.add_argument("--const", dest="const", + metavar="init_value,lower,upper", + help="initial value and lower/upper limits for parameter const. " + \ + "Use 'none' (case-insensitive) to ignore the limit") + + args = parser.parse_args() + if args.outfilename: + outfile = open(args.outfilename, 'w') else: outfile = sys.stdout + # cut mode and value + if args.cut_point: + cutmode = CUT_POINT + cutvalue = args.cut_point + elif args.cut_radius: + cutmode = CUT_RADIUS + cutvalue = args.cut_radius + + if args.verbose: + print("DEBUG: cutmode: %s, cutvalue: %s" % (cutmode, cutvalue)) # input data list r_data = [] @@ -135,19 +241,23 @@ def main(): re_rc = re.compile(r'^\s*#\s*rc_0\s*[:=]') re_beta = re.compile(r'^\s*#\s*beta_0\s*[:=]') re_c = re.compile(r'^\s*#\s*c_0\s*[:=]') - for line in open(infile, 'r'): + for line in open(args.infile, 'r'): if re_s0.match(line): # read 's0_0': initial value for parameter 's0' - s0_0 = float(re_s0.split(line)[1]) + s0_pstring = re_s0.split(line)[1] + s0_0, s0_lower, s0_upper = get_parameter(s0_pstring) elif re_rc.match(line): # read 'rc_0': initial value for parameter 'rc' - rc_0 = float(re_rc.split(line)[1]) + rc_pstring = re_rc.split(line)[1] + rc_0, rc_lower, rc_upper = get_parameter(rc_pstring) elif re_beta.match(line): # read 'beta_0': initial value for parameter 'beta' - beta_0 = float(re_beta.split(line)[1]) + beta_pstring = re_beta.split(line)[1] + beta_0, beta_lower, beta_upper = get_parameter(beta_pstring) elif re_c.match(line): # read 'c_0': initial value for parameter 'c' - c_0 = float(re_c.split(line)[1]) + c_pstring = re_c.split(line)[1] + c_0, c_lower, c_upper = get_parameter(c_pstring) elif re_blank.match(line): # ignore blank line continue @@ -170,68 +280,72 @@ def main(): s_data.append(s) serr_data.append(serr) + if args.verbose: + print('DEBUG: infile: s0_0 = %g (%s, %s)' % \ + (s0_0, s0_lower, s0_upper), file=sys.stderr) + print('DEBUG: infile: rc_0 = %g (%s, %s)' % \ + (rc_0, rc_lower, rc_upper), file=sys.stderr) + print('DEBUG: infile: beta_0 = %g (%s, %s)' % \ + (beta_0, beta_lower, beta_upper), file=sys.stderr) + print('DEBUG: infile: c_0 = %g (%s, %s)' % \ + (c_0, c_lower, c_upper), file=sys.stderr) + + # get parameter initial values and bounds from command line arguments + if args.s0: + s0_0, s0_lower, s0_upper = get_parameter(args.s0) + if args.rc: + rc_0, rc_lower, rc_upper = get_parameter(args.rc) + if args.beta: + beta_0, beta_lower, beta_upper = get_parameter(args.beta) + if args.const: + c_0, c_lower, c_upper = get_parameter(args.const) + + if args.verbose: + print('DEBUG: final: s0_0 = %g (%s, %s)' % \ + (s0_0, s0_lower, s0_upper), file=sys.stderr) + print('DEBUG: final: rc_0 = %g (%s, %s)' % \ + (rc_0, rc_lower, rc_upper), file=sys.stderr) + print('DEBUG: final: beta_0 = %g (%s, %s)' % \ + (beta_0, beta_lower, beta_upper), file=sys.stderr) + print('DEBUG: final: c_0 = %g (%s, %s)' % \ + (c_0, c_lower, c_upper), file=sys.stderr) + # convert to numpy array r_data = np.array(r_data) rerr_data = np.array(rerr_data) s_data = np.array(s_data) serr_data = np.array(serr_data) - - if verbose: - print('DEBUG: s0_0 = %g, rc_0 = %g, beta_0 = %g, c_0 = %g' % \ - (s0_0, rc_0, beta_0, c_0), file=sys.stderr) - + # model parameters + par_names = ["s0", "rc", "beta", "c"] + # initial values par_0 = [s0_0, rc_0, beta_0, c_0] - - par_fit, cov_fit, s_fit = fit_beta_model(r_data, s_data, serr_data, - p0=par_0, cutmode=cutmode, cutvalue=cutvalue) + # parameter bounds + par_bounds = [(s0_lower, s0_upper), (rc_lower, rc_upper), + (beta_lower, beta_upper), (c_lower, c_upper)] + + ## 'fit_beta_model' do not support parameter bounds + par_fit, cov_fit, infodict = fit_model(beta_model, r_data, s_data, + serr_data, p0=par_0, cutmode=cutmode, cutvalue=cutvalue) + fvec = infodict['fvec'] + dof = infodict['dof'] + chisq = infodict['chisq'] + perr = infodict['perr'] print("# beta-model fitting results:", file=outfile) print("# s(r) = s0 * pow((1.0+(r/rc)^2), 0.5-3*beta) + c", file=outfile) - print("# s0 = %g\n# rc = %g\n# beta = %g\n# c = %g" % tuple(par_fit), + for i in range(len(par_names)): + print("# %s = %g +/- %g" % (par_names[i], par_fit[i], perr[i]), + file=outfile) + print("# chisq / dof = %g / %g = %g" % (chisq, dof, chisq/dof), file=outfile) print("# radius(input) brightness(fitted)", file=outfile) - for i in range(len(s_fit)): - print("%g %g" % (r_data[i], s_fit[i]), file=outfile) + for i in range(len(r_data)): + print("%g %g" % (r_data[i], fvec(r_data[i])), file=outfile) - if outfilename: + if args.outfilename: outfile.close() -USAGE = """Usage: - %(prog)s [ -h -c -o outfile ] -i infile - -Required arguments: - -i, --infile - input data file with the following *four* or *three* columns: - r, rerr, s, serr - r, s, serr - Note: the initial values for beta model paramters can also be - provided with the following syntax: - # s0_0 = ?? - # rc_0 = ?? - # beta_0 = ?? - # c_0 = ?? - -o, --outfile - output file to store the fitted data - if not provided, then print results to screen - -Optional arguments: - -h, --help - print this usage - -c, --cut-point - accept an integer number (n) - ignore the inner-most n data points - -n, --no-radius - accept a float number (r) - ignore the data points whose radius is less than r -""" % { 'prog': os.path.basename(sys.argv[0]) } - - -def usage(): - print(USAGE) - - if __name__ == '__main__': main() - |