# run_fit.py (forked from GalacticDynamics-Oxford/GaiaTools)
# whether to account for spatially correlated systematic errors when estimating the uncertainty on mean PM
use_systematic_error = True
# get_mean_pm is needed both in the systematic-error branch and for the mean parallax
# computed in the purely statistical branch, so import it unconditionally
import get_mean_pm
import numpy, scipy.optimize
try:
    # the autograd module computes the Hessian of the log-likelihood function
    # exactly, by automatic differentiation
    import autograd
    log = autograd.numpy.log
    exp = autograd.numpy.exp
except ImportError:
    # without autograd the statistical uncertainties (from the inverse Hessian) cannot be
    # computed; however, if use_systematic_error==True, the uncertainties on the mean PM
    # are obtained by a different method that does not need autograd anyway
    autograd = None
    log = numpy.log
    exp = numpy.exp
filein = open("input.txt", "r")
fileout = open("result.txt", 'w')
for linein in filein:
    # parse the input file (one line per cluster); comment lines are copied to the output unchanged
    if linein[0] == '#':
        fileout.write(linein)
        continue
    line = linein.strip().split()
    name = line[0]
    ra0   = float(line[1])   # cluster center RA [degrees]
    dec0  = float(line[2])   # cluster center Dec [degrees]
    dist  = float(line[3])   # distance [kpc]
    vdisp = float(line[7])   # line-of-sight velocity dispersion [km/s]
    rmax  = float(line[8])   # radius of the region around the cluster to consider [arcmin]
    pmra0 = float(line[9])   # initial guess for the cluster PMra [mas/yr]
    pmdec0= float(line[10])  # same for PMdec
    # read the data file previously retrieved from the Gaia archive
    data  = numpy.load('data/'+name+'.npz')
    ra    = data['ra'].astype(float)
    dec   = data['dec'].astype(float)
    pmra  = data['pmra'].astype(float)
    pmdec = data['pmdec'].astype(float)
    pmrae = data['pmra_error'].astype(float)
    pmdece= data['pmdec_error'].astype(float)
    pmcorr= data['pmra_pmdec_corr'].astype(float)
    plx   = data['parallax'].astype(float)
    plxe  = data['parallax_error'].astype(float)
    bprp  = data['bp_rp']
    gmag  = data['phot_g_mean_mag']
    ruwe  = data['ruwe']
    aen   = data['astrometric_excess_noise']
    # colour-dependent global trend of the BP/RP flux excess factor
    penn  = numpy.where(bprp<0.5, 1.1544 + 0.0338*bprp + 0.0323*bprp**2,
            numpy.where(bprp<4.0, 1.1620 + 0.0115*bprp + 0.0493*bprp**2 - 0.00588*bprp**3,
            1.0576 + 0.1405*bprp))
    pen   = data['phot_bp_rp_excess_factor'] - penn   # excess factor minus the global trend
    pens  = pen / (0.006 + 8.8e-12 * gmag**7.62)      # normalized by its magnitude-dependent 1-sigma scatter
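    # (these coefficients appear to be rounded versions of the corrected BP/RP flux excess
    # factor C* and its 1-sigma scatter from Riello et al. 2021 for Gaia EDR3)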
    # coordinate transformation from the sky to the tangent plane (orthographic projection)
    sin = numpy.sin
    cos = numpy.cos
    d2r = numpy.pi/180   # degrees to radians
    x   = (cos(dec * d2r) * sin((ra-ra0) * d2r)) / d2r   # x,y are in degrees
    y   = (sin(dec * d2r) * cos(dec0 * d2r) - cos(dec * d2r) * sin(dec0 * d2r) * cos((ra-ra0) * d2r)) / d2r
    # transformation of the PM and its uncertainty covariance matrix to the tangent plane
    Jxa =  cos((ra-ra0) * d2r)
    Jxd = -sin(dec * d2r) * sin((ra-ra0) * d2r)
    Jya =  sin(dec0 * d2r) * sin((ra-ra0) * d2r)
    Jyd =  cos(dec * d2r) * cos(dec0 * d2r) + sin(dec * d2r) * sin(dec0 * d2r) * cos((ra-ra0) * d2r)
    mx  = pmra * Jxa + pmdec * Jxd
    my  = pmra * Jya + pmdec * Jyd
    Cxx = (Jxa * pmrae)**2 + (Jxd * pmdece)**2 + 2 * Jxa * Jxd * pmcorr * pmrae * pmdece
    Cyy = (Jya * pmrae)**2 + (Jyd * pmdece)**2 + 2 * Jya * Jyd * pmcorr * pmrae * pmdece
    Cxy = Jxa * Jya * pmrae**2 + Jxd * Jyd * pmdece**2 + (Jya * Jxd + Jxa * Jyd) * pmcorr * pmrae * pmdece
    mxe = Cxx**0.5
    mye = Cyy**0.5
    mcorr = Cxy / (mxe * mye)
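    # equivalently, in matrix form: (mx,my) = J (pmra,pmdec) and C' = J C J^T, where
    # J = [[Jxa,Jxd],[Jya,Jyd]] and C is the Gaia PM covariance matrix built from
    # pmrae, pmdece and pmcorr; the expressions above are these products written out element-wise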
    rdist = (x**2 + y**2)**0.5 * 60.   # distance from the cluster center [arcmin]
    # apply various quality filters
    filt  = (rdist < rmax)                # distance filter
    filt *= (pmra**2 + pmdec**2 < 30**2)  # eliminate spuriously large PM
    filt *= (ruwe < 1.2) * (aen < 1.0)    # eliminate sources with unreliable astrometry (high RUWE or excess noise)
    filt *= pens < 3.0                    # filter on photometric excess (mostly faint sources in crowded regions)
    if numpy.sum(filt) < 50 or name in ['Liller_1', 'VVV_CL002', 'UKS_1', 'Ryu_879_RLGC2']:
        filt |= True   # disable all filters, since otherwise too few sources remain
    # filtered PM and their uncertainty covariance matrices for each star
    # (for simplicity, refer to them as "x,y", not "ra,dec")
    errmul = 1.1   # inflate the statistical uncertainties by this factor
    star_pmra  = pmra  [filt]
    star_pmdec = pmdec [filt]
    star_covrr = (pmrae [filt] * errmul)**2
    star_covdd = (pmdece[filt] * errmul)**2
    star_covrd = pmcorr[filt] * (star_covrr * star_covdd)**0.5
    star_rdist = rdist [filt]
    # center and variance of the PM distribution of field stars (initially estimated from all stars)
    field_pmra0  = numpy.mean(star_pmra)
    field_pmdec0 = numpy.mean(star_pmdec)
    field_covrr0 = numpy.var (star_pmra)
    field_covdd0 = numpy.var (star_pmdec)
    # same for cluster stars (the initial guess for the center comes from the input file,
    # and the initial PM dispersion - more precisely, standard deviation - is converted
    # from the line-of-sight velocity dispersion)
    clust_pmra0  = pmra0
    clust_pmdec0 = pmdec0
    clust_disp0  = vdisp / dist / 4.74
    # initial guess for the parameters of the Gaussian mixture likelihood function
    params = numpy.array([
        clust_pmra0, clust_pmdec0,      # [0-1] = center of 0th component (cluster) in the PM space
        field_pmra0, field_pmdec0,      # [2-3] = center of 1st component (field)
        field_covrr0, field_covdd0, 0,  # [4-6] = covariance matrix of 1st component (xx, yy, xy)
        0.5,                            # [7]   = weight of 0th component
        0.5,                            # [8]   = Plummer scale radius of the cluster, normalized to rmax
        clust_disp0                     # [9]   = PM dispersion of cluster stars
    ])
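    # all PM quantities are in mas/yr (1 km/s at a distance of 1 kpc corresponds to
    # 1/4.74 mas/yr), and the scale radius [8] is dimensionless, in units of rmax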
    def eval_model(params, give_prob=False):
        """
        Construct a mixture model with the given parameters and evaluate the distribution function
        of both the cluster and the field component for each star.
        This function is used in two different contexts:
        if give_prob==False, return -ln(likelihood) - used in the minimizer;
        otherwise, return the array of posterior probabilities of cluster membership for each star.
        """
        clust_pmra, clust_pmdec, field_pmra, field_pmdec, field_covrr, field_covdd, field_covrd, \
            clust_weight, clust_rscale_mult, clust_disp = params
        # Plummer scale radius of the cluster
        clust_rscale = clust_rscale_mult * rmax
        # scale radius of the PM dispersion profile - assumed to be a fixed fraction of rscale
        clust_rsigma = clust_rscale * 0.5
        # number of cluster members within the circle of radius rmax
        clust_count = len(star_rdist) * clust_weight
        # same for field stars
        field_count = len(star_rdist) - clust_count
        # sanity checks on the parameter ranges
        if clust_count <= 2 or field_count <= 0 or clust_rscale <= 0 or clust_disp <= 0 or \
                field_covrr <= 0 or field_covdd <= 0 or field_covrd**2 >= field_covrr*field_covdd:
            return numpy.inf
        # spatially dependent squared PM dispersion of cluster stars (diagonal elements of the covariance matrix)
        clust_covar = clust_disp**2 / (1 + (star_rdist / clust_rsigma)**2)**0.5
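        # i.e. sigma^2(r) = clust_disp^2 / sqrt(1 + (r/clust_rsigma)^2): the dispersion equals
        # clust_disp at the cluster center and declines with projected radius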
# offset between PM of each star and the mean PM of the cluster
clust_pmra -= star_pmra
clust_pmdec -= star_pmdec
# covariance matrices of each star as if it were a cluster member
clust_covrr = star_covrr + clust_covar
clust_covdd = star_covdd + clust_covar
clust_covrd = star_covrd
# determinants of these covariance matrices for each star
clust_det = clust_covrr * clust_covdd - clust_covrd**2
# same for each star as if it were a field star
field_pmra -= star_pmra
field_pmdec -= star_pmdec
field_covrr += star_covrr
field_covdd += star_covdd
field_covrd += star_covrd
field_det = field_covrr * field_covdd - field_covrd**2
# amplitude of the surface density of cluster stars (spatially dependent)
clust_ampl = clust_count
# value of the distribution function of the 0th component (cluster) for each star,
# including the spatially-dependent prior multiplying factor
clust_distr = clust_count * \
(1 + (rmax / clust_rscale)**2) * (1 + (star_rdist / clust_rscale)**2)**-2 * \
clust_det**-0.5 * exp( -0.5 / clust_det * (
clust_pmra**2 * clust_covdd +
clust_pmdec**2 * clust_covrr -
2 * clust_pmra * clust_pmdec * clust_covrd) )
# same for the 1st component (field)
field_distr = field_count * \
field_det**-0.5 * exp( -0.5 / field_det * (
field_pmra**2 * field_covdd +
field_pmdec**2 * field_covrr -
2 * field_pmra * field_pmdec * field_covrd) )
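        # note that normalization constants common to both components (the factor 1/(2*pi)
        # of the Gaussians and 1/(pi*rmax^2) of the spatial profiles) are omitted:
        # they shift ln(likelihood) only by a constant and cancel in the membership probability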
        if give_prob:
            # return the posterior probability of cluster membership for each star
            return numpy.nan_to_num(clust_distr / (clust_distr + field_distr))
        else:
            # return the total log-likelihood of the model
            # (the builtin sum is presumably used instead of numpy.sum to stay compatible with autograd)
            result = sum(log(clust_distr + field_distr))
            # a soft prior discourages the PM dispersion and the scale radius from growing too large
            prior = -exp( 5 * (clust_disp/clust_disp0 - 1) ) - exp( 5 * (clust_rscale/rmax - 0.75) )
            return -(result + prior)   # return minus log-likelihood, the function to be minimized
    # minimization of minus log-likelihood: perform several runs of the Nelder-Mead algorithm,
    # each time restarting from the previous best-fit point, until the improvement becomes negligible
    llprev = numpy.inf
    params = scipy.optimize.minimize(eval_model, params, method='Nelder-Mead').x
    llcurr = eval_model(params)
    while llcurr < llprev - 0.1:
        params = scipy.optimize.minimize(eval_model, params, method='Nelder-Mead').x
        llprev = llcurr
        llcurr = eval_model(params)
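    # (each restart re-initializes the simplex around the current best point: Nelder-Mead
    # often terminates once the simplex has shrunk, before the true minimum is reached)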
    # final values of the best-fit parameters
    clust_pmra, clust_pmdec, field_pmra, field_pmdec, field_covrr, field_covdd, field_covrd, \
        clust_weight, clust_rscale_mult, clust_disp = params
    clust_rscale = clust_rscale_mult * rmax
    clust_rsigma = clust_rscale * 0.5
    # estimate the uncertainty covariance matrix of all model parameters from the inverse Hessian,
    # which is computed by automatic differentiation (if available)
    covmat = numpy.zeros((len(params), len(params)))
    if autograd is not None:
        hessian = autograd.hessian(eval_model)(params)
        if not numpy.any(numpy.isnan(hessian)):
            try: covmat = numpy.linalg.inv(hessian)
            except numpy.linalg.LinAlgError: print("Hessian matrix is singular")
        else: print("Hessian matrix contains invalid elements")
    clust_pmrae  = covmat[0,0]**0.5
    clust_pmdece = covmat[1,1]**0.5
    clust_pmcorr = covmat[0,1] / (covmat[0,0]*covmat[1,1] + 1e-200)**0.5   # tiny floor avoids 0/0 when covmat is all zeros
    # evaluate the membership probability for each star
    memberprob = numpy.zeros(len(pmra))   # zero for stars that did not pass the initial filters
    memberprob[filt] = eval_model(params, give_prob=True)
    memberprob[memberprob < 1e-6] = 0.
    # optional: estimate the uncertainty of the mean PM taking into account systematic errors
    if use_systematic_error:
        # select stars that likely belong to the cluster (probabilistic membership cannot be used at this stage)
        filtprob = memberprob >= 0.8
        maxused  = 2000   # limit the number of stars used, since the cost scales as N^3
        if numpy.sum(filtprob) > maxused:
            filtprob *= gmag < numpy.sort(gmag[filtprob])[maxused]   # retain only the brightest maxused stars
        # use the routine from the supplementary module to compute the mean PM and its uncertainty
        result = get_mean_pm.get_mean_pm(ra[filtprob], dec[filtprob], pmra[filtprob], pmdec[filtprob],
            pmrae[filtprob], pmdece[filtprob], pmcorr[filtprob],
            sigma=clust_disp, rsigma=clust_rsigma, covfnc=get_mean_pm.covfncpm)
        # adopt these values if the uncertainty is larger than the one inferred without accounting for systematics
        if result[2] + result[3] > clust_pmrae + clust_pmdece:
            clust_pmra  = result[0]
            clust_pmdec = result[1]
            clust_pmrae = result[2]
            clust_pmdece= result[3]
            clust_pmcorr= result[4]
        # also compute the mean parallax, accounting for correlated systematics
        clust_plx, clust_plxe = get_mean_pm.get_mean_plx(
            ra[filtprob], dec[filtprob], plx[filtprob], plxe[filtprob],
            covfnc=get_mean_pm.covfncplx, gmag=gmag[filtprob])
    else:   # compute the mean parallax with only statistical uncertainties
        clust_plx, clust_plxe = get_mean_pm.get_mean_plx(ra, dec, plx, plxe)
    # finally, write the summary results for this cluster to the output file and print them to the screen
    print("%s: Total=%d, PMfilt=%.1f, PMra=%.3f +- %.3f, PMdec=%.3f +- %.3f, corr=%.3f, rscale=%.2f, PMdisp=%.3f" %
        (name, numpy.sum(filt), numpy.sum(memberprob), clust_pmra, clust_pmrae, clust_pmdec, clust_pmdece, clust_pmcorr, clust_rscale, clust_disp))
    line = ["%-15s" % name] + ['%7s' % item for item in line[1:9]] + [
        "%7.3f" % clust_pmra,
        "%7.3f" % clust_pmdec,
        "%7.3f" % clust_plx,
        "%7.3f" % clust_pmrae,
        "%7.3f" % clust_pmdece,
        "%7.3f" % clust_pmcorr,
        "%7.3f" % clust_plxe ]
    fileout.write("\t".join(line) + "\n")
    fileout.flush()
    # write the data for all stars of this cluster into a text file
    numpy.savetxt('data/'+name+'.txt', numpy.column_stack((
        ra, dec, x, y, pmra, pmdec, pmrae, pmdece, pmcorr,
        gmag, bprp, filt, memberprob)), fmt='%.4f %.4f' + ' %.6g'*11,
        header='ra dec x y pmra pmdec pmra_e pmdec_e pm_corr g_mag bp_rp filter memberprob')
filein.close()
fileout.close()