In [3]:
import celerite
from celerite import terms
import cPickle as pickle
import numpy as np
import matplotlib.pyplot as plt
from scipy.optimize import minimize
# Speed of light; xi_to_v / v_to_xi use it to convert between a velocity and a
# shift in ln(wavelength).
c = 2.99792458e8 # m/s
Construct the data:
In [4]:
# Load the pickled spectra. Later cells index each entry as entry[0]
# (ln wavelength, compared against np.log(...) bounds), entry[1] (flux) and
# entry[2] (flux uncertainty -- presumably; TODO confirm against the writer).
# SECURITY NOTE: pickle.load can execute arbitrary code -- only load files you trust.
with open("binary_data.p", "rb") as data_file:
    # The context manager closes the file handle, which the bare open() call leaked.
    data = pickle.load(data_file)
print(len(data))
In [5]:
# Build `subset`: for every 10th epoch keep only the pixels inside the
# ln(wavelength) window and convert the flux to log-flux.
# (Window limits are presumably in Angstroms -- TODO confirm.)
wave_lo = np.log(4680.)
wave_hi = np.log(4700.)
subset = []
# Use range(len(data)) instead to keep every epoch; the stride of 10 must stay
# in sync with the `i*10` indexing used when reading the pipeline RVs.
for i in range(0, len(data), 10):
    m = (data[i][0] > wave_lo) & (data[i][0] < wave_hi)
    x = np.copy(data[i][0][m])
    y = np.log(np.copy(data[i][1][m]))
    # First-order error propagation: sigma(ln f) ~= sigma(f) / f.
    yerr = np.copy(data[i][2][m]/data[i][1][m])
    # Fix: the epoch was never stored, leaving `subset` empty for every later
    # cell. Downstream code reads each entry as (x, y, yerr) via d[0], d[1], d[2].
    subset.append((x, y, yerr))
Set up the GP:
In [6]:
# celerite RealTerm takes (log_a, log_c); per the celerite docs this is the
# exponential kernel k(tau) = a * exp(-c * tau). Initial values here are
# a = 0.04 and c = 1/0.001. log_a is bounded to within a factor of 100 either
# side of 0.04; log_c is left unbounded.
kernel = terms.RealTerm(np.log(0.04), -np.log(0.001), bounds=((np.log(.01*0.04),np.log(100.*0.04)),(None, None)))
# NOTE(review): the GP constructor call below is cut off in this copy of the
# notebook (remaining arguments and closing parenthesis are missing). Restore
# it from the original notebook before running -- TODO confirm the arguments.
gp = celerite.GP(kernel,
In [7]:
Set up for marginalization of the scales:
In [8]:
# Design matrix for the per-epoch additive scales: one row per data point (in
# flattened, epoch-after-epoch order) and one column per epoch, with a 1 in the
# column of the epoch that the point belongs to.
nepoch = len(subset)
ndata_byepoch = [len(d[0]) for d in subset]
eye = np.identity(nepoch)
# Repeat row i of the identity once for every data point of epoch i.
design = np.repeat(eye, ndata_byepoch, axis=0)
print(design.shape)
print(design)
Set up the minimization:
In [9]:
def shift_and_flatten(xis, data):
    """Shift each epoch's x-axis by its own offset and flatten all epochs.

    Parameters
    ----------
    xis : sequence of float
        One shift per epoch; ``xis[i]`` is subtracted from ``data[i][0]``.
    data : sequence
        One entry per epoch, each indexable as ``(x, y, yerr)`` where the
        three items are 1-D arrays of the same length.

    Returns
    -------
    x, y, yerr : numpy.ndarray
        Flat float arrays holding the epochs one after another in input
        order. ``x`` is shifted; ``y`` and ``yerr`` are copied unchanged.
        The output is NOT sorted in ``x``.
    """
    # Compute the per-epoch lengths once and reuse them for both the
    # allocation and the fill loop.
    lengths = [len(d[0]) for d in data]
    ndata = sum(lengths)
    x = np.empty(ndata)
    y = np.empty(ndata)
    yerr = np.empty(ndata)
    start = 0
    for i, (d, length) in enumerate(zip(data, lengths)):
        stop = start + length
        x[start:stop] = d[0] - xis[i]
        y[start:stop] = d[1]
        yerr[start:stop] = d[2]
        start = stop
    return x, y, yerr
In [10]:
def set_params(params):
    """Apply a parameter vector and solve for the per-epoch scales.

    ``params`` is laid out as ``[xi_0, ..., xi_{N-1}, gp parameters...]``
    with ``N = len(subset)``. Relies on the module-level ``subset``,
    ``design`` and ``gp`` objects.

    Steps:
      1. Shift every epoch by its ``xi`` and flatten, then sort by ``x``
         (the GP is computed on the sorted coordinates).
      2. Push the GP hyper-parameters into ``gp`` and factorise it.
      3. Solve the generalised least-squares problem
         ``(A^T K^-1 A) s = A^T K^-1 y`` for the per-epoch scales ``s``.
      4. Subtract each point's epoch scale from ``y``.

    Returns
    -------
    scales : numpy.ndarray
        One additive offset per epoch.
    xis : the first ``len(subset)`` entries of ``params``.
    y : numpy.ndarray
        Scale-subtracted data, ordered by increasing shifted ``x``.
    """
    nepoch = len(subset)
    xis, gp_par = params[:nepoch], params[nepoch:]
    x, y, yerr = shift_and_flatten(xis, subset)
    inds = np.argsort(x)
    x = x[inds]
    y = y[inds]
    yerr = yerr[inds]
    # Fancy indexing already returns a copy, so `design` itself is untouched.
    A = design[inds, :]
    # Fix: the GP parameters were split off but never applied, so the
    # optimiser's changes to them had no effect on the likelihood.
    gp.set_parameter_vector(gp_par)
    gp.compute(x, yerr)
    # Fix: restored the A^T factors that were missing from this expression.
    Kinv_A = gp.apply_inverse(A)
    Kinv_y = gp.apply_inverse(y)
    scales = np.linalg.solve(np.dot(A.T, Kinv_A), np.dot(A.T, Kinv_y))
    ndata_byepoch = [len(d[0]) for d in subset]
    # Per-point offsets are built in flattened (epoch) order, then permuted
    # with `inds` to line up with the x-sorted `y`.
    y -= np.repeat(scales, ndata_byepoch)[inds]
    return scales, xis, y
In [11]:
def nll(params):
    """Objective for the optimiser: negative GP log-likelihood plus 0.5.

    The constant 0.5 is what remains of a disabled quadratic penalty,
    ``1./2. * np.sum(xis**2)``; it does not move the minimum.
    """
    _scales, _xis, resid = set_params(params)
    log_like = gp.log_likelihood(resid)
    return 0.5 - log_like
In [12]:
def xi_to_v(xi):
    """Convert a Doppler shift in ln(wavelength) to a velocity in m/s.

    Computes ``v = c * tanh(xi)`` using the module-level ``c``.
    """
    beta = np.tanh(xi)
    return beta * c
def v_to_xi(v):
    """Convert a velocity in m/s to a Doppler shift in ln(wavelength).

    Inverse of ``xi_to_v``: ``xi = arctanh(v / c)`` with the module-level ``c``.
    """
    beta = v/c
    return np.arctanh(beta)
In [13]:
# Read the pipeline RVs to seed the per-epoch shifts.
# Fix: the module name was missing from this import; readsav (the IDL .sav
# reader) lives in scipy.io.
from scipy.io import readsav
print(len(subset))
# NOTE(review): absolute, machine-specific path -- consider a configurable DATA_DIR.
data_dir = "/Users/mbedell/Documents/Research/HARPSTwins/Results/"
pipeline = readsav(data_dir+'HIP14501_result.dat')
xis0 = np.empty(len(subset))
rvs = np.empty(len(subset))
dates = np.empty(len(subset))
for i in range(len(subset)):
    # `subset` holds every 10th epoch, hence the i*10 index into the pipeline arrays.
    # The factor 1e3 presumably converts km/s to m/s -- TODO confirm.
    rvs[i] = pipeline.rv[i*10] * 1.e3
    xis0[i] = v_to_xi(rvs[i])
    # Fix: the right-hand side had lost its array name (syntax error).
    # NOTE(review): `pipeline.date` is a reconstruction -- confirm the field
    # name against the .sav file.
    dates[i] = pipeline.date[i*10]
#xis0 = np.zeros(len(subset))
print(rvs)
print(xis0)
In [14]:
# Starting point for the optimiser: the pipeline-derived shifts followed by the
# GP's current parameter vector.
p0 = np.concatenate([xis0, gp.get_parameter_vector()])
print(p0)
# Every shift is boxed to +/-1e-4 in ln(wavelength); the GP parameters keep the
# bounds declared on the kernel.
bounds = [(-1e-4, 1e-4) for d in subset] + gp.get_parameter_bounds()
print(bounds)
# Evaluate once at the starting point so scales / xis / y exist before the fit.
scales, xis, y = set_params(p0)
In [15]:
# Bounded quasi-Newton fit of the objective, then re-evaluate at the optimum so
# that scales / xis / y describe the best-fit state.
soln = minimize(nll, p0, method='L-BFGS-B', bounds=bounds)
scales, xis, y = set_params(soln.x)
In [17]:
# Optimiser report, then the fitted shifts expressed as velocities in m/s.
print(soln)
print(xi_to_v(xis))
In [34]:
# Overplot every epoch after removing its fitted shift and scale.
fig, ax = plt.subplots(figsize=(12, 4))
for i, d in enumerate(subset):
    ax.plot(d[0] - xis[i], d[1] - scales[i])
Check out the prediction:
In [35]:
def prediction(params):
    """Return the GP prediction for every epoch at the given parameters.

    The GP is evaluated on the x-sorted, scale-subtracted data produced by
    ``set_params``. The result is permuted back to the flattened
    (epoch-after-epoch) order, cut into one array per epoch, and each
    epoch's scale is added back.

    Returns
    -------
    list of numpy.ndarray
        One array per entry of the module-level ``subset``.
    """
    scales, xis, y = set_params(params)
    mu_sorted = gp.predict(y, return_cov=False)
    # Rebuild the sort order used inside set_params so it can be inverted.
    x_flat, _, _ = shift_and_flatten(xis, subset)
    order = np.argsort(x_flat)
    mu_flat = mu_sorted[np.argsort(order)]
    result = []
    start = 0
    for i, d in enumerate(subset):
        stop = start + len(d[0])
        result.append(mu_flat[start:stop] + scales[i])
        start = stop
    return result
In [36]:
# Per-epoch GP prediction (a list with one array per epoch) at the best-fit
# parameters found by the optimiser.
mu = prediction(soln.x)
In [37]:
# Dump the per-epoch predictions.
print(mu)
In [18]:
# Data (black) against the GP prediction (red) for each epoch, on a linear
# wavelength axis.
fig, ax = plt.subplots(figsize=(12, 4))
for i, d in enumerate(subset):
    wavelength = np.exp(d[0])
    ax.plot(wavelength, d[1], color='black')
    ax.plot(wavelength, mu[i], color='red')
In [39]:
# Flux residuals (data minus model, both exponentiated out of log space), with
# each epoch offset vertically by 1000 so the curves do not overlap.
fig, ax = plt.subplots(figsize=(12, 4))
for i, d in enumerate(subset):
    resid = np.exp(d[1]) - np.exp(mu[i])
    ax.plot(d[0], resid + 1000*i, color='black')
In [55]:
# Compare the pipeline RVs (all epochs) with the RVs recovered from the fitted
# shifts (the sub-sampled epochs only).
# Fix: the first scatter call had lost its x argument (syntax error).
# NOTE(review): `pipeline.date` is a reconstruction -- confirm the field name.
plt.scatter(pipeline.date, pipeline.rv*1.e3, color='black', label='HARPS RVs')
plt.scatter(dates, xi_to_v(xis), color='red', label='Avast RVs')
plt.ylabel('RV (m/s)')
# The label= values above are only shown once a legend is drawn.
plt.legend()
In [68]:
# Scratch check of how velocity offsets map into ln(wavelength) shifts: two
# velocity ladders with the same 1 m/s spacing, one starting at 2000 m/s and
# one at 0 m/s.
rvs2 = np.arange(5)
rvs1 = np.arange(5) + 2000.
xis1 = v_to_xi(rvs1)
xis2 = v_to_xi(rvs2)
# Difference between the two ladders once each is referenced to its first entry.
print((xis1 - xis1[0]) - (xis2 - xis2[0]))
# NOTE(review): this mixes xis2 with the xis1 reference point -- presumably
# intentional for the experiment; confirm.
print(xi_to_v(xis2 - xis1[0]))
In [ ]: