In [13]:
import pandas as pd
In [66]:
# Read the three header-less PBE tables in one pass. Later cells label them
# as per-atom x/y/z columns (X), a single energy column (Y) and per-atom
# "q" columns (q).
x_pbe, y_pbe, z_pbe = (
    pd.read_csv(csv_name, header=None)
    for csv_name in ('X_pbe.csv', 'Y_pbe.csv', 'q_pbe.csv')
)
In [67]:
# Show (n_rows, n_columns) of the raw X and q tables before any columns
# are removed.
for raw_table in (x_pbe, z_pbe):
    print(raw_table.shape)
In [68]:
# Preview the first five raw rows (five is the pandas default for head()).
x_pbe.head(n=5)
Out[68]:
In [69]:
# Discard every fourth column label starting at 0 (0, 4, ..., 28): eight
# columns in total.
# NOTE(review): presumably these hold atom labels / a trailing empty field
# rather than coordinates -- confirm against X_pbe.csv.
# This cell rebinds x_pbe, so re-running it after the columns were dropped
# or renamed raises a KeyError; restart from the load cell instead.
rm_col = range(0, 32, 4)
x_pbe = x_pbe.drop(labels=rm_col, axis='columns')
x_pbe.shape
Out[69]:
In [70]:
# Label the remaining 21 columns as <atom><axis>, atom-major:
# C1x, C1y, C1z, H1x, ..., Nx, Ny, Nz.
x_pbe.columns = list(
    atom + axis
    for atom in ('C1', 'H1', 'H2', 'H3', 'H4', 'C2', 'N')
    for axis in 'xyz'
)
In [71]:
# Name the single column of the Y table; pandas raises ValueError here if
# y_pbe does not have exactly one column.
y_pbe.columns=['energy_pbe']
In [72]:
# Even column labels 0, 2, ..., 14 -- the eight columns removed from the
# q table in the next cell. rm_col is also (re)assigned by the X-table
# cells, so run this cell immediately before the q-table drop.
rm_col = range(0, 16, 2)
In [73]:
# Remove the columns listed in rm_col (expected to be the even labels set
# in the previous cell) and preview the first five remaining rows.
z_pbe = z_pbe.drop(labels=rm_col, axis='columns')
z_pbe.head(n=5)
Out[73]:
In [74]:
# Label the seven remaining columns as <atom>q, in the same atom order used
# for the coordinate columns.
z_pbe.columns = list(
    atom + 'q' for atom in ('C1', 'H1', 'H2', 'H3', 'H4', 'C2', 'N')
)
In [75]:
# Place the coordinate, q and energy columns side by side (aligned on the
# row index), in that order, then preview the first five rows.
xzy_pbe = pd.concat(objs=[x_pbe, z_pbe, y_pbe], axis=1)
xzy_pbe.head(n=5)
Out[75]:
In [76]:
# Keep the first occurrence of each fully identical row; drop_duplicates
# returns a new frame by default, so xzy_pbe itself is left untouched.
xzy_pbe_u = xzy_pbe.drop_duplicates()
In [77]:
# Compare row counts before and after de-duplication.
# Uses the print() call form, like the other cells, so the cell also runs
# under Python 3 (the bare print statement is a SyntaxError there); the
# printed text is the same under Python 2.
print(xzy_pbe.shape)
print(xzy_pbe_u.shape)
In [78]:
# Read the two header-less B3LYP tables; later cells label them as per-atom
# x/y/z columns (X) and a single energy column (Y).
x_b3lyp, y_b3lyp = (
    pd.read_csv(csv_name, header=None)
    for csv_name in ('X_b3lyp.csv', 'Y_b3lyp.csv')
)
In [79]:
# Show (n_rows, n_columns) of the raw B3LYP X and Y tables.
for raw_table in (x_b3lyp, y_b3lyp):
    print(raw_table.shape)
In [80]:
# Same column removal as for the PBE X table: discard labels 0, 4, ..., 28
# (eight columns).
# Re-running this cell after the drop or the rename raises a KeyError
# because x_b3lyp is rebound in place.
rm_col = range(0, 32, 4)
x_b3lyp = x_b3lyp.drop(labels=rm_col, axis='columns')
x_b3lyp.shape
Out[80]:
In [81]:
# Use exactly the same <atom><axis> labels as the PBE coordinate table so
# the two frames can later be merged on these columns.
x_b3lyp.columns = list(
    atom + axis
    for atom in ('C1', 'H1', 'H2', 'H3', 'H4', 'C2', 'N')
    for axis in 'xyz'
)
In [82]:
# Name the single column of the B3LYP Y table; pandas raises ValueError
# here if y_b3lyp does not have exactly one column.
y_b3lyp.columns=['energy_b3lyp']
In [83]:
# Put the B3LYP coordinate columns and the energy column side by side,
# aligned on the row index.
xy_b3lyp = pd.concat(objs=[x_b3lyp, y_b3lyp], axis=1)
In [84]:
# Preview the first five rows of the combined B3LYP frame.
xy_b3lyp.head(n=5)
Out[84]:
In [87]:
# Drop fully identical rows (first occurrence kept; xy_b3lyp is not
# modified), then report the shape before and after.
xy_b3lyp_u = xy_b3lyp.drop_duplicates()
for table in (xy_b3lyp, xy_b3lyp_u):
    print(table.shape)
In [94]:
# Join keys = every column except the last eight. Given how xzy_pbe was
# assembled (coordinates, then seven "q" columns, then energy_pbe), this
# leaves the 21 coordinate columns.
jcols = xzy_pbe_u.columns[:-8].tolist()
print(jcols)
In [97]:
# Right join on the coordinate columns: every de-duplicated B3LYP row is
# kept, and the PBE "q"/energy columns are attached where all key values
# match exactly; B3LYP rows without a PBE match get NaN in those columns.
# NOTE(review): the keys are values parsed from CSV (presumably floats), so
# matching relies on exact equality -- confirm both files were written with
# the same precision.
#
# suffixes is (left, right): the left frame is PBE and the right frame is
# B3LYP, so the labels must be in that order. Suffixes are only applied to
# overlapping non-key column names; there are none with the current
# columns, so the output is unchanged, but any future overlap is now
# labelled correctly.
xy = xzy_pbe_u.merge(
    right=xy_b3lyp_u,
    how='right',
    on=jcols,
    suffixes=('_pbe', '_b3lyp'),
)
print(xy.shape)
xy.head()
Out[97]:
In [98]:
# List the merged frame's column names as a plain Python list.
print(xy.columns.tolist())
In [99]:
# Persist the merged table to the working directory. The row index is
# written as the first (unnamed) column because to_csv defaults to
# index=True.
xy.to_csv(path_or_buf='pbe_b3lyp_partQ.csv')
In [ ]: