# In[2]:
import pandas as pd
import numpy as np
import csv
import gc
import os
# In[14]:
# Make sure the folder that receives the labelled datasets exists.
directory = '../GeneInteractionsBN_Datasets/Labeled'
# exist_ok=True replaces the separate os.path.exists() check, which was
# race-prone (the directory could appear between the check and the create).
os.makedirs(directory, exist_ok=True)
# In[26]:
def label_pvalues(pvalues, positive_max=0.01, negative_min=0.5):
    """Map p-values to class labels.

    Args:
        pvalues: Array-like of numeric p-values (list, ndarray, Series).
        positive_max: Values ``<=`` this threshold are labelled ``1``.
        negative_min: Values ``>=`` this threshold are labelled ``0``.

    Returns:
        A NumPy integer array of the same length holding ``1``, ``0`` or
        ``-1``. ``-1`` marks everything that matches neither threshold,
        including NaN (both comparisons are false for NaN).
    """
    values = np.asarray(pvalues)
    # np.select picks the first matching condition, mirroring the original
    # "1 if ... else (0 if ... else -1)" precedence.
    return np.select(
        [values <= positive_max, values >= negative_min],
        [1, 0],
        default=-1,
    )


def label_file(source_path, output_dir):
    """Label one raw CSV file and write ``<stem>_Target.csv`` to *output_dir*.

    The input is read with ``;`` as separator and must contain a ``Pvalue``
    column. The output has an ``Index`` column (0-based row number) and a
    ``Target`` column.

    Returns:
        The number of rows labelled ``1`` or ``0`` (i.e. not ``-1``).
    """
    # Only the Pvalue column is used, so skip parsing the rest of the file
    # to keep memory low on large inputs.
    table = pd.read_csv(
        filepath_or_buffer=source_path, sep=';', usecols=['Pvalue']
    )
    labels = label_pvalues(table['Pvalue'])

    # Output name keeps everything before the FIRST dot of the file name,
    # as the original script did.
    stem = os.path.basename(source_path).split('.')[0]
    target_path = os.path.join(output_dir, stem + '_Target.csv')
    pd.DataFrame({'Target': labels}).to_csv(
        target_path, index=True, index_label='Index'
    )
    return int(np.count_nonzero(labels != -1))


def label_directory(raw_dir, output_dir):
    """Label every ``.csv`` file in *raw_dir* and report progress.

    For each file the input path and the number of usable (0/1) labels are
    printed. Files with any other extension are skipped.

    Returns:
        The total number of usable labels over all processed files.
    """
    os.makedirs(output_dir, exist_ok=True)
    labelled_total = 0
    # sorted() makes the processing/log order reproducible; os.listdir
    # returns entries in arbitrary order.
    for filename in sorted(os.listdir(raw_dir)):
        # The original also accepted ".py" files, which cannot hold the
        # expected "Pvalue" column and would abort the whole run.
        if not filename.endswith('.csv'):
            continue
        source_path = os.path.join(raw_dir, filename)
        print(source_path)
        labelled = label_file(source_path, output_dir)
        print(labelled)
        labelled_total += labelled
    return labelled_total


# __name__ is "__main__" both when run as a script and inside a notebook,
# so the cell still executes there; importing the module has no side effects.
if __name__ == "__main__":
    directory = '../GeneInteractionsBN_Datasets/DataGeneCausality/Raw/'
    total = label_directory(
        directory, '../GeneInteractionsBN_Datasets/Labeled/'
    )
    print(total)
# In[ ]:
# In[ ]: