In [7]:
using DataFrames
# Read the IC50 table (path below) into a DataFrame; `header=true` tells
# `readtable` that the first line of the file holds the column names.
X = readtable("../data/chembl_19_mf1/chembl-IC50-10targets.csv", header=true)
# Rename the columns :row and :col to :compound and :target, in place.
rename!(X, [:row, :col], [:compound, :target])
Out[7]:
In [8]:
# Overwrite the :value column with its base-10 logarithm.
# NOTE(review): assumes every entry of :value is strictly positive — confirm.
X[:, :value] = log10(X[:, :value])
Out[8]:
In [9]:
# Draw the row indices of a 20% hold-out set, sampled without replacement.
# NOTE(review): no RNG seed is set in the visible cells, so the selection
# may differ between runs — confirm whether that is intended.
n_obs = size(X, 1)
n_holdout = int(floor(20/100 * n_obs))
idx = sample(1:n_obs, n_holdout; replace=false)
Out[9]:
In [11]:
# Inspect the hold-out size: 20% of the number of rows in X, rounded down.
int(floor(0.2 * size(X, 1)))
Out[11]:
In [12]:
# Select the sampled rows (all columns) of X and convert them from a
# DataFrame to a plain array via the legacy DataFrames `array` function.
# NOTE(review): the element type of the result depends on the column types
# of X, which are not visible here — confirm before relying on it.
probe_vec = array(X[idx,:])
Out[12]:
In [13]:
# Flag each row of probe_vec whose third column lies below log10(200).
# NOTE(review): presumably column 3 is the log10-transformed :value
# column — confirm against the column order of X.
log_cutoff = log10(200)
ratings_test = probe_vec[:, 3] .< log_cutoff
Out[13]:
In [ ]: