In [1]:
import os
from gensim import corpora, models, similarities
# File name of the previously saved similarity index; it is resolved relative
# to the notebook's working directory.
lsi_matsim_fname = "lsi-matsim.save"

# Restore the saved MatrixSimilarity index instead of rebuilding it.
# NOTE(review): gensim persistence is pickle-based according to its docs --
# only load index files from a trusted origin.
matsim = similarities.MatrixSimilarity.load(lsi_matsim_fname)
In [4]:
import pandas as pd
# Read the readability/length table; the first CSV column becomes the index.
df = pd.read_csv(
    "db-readability-length.csv",
    index_col=0,
)
In [5]:
# Show only the first row as a quick check of the loaded columns.
df.head(n=1)
Out[5]:
In [9]:
# Look up the 'Readability' value for the row labelled 0.
df.loc[0, 'Readability']
Out[9]:
In [7]:
#forum_sources=["http://www.medhelp.org",
# ]
# NOTE: this rebinds `df`. From here on it holds the contents of
# articles-n-forums-posts.csv, not the table read from
# db-readability-length.csv earlier in the notebook.
df = pd.read_csv("articles-n-forums-posts.csv")

# Distinct values of the 'source' column.
df["source"].unique()
Out[7]:
In [ ]:
# Partial output of df['source'].unique() had been pasted into this cell as
# code. It left an unclosed `array([` call, which made the whole cell a
# SyntaxError, so it is kept here as a comment only:
#   array(['https://www.autismparentingmagazine.com/', ...
#
# Source URLs regarded as forums. Presumably these are compared against
# df['source'] -- confirm each entry against the values unique() reports.
# NOTE(review): 'http://www.reditt.com' looks like a misspelling of
# 'http://www.reddit.com'. It is left unchanged because the value must match
# whatever string the data actually contains; verify and correct if needed.
forum_sources = [
    'http://ehealthforum.com',
    'http://www.medhelp.org',
    'http://www.reditt.com',
]
In [ ]: