In [1]:
import os
from gensim import corpora, models, similarities
# File name of the previously saved similarity index (resolved relative to
# the current working directory).
lsi_matsim_fname = "lsi-matsim.save"

# Restore the MatrixSimilarity index from that file instead of rebuilding it.
matsim = similarities.MatrixSimilarity.load(lsi_matsim_fname)
In [2]:
import pandas as pd
# Read the readability table; the first CSV column becomes the DataFrame index.
df_readability = pd.read_csv(
    "db-readability.csv",
    index_col=0,
)
In [7]:
# (An abandoned, commented-out draft of a `forum_sources` list that started
# with "http://www.medhelp.org" used to sit at the top of this cell.)

# Load the CSV into `df` with the default integer index.
df = pd.read_csv("articles-n-forums-posts.csv")

# Show the distinct values of the "source" column as the cell's output.
df["source"].unique()
Out[7]:
array(['https://www.autismparentingmagazine.com/',
In [ ]:
# Base URLs collected under the name `forum_sources`.
# Presumably these are meant to match values of df['source'] -- verify.
# NOTE(review): "reditt" looks like a misspelling of "reddit"; confirm
# against the actual values in the data before changing the literal.
forum_sources = [
    "http://ehealthforum.com",
    "http://www.medhelp.org",
    "http://www.reditt.com",
]
In [ ]: