In [1]:
%run ~/relmapping/annot/notebooks/__init__.ipynb
In [2]:
df_regl = regl_cv()
print(len(df_regl))
df_regl['atac_flank_rev'] = df_regl['start'] - 50
df_regl['atac_flank_fwd'] = df_regl['end'] + 50
COLS_FLANK = ['chrom', 'atac_flank_rev', 'atac_flank_fwd']
df_regl.head()
Out[2]:
In [3]:
#fp_ = 'http://genome.cshlp.org/content/suppl/2014/04/24/gr.161992.113.DC1/Supplemental_Information_S1.zip'
#!cd ~/relmapping/wget; wget -m --no-parent {fp_}
fp_ = 'wget/genome.cshlp.org/content/suppl/2014/04/24/gr.161992.113.DC1/S01 Information of TF overlap worm_ce10.csv'
df_ = pd.read_csv(fp_)
print('%d records in S1' % (len(df_),))
df_.head(5)
Out[3]:
In [4]:
df_core = df_[['chromosome', 'core_start', 'core_stop']]
df_core.columns = ['chrom', 'start', 'end']
df_core.head(5)
Out[4]:
In [5]:
df_extd = df_[['chromosome', 'extended_start', 'extended_stop']]
df_extd.columns = ['chrom', 'start', 'end']
df_extd.head(5)
Out[5]:
In [8]:
gv = yp.GenomicVenn2(
BedTool.from_dataframe(df_regl[COLS_FLANK + ['annot']]),
BedTool.from_dataframe(df_core),
label_a='Accessible sites',
label_b='(Chen et al., 2014)\ncore regions',
)
plt.figure(figsize=(18,8))
plt.subplot(1,2,1)
gv.plot()
plt.subplot(1,2,2)
gv = yp.GenomicVenn2(
BedTool.from_dataframe(df_regl[COLS_FLANK + ['annot']]),
BedTool.from_dataframe(df_extd),
label_a='Accessible sites',
label_b='(Chen et al., 2014)\nextended regions',
)
gv.plot()
plt.savefig('annot/FigA_overlaps/overlaps_Chen2014_TFs.pdf', bbox_inches='tight')
In [ ]: