In [1]:
import pandas as pd
import os
import sys
import pybedtools
In [26]:
# Clear out pybedtools temporary files before the analysis starts.
# NOTE(review): remove_all=True is understood to delete temp files left by
# every pybedtools session in the temp directory, not only this one — confirm
# no other pybedtools job is running on this machine before executing.
pybedtools.cleanup(remove_all=True)
In [27]:
# Coordinate range of the single reference sequence, in the
# {chrom: (start, end)} form that is later handed to set_chromsizes().
chromsizes = {'NC_000913.3': (0, 4641651)}

# Interval sets for the three sRNAs, one BedTool per BED file.
arcz, dsra, rpra = (
    pybedtools.BedTool(bed_path)
    for bed_path in (
        '../results/arcz.fixed.bed',
        '../results/dsra.fixed.bed',
        '../results/rpra.fixed.bed',
    )
)

# UTR intervals that every sRNA set is compared against below.
utr5 = pybedtools.BedTool('../results/redux/wt_tmut.utrs.corr.old.bed')
In [28]:
# Intersect the utr5 intervals with the arcz intervals. wa/wb correspond to
# bedtools intersect's -wa/-wb flags, so each output row should contain the
# utr5 record followed by the overlapping arcz record.
utr5_arcz = utr5.intersect(arcz, wa=True, wb=True)
In [29]:
# Preview the first rows of the intersection to check the column layout.
utr5_arcz.head()
In [30]:
# Persist the intersection to a named BED file so it can be re-read as plain
# text (pybedtools results otherwise live in temporary files).
utr5_arcz.saveas('../results/redux/utr5_arcz.bed')
Out[30]:
In [31]:
# Collect the distinct values found in the fifth tab-separated column of the
# saved utr5/arcz intersection, then display how many there are.
# NOTE(review): index 4 is assumed to hold the gene identifier of the utr5
# record — confirm against the column layout of the UTR BED file.
arcz_genes = set()
# Read from the same location the intersection was written to with saveas().
with open('../results/redux/utr5_arcz.bed') as fi:
    for line in fi:
        record = line.rstrip('\r\n')
        if not record:
            # Skip blank lines instead of failing on the column lookup.
            continue
        fields = record.split('\t')
        # add() stores the whole field; update() would iterate over the string
        # and insert its individual characters into the set.
        arcz_genes.add(fields[4])
len(arcz_genes)
Out[31]:
In [53]:
# Shuffle-based overlap statistics for arcz against utr5.
# set_chromsizes() must come first: the shuffling needs the genome bounds.
arcz.set_chromsizes(chromsizes)
# 10000 shuffles spread over 30 worker processes; 'chrom': True is forwarded
# to the shuffle step (bedtools shuffle -chrom keeps features on their own
# chromosome).
# NOTE(review): no seed is passed, so the numbers will presumably vary a
# little from run to run.
result = arcz.randomstats(
    utr5,
    iterations=10000,
    processes=30,
    shuffle_kwargs={'chrom': True},
)
In [54]:
# Show the statistics returned by arcz.randomstats().
result
Out[54]:
In [57]:
# Shuffle-based overlap statistics for dsra against utr5.
# set_chromsizes() must come first: the shuffling needs the genome bounds.
dsra.set_chromsizes(chromsizes)
# 10000 shuffles spread over 30 worker processes; 'chrom': True is forwarded
# to the shuffle step (bedtools shuffle -chrom keeps features on their own
# chromosome).
# NOTE(review): no seed is passed, so the numbers will presumably vary a
# little from run to run.
result_dsra = dsra.randomstats(
    utr5,
    iterations=10000,
    processes=30,
    shuffle_kwargs={'chrom': True},
)
In [58]:
# Show the statistics returned by dsra.randomstats().
result_dsra
Out[58]:
In [59]:
# Shuffle-based overlap statistics for rpra against utr5.
# set_chromsizes() must come first: the shuffling needs the genome bounds.
rpra.set_chromsizes(chromsizes)
# 10000 shuffles spread over 30 worker processes; 'chrom': True is forwarded
# to the shuffle step (bedtools shuffle -chrom keeps features on their own
# chromosome).
# NOTE(review): no seed is passed, so the numbers will presumably vary a
# little from run to run.
result_rpra = rpra.randomstats(
    utr5,
    iterations=10000,
    processes=30,
    shuffle_kwargs={'chrom': True},
)
In [60]:
# Show the statistics returned by rpra.randomstats().
result_rpra
Out[60]:
In [ ]:
# Optional final cleanup, intentionally left disabled: uncomment the call
# below to delete pybedtools temporary files once the results are no longer
# needed in this session.
#### pybedtools.cleanup(remove_all=True)