In [1]:
import os
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import numpy as np
In [3]:
# Move the working directory one level up from where the notebook kernel
# started, so the relative paths used below ('design.tsv', 'homer/Tag.dir/...')
# resolve from there.
#
# A bare os.chdir('../') is relative to the *current* directory, so re-running
# this cell would climb one more level each time. Remember the start directory
# on first execution and always change relative to it, which keeps the cell
# idempotent within a kernel session.
if "NOTEBOOK_START_DIR" not in globals():
    NOTEBOOK_START_DIR = os.getcwd()
os.chdir(os.path.join(NOTEBOOK_START_DIR, os.pardir))
print(os.getcwd())
In [4]:
def plotTagCount(TagDir, max_positions=10, tag_root=os.path.join("homer", "Tag.dir")):
    """Plot the tag count distribution of one tag directory as a bar chart.

    Reads ``<tag_root>/<TagDir>/tagCountDistribution.txt`` (tab-separated),
    converts the second column from a fraction to a percentage and draws the
    first ``max_positions`` rows as a bar plot titled with ``TagDir``.

    Parameters
    ----------
    TagDir : str
        Name of the tag directory below ``tag_root``.
    max_positions : int or None, optional
        Number of leading rows to plot (default 10). ``None`` plots all rows.
    tag_root : str, optional
        Directory containing the tag directories, relative to the current
        working directory (default ``homer/Tag.dir``).

    Raises
    ------
    FileNotFoundError
        If the distribution file does not exist (raised by ``pd.read_csv``).
    """
    x_label = 'Reads per position'
    # NOTE(review): the label says "total reads"; confirm this matches what the
    # second column of the input file actually measures.
    y_label = 'Fraction of total reads (%)'

    path = os.path.join(tag_root, TagDir, 'tagCountDistribution.txt')

    # header=1 makes the file's second line the header row and discards the
    # line before it; the parsed header is replaced by our own labels below.
    # NOTE(review): if the file has only a single header line, this consumes
    # the first data row as the header -- confirm that this is intended.
    distribution = pd.read_csv(path, sep="\t", header=1)
    distribution.columns = [x_label, y_label]
    distribution[y_label] = distribution[y_label] * 100  # fraction -> percent

    shown = distribution.iloc[:max_positions]

    # Set the style before creating the axes so that it applies to them.
    sns.set_style("whitegrid", {'axes.grid': False})
    fig, ax = plt.subplots(figsize=(10, 6))
    sns.barplot(x=x_label, y=y_label, data=shown, ax=ax)
    # Title each figure so plots produced in a loop can be told apart.
    ax.set_title(TagDir)
    plt.show()
In [5]:
# Derive one tag-directory name per BAM file listed in the design table and
# plot the tag count distribution for every sample that has a tag directory.
BAM_SUFFIX = ".bam"
TAG_DIR_ROOT = os.path.join("homer", "Tag.dir")

names = set()
design = pd.read_table('design.tsv')
samples = design.bamReads.values
for sample in design.bamReads.dropna().astype(str):
    # Remove the extension as a suffix. str.strip(".bam") is NOT a suffix
    # removal: it strips any leading/trailing '.', 'b', 'a' or 'm' characters,
    # so e.g. "mm10_a.bam" would become "10_".
    if sample.endswith(BAM_SUFFIX):
        sample = sample[:-len(BAM_SUFFIX)]
    if sample:
        names.add(sample)

# plotTagCount only reads from homer/Tag.dir/<name>, so check for that
# directory directly instead of walking the whole working tree. Walking the
# tree visits directories in arbitrary order and plots a sample once for every
# same-named directory found anywhere below the working directory.
for name in sorted(names):
    if os.path.isdir(os.path.join(TAG_DIR_ROOT, name)):
        plotTagCount(name)