In [4]:
%matplotlib inline
import matplotlib
import numpy as np
import matplotlib.pyplot as plt
import sys,os
# Put the directory four levels above the working directory on the import
# path; the project imports that follow in this cell (Utils, Scripts) are
# presumably resolved from there.
# os.path is used rather than splitting on '/' so the result is correct on any
# platform and never collapses to '' (an empty sys.path entry means "current
# directory", which is not the intended ancestor).
path = os.path.abspath(os.path.join(os.getcwd(), *([os.pardir] * 4)))
sys.path.insert(1, path)
import Utils.Util as utl
import pandas as pd
# Display configuration: show at most 20 rows per frame and enable
# expand_frame_repr.
pd.set_option('display.max_rows', 20)
pd.set_option('display.expand_frame_repr', True)
from IPython.display import display
import seaborn as sns
import Scripts.HLI.Kyrgyz.FILTER.analysis as flt
In [6]:
# Re-import the analysis module so on-disk edits are picked up, then load the
# data set through it.
reload(flt)
a = flt.load()
# PASS values restricted to the rows whose `Other` column equals 0.
b = a.loc[a.Other == 0, 'PASS']
In [7]:
# Re-import the analysis module, then hand the loaded data to its plotting
# routine.
# NOTE(review): 'poltFILTER' looks like a misspelling of 'plotFILTER' — confirm
# the name in Scripts.HLI.Kyrgyz.FILTER.analysis before renaming anything.
reload(flt)
flt.poltFILTER(a)
In [8]:
# Bar chart of how often each value in `b` occurs, ordered by value.
# The title is set on the axes returned by the plot call; the trailing ';'
# suppresses the text repr in the cell output.
(b.value_counts()
  .sort_index()
  .plot.bar()
  .set_title('Distribution of number of PASS in the NOFAIL sites.'));
In [10]:
# Flatten the index into ordinary columns, then add `start` and `end` columns
# that both copy POS (added in that order, after the existing columns).
c = a.reset_index()
for interval_col in ('start', 'end'):
    c[interval_col] = c['POS']
# Last expression of the cell: display the resulting frame.
c
Out[10]:
In [ ]:
# Re-import the utilities module so on-disk edits are picked up before use.
reload(utl)
# Pass the start/end-annotated frame to the BED cross-mapping helper with
# hgFrom=38 and hgTo=19.
# NOTE(review): presumably a genome-build liftover (hg38 -> hg19) — confirm the
# semantics of keepOnlyPos in utl.BED.xmap_bed.
xmap = utl.BED.xmap_bed(
    c,
    hgFrom=38,
    hgTo=19,
    keepOnlyPos=True,
)