In [1]:
%matplotlib inline
from __future__ import absolute_import
from __future__ import print_function
from __future__ import division
from matplotlib import pylab as pl
import numpy as np
import pandas as pd
import seaborn as sns
import h5py
from matplotlib.backends.backend_pdf import PdfPages
from bx.bbi.bigwig_file import BigWigFile
import json
import os
import itertools
import numpy as np
import six
# import bcolz
# from pysam import FastaFile
# import roman as rm
import pandas as pd
import pdb
import numpy as np
import math

In [2]:
ls  # list the current working directory


FIDDLE_alpha/                   predictionCheckpoint.ipynb
Figures/                        suffnecScores.ipynb
bigWigFileManipulations.ipynb   testing_generate_regions.ipynb
data/                           venv/
hdf5_fileManipulations.ipynb

In [27]:
# Open the validation (f1) and training (f2) HDF5 files read-only.
# The handles are left open on purpose: f2 is inspected in the cells below.
f1 = h5py.File(
    "FIDDLE_alpha/data/hdf5datasets/test_march10/validation_test_march10.h5",
    mode="r"
)
f2 = h5py.File(
    "FIDDLE_alpha/data/hdf5datasets/test_march10/train_test_march10.h5",
    mode="r"
)

In [28]:
# Show the names of the top-level members stored in the training file.
f2.keys()


Out[28]:
[u'DNAseq', u'MNaseseq', u'NETseq', u'RNAseq', u'TSSseq']

In [33]:
# Sanity check after dataset creation: count the missing values in the
# "TSSseq" dataset of the training file. A result of 0 means no NaNs.
test = f2["TSSseq"]
# Read the full dataset into memory with [()]. Dataset.value is deprecated
# and was removed in h5py 3.0; [()] performs the same read on old and new
# h5py releases.
array = test[()]
pd.isnull(array).sum()


Out[33]:
0

In [ ]: