In [1]:
import numpy as np
import bcolz
import h5py
import os
os.chdir('../..')
import allel
allel.__version__
Out[1]:
In [2]:
a = np.arange(20000000)
a
Out[2]:
In [3]:
c = allel.chunked.bcolztmp_storage.array(a, cparams=bcolz.cparams(cname='zlib', clevel=1, shuffle=True))
c.flush()
c
Out[3]:
In [4]:
!du -hs {c.rootdir}
In [5]:
allel.chunked.ChunkedArrayWrapper(c)
Out[5]:
In [6]:
h = allel.chunked.hdf5tmp_storage.array(a, compression='gzip', compression_opts=1, shuffle=True, chunks=(c.chunklen,))
h.file.flush()
h
Out[6]:
In [7]:
!du -h {h.file.filename}
In [8]:
allel.chunked.ChunkedArrayWrapper(h)
Out[8]:
In [9]:
z = allel.chunked.copy(a, storage='zarrmem')
z
Out[9]:
In [10]:
z = allel.chunked.copy(a, storage='zarrtmp')
z
Out[10]:
In [11]:
z.store.path
Out[11]:
In [12]:
z = allel.chunked.copy(a, storage='zarr', store='array.zarr', overwrite=True)
z
Out[12]:
In [13]:
z.store.path
Out[13]:
In [14]:
g = allel.chunked.hdf5tmp_storage.table([a, a], compression='gzip', compression_opts=1, shuffle=True)
g
Out[14]:
In [15]:
allel.chunked.ChunkedTableWrapper(g)
Out[15]:
In [16]:
allel.chunked.copy_table(g, storage='bcolz')
Out[16]:
In [21]:
z = allel.chunked.copy_table(g, storage='zarr')
z
Out[21]:
In [22]:
z.grp
Out[22]:
In [23]:
z = allel.chunked.copy_table(g, storage='zarr', store='test.zarr', overwrite=True)
z
Out[23]:
In [24]:
z.grp
Out[24]:
In [25]:
!ls -lh test.zarr/
In [26]:
!ls -lh test.zarr/f0 | head -n10
In [27]:
z = allel.chunked.copy_table(g, storage='zarrtmp')
z.grp
Out[27]:
In [28]:
z['f0'].store.path
Out[28]:
In [30]:
allel.chunked.ChunkedTableWrapper(z)
Out[30]:
In [ ]: