In [25]:
import numpy as np
from skbio import BiologicalSequence
# Random DNA-alphabet sequence of 250,000 single-character items, stored as a
# list; the timing cells take prefixes of it as their input.
# One vectorized draw replaces 250,000 individual np.random.choice calls.
# Wrapping the array in list() keeps the container a plain list whose elements
# are NumPy string scalars, matching what the per-item calls produced.
seq = list(np.random.choice(list('ACGT'), size=250000))
# Identifier passed together with the sequence in the timing cells.
seq_id = "42"
In [26]:
for i in (500, 5000, 50000):
subseq = seq[:i]
print i
%timeit (subseq, seq_id)
In [27]:
for i in (500, 5000, 50000):
subseq = seq[:i]
print i
%timeit (''.join(subseq), seq_id)
In [28]:
for i in (500, 5000, 50000):
subseq = seq[:i]
print i
%timeit BiologicalSequence(subseq, seq_id)
In [ ]: