Goal:

  • Download most up-to-date version of NCBI 'complete' genomes

Setting variables


In [17]:
workDir = '/var/seq_data/ncbi_db/genome/Jan2016/'
proksFile = 'proks_complete.txt'
taxFile = 'proks_complete_tax.txt'

Init


In [2]:
import os
%load_ext rpy2.ipython
%load_ext pushnote

In [3]:
%%R
library(ggplot2)
library(dplyr)
library(tidyr)
library(genomes)


/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: 
Attaching package: ‘dplyr’


  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: The following objects are masked from ‘package:stats’:

    filter, lag


  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: The following objects are masked from ‘package:base’:

    intersect, setdiff, setequal, union


  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: Loading required package: XML

  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: 
Attaching package: ‘XML’


  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: The following object is masked from ‘package:tools’:

    toHTML


  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: Loading required package: RCurl

  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: Loading required package: bitops

  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: 
Attaching package: ‘RCurl’


  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: The following object is masked from ‘package:tidyr’:

    complete


  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: Loading required package: GenomicRanges

  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: Loading required package: BiocGenerics

  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: Loading required package: parallel

  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: 
Attaching package: ‘BiocGenerics’


  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: The following objects are masked from ‘package:parallel’:

    clusterApply, clusterApplyLB, clusterCall, clusterEvalQ,
    clusterExport, clusterMap, parApply, parCapply, parLapply,
    parLapplyLB, parRapply, parSapply, parSapplyLB


  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: The following objects are masked from ‘package:dplyr’:

    combine, intersect, setdiff, union


  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: The following object is masked from ‘package:stats’:

    xtabs


  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: The following objects are masked from ‘package:base’:

    anyDuplicated, append, as.data.frame, as.vector, cbind, colnames,
    do.call, duplicated, eval, evalq, Filter, Find, get, intersect,
    is.unsorted, lapply, Map, mapply, match, mget, order, paste, pmax,
    pmax.int, pmin, pmin.int, Position, rank, rbind, Reduce, rep.int,
    rownames, sapply, setdiff, sort, table, tapply, union, unique,
    unlist, unsplit


  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: Loading required package: S4Vectors

  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: Loading required package: stats4

  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: 
Attaching package: ‘S4Vectors’


  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: The following object is masked from ‘package:dplyr’:

    rename


  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: Loading required package: IRanges

  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: 
Attaching package: ‘IRanges’


  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: The following object is masked from ‘package:tidyr’:

    expand


  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: The following objects are masked from ‘package:dplyr’:

    collapse, desc, slice


  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: Loading required package: GenomeInfoDb

  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: Loading required package: Biostrings

  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: Loading required package: XVector

  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: 
Attaching package: ‘genomes’


  res = super(Function, self).__call__(*new_args, **new_kwargs)
/opt/anaconda/lib/python2.7/site-packages/rpy2/robjects/functions.py:106: UserWarning: The following object is masked from ‘package:GenomeInfoDb’:

    species


  res = super(Function, self).__call__(*new_args, **new_kwargs)

In [55]:
if not os.path.isdir(workDir):
    os.makedirs(workDir)

%cd $workDir


/var/seq_data/ncbi_db/genome/Jan2016

Loading list of complete prok genomes


In [19]:
%%R -i workDir -i proksFile 

F = file.path(workDir, proksFile)

df.proks.complete = read.delim(F, sep='\t')

# checking join
df.proks.complete %>% nrow %>% print
df.proks.complete %>% head(n=3)


[1] 4732
     pid                           name          status   released  taxid
1  12997 Acaryochloris marina MBIC11017 Complete Genome 2007-10-16 329726
2  60713 Acetobacterium woodii DSM 1030 Complete Genome 2012-02-14 931626
3 242487       Acetobacter pasteurianus Complete Genome 2015-07-21    438
   bioproject          group              subgroup    size      gc
1  PRJNA12997  Cyanobacteria Oscillatoriophycideae 8.36160 46.9889
2  PRJNA60713     Firmicutes            Clostridia 4.04478 39.3000
3 PRJNA242487 Proteobacteria   Alphaproteobacteria 2.80615 53.3000
         refseq      insdc
1   NC_009925.1 CP000828.1
2   NC_016894.1 CP002987.1
3 NZ_CP012111.1 CP012111.1
                                                                                               plasmid.refseq
1 NC_009930.1,NC_009928.1,NC_009927.1,NC_009931.1,NC_009933.1,NC_009934.1,NC_009932.1,NC_009926.1,NC_009929.1
2                                                                                                        <NA>
3                                                                                                        <NA>
                                                                                       plasmid.insdc
1 CP000842.1,CP000840.1,CP000839.1,CP000843.1,CP000845.1,CP000846.1,CP000844.1,CP000838.1,CP000841.1
2                                                                                               <NA>
3                                                                                               <NA>
   wgs scaffolds genes proteins   modified                             center
1 <NA>        10  7469     7187 2015-07-30              Washington University
2 <NA>         1  3649     3521 2015-08-18 Georg-August-University Goettingen
3 <NA>         1  2688     2535 2015-12-09      Zhejiang Gongshang University
     biosample        assembly reference ftp   pubmed
1 SAMN02604308 GCA_000018105.1      REFR  NA 18252824
2 SAMN02603267 GCA_000247605.1      REFR  NA 22479398
3 SAMN02709032 GCA_001183745.1      <NA>  NA     <NA>

In [20]:
%%R -i workDir -i taxFile

F = file.path(workDir, taxFile)

df.tax = read.delim(F, sep='\t') %>%
    distinct(taxid)
df.proks.complete = dplyr::inner_join(df.proks.complete, df.tax, c('taxid' = 'taxid'))

# checking join
df.proks.complete %>% nrow %>% print
df.proks.complete %>% nrow %>% print
df.proks.complete %>% head(n=3)


[1] 4732
[1] 4732
     pid                           name          status   released  taxid
1  12997 Acaryochloris marina MBIC11017 Complete Genome 2007-10-16 329726
2  60713 Acetobacterium woodii DSM 1030 Complete Genome 2012-02-14 931626
3 242487       Acetobacter pasteurianus Complete Genome 2015-07-21    438
   bioproject          group              subgroup    size      gc
1  PRJNA12997  Cyanobacteria Oscillatoriophycideae 8.36160 46.9889
2  PRJNA60713     Firmicutes            Clostridia 4.04478 39.3000
3 PRJNA242487 Proteobacteria   Alphaproteobacteria 2.80615 53.3000
         refseq      insdc
1   NC_009925.1 CP000828.1
2   NC_016894.1 CP002987.1
3 NZ_CP012111.1 CP012111.1
                                                                                               plasmid.refseq
1 NC_009930.1,NC_009928.1,NC_009927.1,NC_009931.1,NC_009933.1,NC_009934.1,NC_009932.1,NC_009926.1,NC_009929.1
2                                                                                                        <NA>
3                                                                                                        <NA>
                                                                                       plasmid.insdc
1 CP000842.1,CP000840.1,CP000839.1,CP000843.1,CP000845.1,CP000846.1,CP000844.1,CP000838.1,CP000841.1
2                                                                                               <NA>
3                                                                                               <NA>
   wgs scaffolds genes proteins   modified                             center
1 <NA>        10  7469     7187 2015-07-30              Washington University
2 <NA>         1  3649     3521 2015-08-18 Georg-August-University Goettingen
3 <NA>         1  2688     2535 2015-12-09      Zhejiang Gongshang University
     biosample        assembly reference ftp   pubmed superkingdom
1 SAMN02604308 GCA_000018105.1      REFR  NA 18252824     Bacteria
2 SAMN02603267 GCA_000247605.1      REFR  NA 22479398     Bacteria
3 SAMN02709032 GCA_001183745.1      <NA>  NA     <NA>     Bacteria
          phylum               class            order           family
1  Cyanobacteria                <NA>    Chroococcales             <NA>
2     Firmicutes          Clostridia    Clostridiales   Eubacteriaceae
3 Proteobacteria Alphaproteobacteria Rhodospirillales Acetobacteraceae
           genus               species
1  Acaryochloris  Acaryochloris marina
2 Acetobacterium Acetobacterium woodii
3    Acetobacter                  <NA>

Just Bacteria


In [21]:
%%R
df.bac.complete = df.proks.complete %>%
    filter(superkingdom == 'Bacteria')

df.bac.complete %>% nrow


[1] 4498

Phylum representation


In [22]:
%%R -w 800
df.bac.complete.s = df.bac.complete %>%
    group_by(phylum) %>%
    summarize(n = n()) %>%
    filter(! is.na(n), n > 0)

ggplot(df.bac.complete.s, aes(phylum, n)) +
    geom_bar(stat='identity') +
    scale_y_log10() +
    labs(y = 'Number of genomes') +
    theme_bw() +
    theme(
        text = element_text(size=16),
        axis.text.x = element_text(angle=60, hjust=1)
    )


removing what are really phage/plasmid genomes


In [23]:
%%R
cat('Pre-filter:', df.bac.complete %>% nrow, '\n')

to.rm = c("Thermoanaerobacterium saccharolyticum JW/SL-YS485",
          "Streptococcus salivarius 57.I")

df.bac.complete = df.bac.complete %>%
    filter(! name %in% to.rm)

cat('Post-filter:', df.bac.complete %>% nrow, '\n')


Pre-filter: 4498 
Post-filter: 4496 

Sequence download


In [56]:
%%R -i workDir

outFile = file.path(workDir, 'bac_complete.txt')
write.table(df.bac.complete, outFile, sep='\t', quote=FALSE, row.names=FALSE)

In [ ]:
!seqDB_tools accession-GI2fasta \
    -a 11 -n 2 -f 12 -header -o bac_complete \
    < bac_complete.txt \
    2> bac_complete.log

In [ ]:
%pushnote genome download complete

Getting list of empty genome files


In [60]:
fileSizes = !ls -tlc *.fna | perl -pe 's/[ \t]+/ /g' 

outFile = 'empty_genome_files.txt'
with open(outFile, 'wb') as outFH:
    for x in fileSizes:
        xx = x.split(' ')
        if xx[4] == '0':
            xx[-1] = xx[-1].replace('_', ' ').rstrip('.fna')
            outFH.write(xx[-1] + '\n')

# status
!printf 'Number of empty genome files: '     
!wc -l $outFile
!head $outFile


Number of empty genome files: 0 empty_genome_files.txt

Deleting empty files


In [61]:
fileSizes = !ls -tlc bac_complete/*.fna | perl -pe 's/[ \t]+/ /g' 

for x in fileSizes:
    xx = x.split(' ')
    if float(xx[4]) < 100000.0:
        os.remove(xx[-1])

Checking output


In [62]:
genomeDir = os.path.join(workDir, 'bac_complete')
%cd $genomeDir


/var/seq_data/ncbi_db/genome/Jan2016/bac_complete

In [63]:
# number of genomes downloaded
!printf "Number of bacterial genomes: "
!find . -name "*.fna" | wc -l


Number of bacterial genomes: 3508

In [64]:
# file size
!echo "Genome file size distribution (bytes):"
!ls -tlc *.fna | \
    perl -pe 's/ +/\t/g' | \
    cut -f 5 | NY_misc_perl stats_descriptive


Genome file size distribution (bytes):
1	min	160314.00
1	Q1	2124608.00
1	mean	3679260.40
1	median	3480661.00
1	Q3	4913670.00
1	max	15028601.00
1	stdev	1949951.34

In [68]:
# checking for non-bacterial genomes
!find . -name "*.fna" | xargs -P 26 -I % bash -c 'egrep "phage|virus|plasmid" %'

In [69]:
# deleting non-bacterial genomes
#!rm -f ./Clostridium_perfringens_SM101.fna \
#    ./Chlamydophila_pneumoniae_AR39.fna \
#    ./Enterococcus_faecalis_62.fna

In [70]:
# number of genomes downloaded
!printf "Number of bacterial genomes: "
!find . -name "*.fna" | wc -l


Number of bacterial genomes: 3508

Renaming genomes


In [73]:
genomeDirRn = genomeDir + '_rn'
genomeDirRn


Out[73]:
'/var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn'

In [74]:
# renameing
!find . -name "*.fna" | \
    SIPSim genome_rename -n 26 --prefix $genomeDirRn -


File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Chlamydophila_pneumoniae_CWL029.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Helicobacter_cetorum_MIT_99-5656.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Chlamydia_trachomatis_B_TZ1A828_OT.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Streptococcus_anginosus_C238.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Bibersteinia_trehalosi_USDA-ARS-USMARC-190.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Comamonadaceae_bacterium_A1.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Lactobacillus_johnsonii_DPC_6026.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Segniliparus_rotundus_DSM_44985.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Thermacetogenium_phaeum_DSM_12270.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Neisseria_meningitidis_G2136.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Desulfotomaculum_reducens_MI-1.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Corynebacterium_falsenii_DSM_44353.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Candidatus_Kinetoplastibacterium_galatii_TCC219.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Streptococcus_pneumoniae_P1031.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Chlamydia_trachomatis_Ia_SotonIa3.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Muricauda_lutaonensis.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Salmonella_enterica_subsp_enterica_serovar_Enteritidis_str_EC20110353.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Acinetobacter_baumannii_AYE.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Chlamydia_trachomatis_L3_404_LN.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Shewanella_baltica_OS678.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Clostridium_botulinum_A3_str_Loch_Maree.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Streptococcus_constellatus_subsp_pharyngis_C1050.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Bartonella_tribocorum_CIP_105476.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Planococcus_kocurii.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Lactococcus_piscium_MKFS47.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Campylobacter_coli_15-537360.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Brevibacterium_flavum.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Chlamydia_psittaci_C19_98.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Rickettsia_prowazekii_str_Chernikova.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Escherichia_coli_O139:H28_str_E24377A.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Wolbachia_endosymbiont_of_Onchocerca_ochengi.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Escherichia_coli_UTI89.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Sanguibacter_keddieii_DSM_10542.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Mycobacterium_tuberculosis_49-02.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Acidithiobacillus_ferrooxidans_ATCC_23270.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Pseudomonas_putida_ND6.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Xanthomonas_campestris_pv_campestris_str_8004.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Mycobacterium_marinum_E11.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Roseburia_hominis_A2-183.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Mycobacterium_tuberculosis_KZN_1435.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Dehalogenimonas_lykanthroporepellens_BL-DC-9.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Arthrobacter_sp_FB24.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Methyloceanibacter_caenitepidi.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Salmonella_enterica_subsp_enterica_serovar_Typhimurium_str_LT2.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Escherichia_albertii_KF1.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Hymenobacter_sp_DG25A.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Escherichia_coli_O157:H7_str_EC4115.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Mycobacterium_avium_subsp_paratuberculosis.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Tropheryma_whipplei_str_Twist.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Chlorobaculum_parvum_NCIB_8327.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Bacillus_subtilis_subsp_subtilis_str_RO-NN-1.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Helicobacter_pylori_oki673.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Buchnera_aphidicola_BCc.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Bartonella_bacilliformis_KC583.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Bacillus_methanolicus_MGA3.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Helicobacter_pylori_PeCan18.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Bacillus_methylotrophicus_NJN-6.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Plautia_stali_symbiont.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Mycobacterium_tuberculosis_str_Kurono.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Chlamydia_trachomatis_6276.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Chlamydia_trachomatis_D_s_2923.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Xanthomonas_oryzae_pv_oryzae_MAFF_311018.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Rickettsia_bellii_OSU_85-389.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Mycoplasma_suis_KI3806.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Coxiella_burnetii_RSA_493.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Acinetobacter_baumannii_MDR-TJ.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Rhodococcus_sp_B7740.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Allochromatium_vinosum_DSM_180.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Escherichia_coli_O103:H2_str_12009.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Belliella_baltica_DSM_15883.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Mycoplasma_hyorhinis_MCLD.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Candidatus_Desulforudis_audaxviator_MP104C.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Pediococcus_claussenii_ATCC_BAA-344.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Thioalkalivibrio_sulfidiphilus_HL-EbGr7.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Mycoplasma_haemofelis_str_Langford_1.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Salmonella_enterica_subsp_enterica_serovar_Choleraesuis_str_ATCC_10708.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Fusobacterium_hwasookii_ChDC_F300.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Mycobacterium_bovis_BCG.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Robiginitalea_biformata_HTCC2501.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Pararhodospirillum_photometricum_DSM_122.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Streptococcus_salivarius_JIM8777.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Lactobacillus_helveticus_H9.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Bacillus_anthracis_str_Sterne.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Chlamydia_trachomatis_L2b_795.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Brucella_suis_bv_3_str_686.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Cronobacter_sakazakii_CMCC_45402.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Mycoplasma_hyorhinis_DBS_1050.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Herbaspirillum_hiltneri_N3.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Pasteurella_multocida_subsp_multocida_str_3480.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Streptococcus_sp_VT_162.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Xenorhabdus_poinarii_G6.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Leptospira_borgpetersenii_serovar_Hardjo-bovis_str_L550.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Shigella_flexneri_2a_str_301.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Paenibacillus_sp_FSL_R7-0273.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Brucella_abortus_bv_6_str_870.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Neisseria_meningitidis_alpha14.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Salmonella_enterica_subsp_enterica_serovar_Enteritidis_str_EC20120916.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Nitrobacter_hamburgensis_X14.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Streptococcus_pneumoniae_AP200.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Pectobacterium_wasabiae_WPP163.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Streptococcus_pyogenes_MGAS8232.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Lactobacillus_paracasei.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Ruegeria_sp_TM1040.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Burkholderia_thailandensis_USAMRU_Malaysia_#20.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Chlamydia_psittaci_CP3.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Streptococcus_pneumoniae_ATCC_700669.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Cronobacter_muytjensii_ATCC_51329.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Actinobacillus_succinogenes_130Z.fna
File written: /var/seq_data/ncbi_db/genome/Jan2016/bac_complete_rn/Burkholderia_pseudomallei_HBPUB10134a.fna
**OUTPUT MUTED**

In [ ]: