In [45]:
def FASTA(filename):
  """Read a FASTA file and print a summary of the records it contains.

  Each line starting with '>' begins a new record. The record name is the
  rest of that line with underscores replaced by spaces. Every following
  line, up to the next header, is appended to that record's sequence after
  removing the line ending and any trailing '*' characters.

  Printed output, in order: the number of headers found, the list of names
  in file order, a blank separator, and the name -> sequence dictionary.

  Args:
    filename: path of the FASTA file to read.

  Returns:
    None. If the file cannot be opened, a message is printed instead of the
    summary and the function returns early.

  Raises:
    ValueError: if non-blank sequence data appears before the first header.
  """
  try:
    f = open(filename)
  except IOError:
    print("The file, %s, does not exist" % filename)
    return

  order = []
  sequences = {}
  name = None  # no header seen yet

  # The with-block guarantees the handle is closed, even if parsing fails.
  with f:
    for line in f:
      # Strip '\r' as well so files with Windows line endings parse cleanly.
      text = line.rstrip('\r\n')
      if line.startswith('>'):
        name = text[1:].replace('_', ' ')
        # A repeated header is listed again in `order` and restarts its
        # sequence, so only the last occurrence's data is kept.
        order.append(name)
        sequences[name] = ''
      elif name is None:
        # Blank lines ahead of the first header are harmless; real data
        # with no header to attach it to is a malformed file.
        if text.strip():
          raise ValueError(
              "Sequence data found before the first '>' header in %s"
              % filename)
      else:
        sequences[name] += text.rstrip('*')

  # Single-argument print(...) behaves the same on Python 2 and Python 3.
  print("%d sequence(s) found" % len(order))
  print(order)
  print('\n')
  print(sequences)
# Parse example.fasta; FASTA prints the number of headers found, the list of
# record names, and the name -> sequence dictionary.
FASTA("example.fasta")


1 sequence(s) found
['gi|110559334|gb|DQ681069.1| Shrimp white spot syndrome virus from India VP28 (VP28) gene, complete cds']


{'gi|110559334|gb|DQ681069.1| Shrimp white spot syndrome virus from India VP28 (VP28) gene, complete cds': 'ATGGATCTTTCTTTCACTCTTTCGGTCGTGTCGGCCATCCTCGCCATCACTGCTGTGATTGCTGTATTTATTGTGATTTTTAGGTATCACAACACTGTGACCAAGACCATCGAAACCCACACAGACAATATCGAGACAAACATGGATGAAAACCTCCGCATTCCTGTGACTGCTGAGGTTGGATCAGGCTACTTCAAGATGACTGATGTGTCCTTTGACAGCGACACCTTGGGCAAAATCAAGATCCGCAATGGAAAGTCTGATGCACAGATGAAGGAAGAAGATGCGGATCTTGTCATCACTCCCGTGGAGGGCCGAGCACTCGAAGTGACTGTGGGGCAGAATCTCACCTTTGAGGGAACATTCAAGGTGTGGAACAACACATCAAGAAAGATCAACATCACTGGTATGCAGATGGTGCCAAAGATTAACCCATCAAAGGCCTTTGTCGGTAGCTCCAACACCTCCTCCTTCACCCCCGTCTCTATTGATGAGGATGAAGTTGGCACCTTTGTGTGTGGTACCACCTTTGGCGCACCAATTGCAGCTACCGCCGGTGGAAATCTTTTCGACATGTACGTGCACGTCACCTACTCTGGCACTGAGACCGAGTAA'}

In [30]:


In [29]:


In [ ]: