In [1]:
!wget http://web.mta.info/developers/data/nyct/turnstile/turnstile_150404.txt


--2015-04-07 11:47:17--  http://web.mta.info/developers/data/nyct/turnstile/turnstile_150404.txt
Resolving web.mta.info... 63.88.100.184, 63.88.100.202
Connecting to web.mta.info|63.88.100.184|:80... connected.
HTTP request sent, awaiting response... 200 OK
Length: unspecified [text/plain]
Saving to: 'turnstile_150404.txt'

turnstile_150404.tx     [    <=>               ]  23.91M  3.56MB/s   in 6.9s   

2015-04-07 11:47:25 (3.46 MB/s) - 'turnstile_150404.txt' saved [25071566]


In [2]:
!wget http://web.mta.info/developers/data/nyct/turnstile/turnstile_150321.txt


--2015-04-07 11:47:57--  http://web.mta.info/developers/data/nyct/turnstile/turnstile_150321.txt
Resolving web.mta.info... 63.88.100.170, 63.88.100.184
Connecting to web.mta.info|63.88.100.170|:80... connected.
HTTP request sent, awaiting response... 200 OK
Length: unspecified [text/plain]
Saving to: 'turnstile_150321.txt'

turnstile_150321.tx     [   <=>                ]  23.92M  2.04MB/s   in 9.1s   

2015-04-07 11:48:07 (2.62 MB/s) - 'turnstile_150321.txt' saved [25079688]


In [22]:
import csv
with open("turnstile_150404.txt", "r") as turn_data:
    reader=csv.reader(turn_data)
    my_hash={}
    for row in reader:
        key = row[0:4]
        val = row[4:-1]
        if my_hash[key] != None:
            my_hash[key].append( [ val ] )
        else:
            my_hash[key] = [ [ val ] ] 
print my_hash


---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
<ipython-input-22-79c5917155e5> in <module>()
      6         key = row[0:4]
      7         val = row[4:-1]
----> 8         if my_hash[key] != None:
      9             my_hash[key].append( [ val ] )
     10         else:

TypeError: unhashable type: 'list'

In [14]:
with open("formatted.csv", "w") as formed:
    reader = csv.reader(formed)

In [ ]: