In [23]:
# Input file of users; it is consumed line by line further down.
fu = open('users-london.csv')
In [24]:
# Output file that receives one line per renumbered user.
fout = open('users-london-renum.txt', mode='w')
In [25]:
# Mapping from original user id to its new id; filled while reading ``fu``.
idmap = dict()
In [26]:
# Next new id to hand out; the loop over ``fu`` uses it and then increments it.
newid = 0
In [27]:
# Give every user read from ``fu`` a consecutive new id (starting at the
# current value of ``newid``), remember the original -> new mapping in
# ``idmap`` and write one output line per user to ``fout``.
for line in fu:
    # strip() removes '\n' as well as '\r\n' and, unlike the fixed-width
    # slice line[:-1], does not eat the last digit of the final record when
    # the file has no trailing newline.
    record = line.strip()
    if not record:
        continue  # tolerate blank lines, e.g. an empty line at end of file
    uid, uname = map(int, record.split(','))
    idmap[uid] = newid
    # NOTE(review): the new id is written to both output columns and
    # ``uname`` is parsed but never used — confirm this is the intended
    # output format.
    fout.write('%d,%d\n' % (newid, newid))
    newid += 1
In [28]:
# Done with the user files: release both handles (closing the output file
# also flushes any buffered writes).
for _handle in (fu, fout):
    _handle.close()
In [13]:
# Friendship edge list to be filtered; read line by line further down.
ffr = open('FoursquareFriendship.csv')
In [14]:
ffr.readline() # Skip the header: consumes the first line so only data rows remain to be read
Out[14]:
In [15]:
# Output file for the filtered, renumbered friendship pairs.
ffrnew = open('FoursquareFriendship-london.csv', mode='w')
In [16]:
# Keep only friendships whose two endpoints both appear in ``idmap`` and
# write them to ``ffrnew`` using the new ids.
org_uids = set(idmap)  # original ids that were given a new id
for line in ffr:
    # strip() copes with '\n', '\r\n' and a missing final newline. The old
    # fixed-width slice line[:-2] silently dropped the last digit of the
    # second id whenever the line terminator was not exactly two characters.
    record = line.strip()
    if not record:
        continue  # tolerate blank lines
    u1, u2 = map(int, record.split(','))
    if u1 in org_uids and u2 in org_uids:
        ffrnew.write('%d,%d\n' % (idmap[u1], idmap[u2]))
In [17]:
# Done with the friendship files: release both handles (closing the output
# file also flushes any buffered writes).
for _handle in (ffr, ffrnew):
    _handle.close()
In [18]:
# Check-in records to be rewritten; header first, then one row per line.
fcheck = open('FoursquareCheckins20110101-20111231_near_london.csv')
In [19]:
# Output file for the check-ins with renumbered user ids.
fcheck_new = open('london/FoursquareCheckins20110101-20111231_near_london-renum.csv', mode='w')
In [20]:
# Rewrite header: the first input line is copied to the output unchanged.
header = fcheck.readline()
fcheck_new.write(header)
In [21]:
# Copy every check-in row to ``fcheck_new``, replacing the original user id
# in the first column with its new id from ``idmap``; the remaining four
# columns are passed through as text.
for line in fcheck:
    # rstrip('\n') instead of line[:-1]: a final row without a trailing
    # newline would otherwise lose the last character of ``loc``.
    record = line.rstrip('\n')
    if not record.strip():
        continue  # tolerate blank lines, e.g. an empty line at end of file
    us, lat, lng, tm, loc = record.split(',')
    # idmap[...] raises KeyError for a user id that was never renumbered.
    fcheck_new.write('%d,%s,%s,%s,%s\n' % (idmap[int(us)], lat, lng, tm, loc))
In [22]:
# Done with the check-in files: release both handles (closing the output
# file also flushes any buffered writes).
for _handle in (fcheck, fcheck_new):
    _handle.close()
In [ ]: