In [1]:
import os
import copy 
from rumormill import archive

from pprint import pprint
from bs4 import BeautifulSoup
from dateutil.parser import parse

In [4]:
# Re-import the archive module so this cell runs against its current source.
reload(archive)

# Choose the two page revisions to compare; both values show up in the
# query string of the page-history URL printed by the get_page() cell.
archive.PARAMS.update(oldver=11, newver=12)

# Leave the full parameter dict as the cell's displayed value.
archive.PARAMS


Out[4]:
{'compare': 'Compare',
 'diff_style': 'unidiff',
 'history_offset': 0,
 'history_pagesize': 25,
 'newver': 12,
 'oldver': 11,
 'page': 'Rumor+Mill',
 'paginate': 'off',
 'show_all_versions': 'y'}

In [5]:
# Fetch the page using the current archive.PARAMS. The URL shown beneath this
# cell is emitted during the call (presumably the address that was requested).
# Later cells read the parsed document from `result.soup`.
result = archive.get_page()


http://www.astrobetter.com/wiki/tiki-pagehistory.php?history_offset=0&compare=Compare&paginate=off&history_pagesize=25&oldver=11&newver=12&diff_style=unidiff&show_all_versions=y&page=Rumor+Mill

In [68]:
# Re-import archive so the call below runs against the module's current source.
reload(archive)
# Pull revision metadata out of the fetched page; the displayed value is a
# dict with 'comment', 'date', 'user' and 'version' keys.
archive.get_info(result)


Out[68]:
{'comment': u'\nFixed headers, shortened add description',
 'date': datetime.datetime(2014, 8, 18, 15, 8, tzinfo=tzlocal()),
 'user': u'jlu',
 'version': 11}

In [67]:
# Narrow the parsed page down in two steps: first the <div> whose style is
# 'text-align:center;', then the table with class 'formcolor' inside it.
# (result.soup is presumably a BeautifulSoup tree -- confirm in archive.)
centered_div = result.soup.find('div', {'style': ['text-align:center;']})
soup = centered_div.find('table', {'class': 'formcolor'})

# Disabled further step of the lookup chain:
#     soup = soup.find('strong').findParents()[2]

# Disabled debug loop that lists the text of every table cell:
# for s in soup.find_all('td'):
#     print 'o', s.text

In [ ]: