In [27]:
#!/usr/bin/env python
# -*- coding: utf-8 -*-
import tweepy, time, sys, json, requests, random

def check_neotoma():
    ## This function calls the Neotoma API, reads two cached text files,
    ## compares them, and writes any genuinely new records to the tweet queue.
    # Inputs:
    #   1. text file: old_results.json (records already tweeted)
    #   2. text file: to_print.json (records queued for tweeting)
    #   3. JSON call: the Neotoma RecentUploads endpoint
    with open('old_results.json', 'r') as old_file:
        old_calls = json.loads(old_file.read())
    with open('to_print.json', 'r') as print_file:
        to_print = json.loads(print_file.read())
    neotoma = requests.get("http://ceiwin10.cei.psu.edu/NDB/RecentUploads?months=1")
    inp_json = json.loads(neotoma.text)['data']
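    # Each record in the 'data' array is assumed (judging from the fields
    # used below) to include at least: DatasetID, DatabaseName, SiteName,
    # and Investigator.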
    def get_datasets(x):
        did = []
        for y in x:
            did.append(y["DatasetID"])
        return did

    neo_datasets = get_datasets(inp_json)
    old_datasets = get_datasets(old_calls)
    new_datasets = get_datasets(to_print)
    # We now have the numeric dataset IDs for the most recent month of
    # datasets added to Neotoma (neo_datasets), all the ones we've already
    # tweeted (old_datasets), and all the ones in our queue (new_datasets).
    #
    # Next we remove every neo_dataset that is already in old_datasets,
    # then prepend any queued record that is in neither old_datasets nor
    # neo_datasets, and dump the merged list back to to_print.json.
    # (A set-based sketch of the same logic appears in the cell below.)
    #
    # old_results.json only gets rewritten when the tweets go out.
    # Remove the already-tweeted records. Iterate in reverse so deletions
    # don't shift the indices of elements we haven't checked yet; the stop
    # value must be -1 so that index 0 is also checked.
    for i in range(len(neo_datasets) - 1, -1, -1):
        if neo_datasets[i] in old_datasets:
            del inp_json[i]
    # inp_json is now pared down to untweeted records.
    # Next, carry over anything from to_print that still needs tweeting.
    # Any queued dataset ID that is in neither old_datasets nor
    # neo_datasets is inserted at the front of the list, so it is always
    # the first record tweeted:
    for i in range(len(new_datasets)):
        if new_datasets[i] not in old_datasets and new_datasets[i] not in neo_datasets:
            inp_json.insert(0, to_print[i])
    # Now write the queue out to file. old_results.json doesn't get
    # changed until the tweets actually go out.
    with open('to_print.json', 'w') as print_file:
        json.dump(inp_json, print_file)

def post_tweet():
    # Credentials redacted; substitute your own keys from the Twitter
    # app dashboard. (This is tweepy's standard OAuth 1.0a flow.)
    CONSUMER_KEY = 'XXXXXXXXXXXXXXXXXXXXXXXXX'
    CONSUMER_SECRET = 'XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX'
    ACCESS_KEY = 'XXXXXXXXXX-XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX'
    ACCESS_SECRET = 'XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX'
    auth = tweepy.OAuthHandler(CONSUMER_KEY, CONSUMER_SECRET)
    auth.set_access_token(ACCESS_KEY, ACCESS_SECRET)
    api = tweepy.API(auth)
    print('Twitter authenticated\n')
    # Read in the tweet queue and the archive of already-tweeted records:
    with open('to_print.json', 'r') as print_file:
        to_print = json.loads(print_file.read())
    with open('old_results.json', 'r') as old_file:
        old_files = json.loads(old_file.read())
    print('Files opened\n')
    # Now loop through the records:
    while len(to_print) > 0:
        weblink = 'http://apps.neotomadb.org/Explorer/?datasetid=' + str(to_print[0]["DatasetID"])
        line = 'Neotoma welcomes another ' + to_print[0]["DatabaseName"] + ' dataset: ' + \
               to_print[0]["SiteName"] + " from " + to_print[0]["Investigator"] + " " + weblink
        if len(line) > 170:
            # Too long; fall back to a shorter template without the database name.
            line = 'Neotoma welcomes another dataset: ' + to_print[0]["SiteName"] + \
                   " from " + to_print[0]["Investigator"] + " " + weblink
        print(line)
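        # A rendered tweet looks something like (values hypothetical):
        #   "Neotoma welcomes another Pollen dataset: Some Lake from
        #    J. Smith http://apps.neotomadb.org/Explorer/?datasetid=9999"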
        if random.randint(0, 30) == 10:
            # Roughly one tweet in thirty is replaced with a note about the
            # bot itself (the dataset record is still archived below).
            line = 'This is a twitter bot for the Neotoma Paleoecological Database, letting you know what\'s new. http://neotomadb.org managed by @sjgoring'
        api.update_status(status=line)
        # Archive the tweeted record in old_files, then drop it from the queue.
        old_files.append(to_print[0])
        del to_print[0]
        with open('to_print.json', 'w') as print_file:
            json.dump(to_print, print_file)
        with open('old_results.json', 'w') as print_file:
            json.dump(old_files, print_file)
        time.sleep(600)  # Tweet every 10 minutes.
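        # When the queue runs low, ask check_neotoma() for fresh records,
        # then reload the queue file so the new records join this session.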
        if len(to_print) < 5:
            check_neotoma()
            with open('to_print.json', 'r') as print_file:
                to_print = json.loads(print_file.read())

post_tweet()
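A minimal, self-contained sketch of check_neotoma()'s dedup/merge step using
sets, with hypothetical toy records (only the DatasetID field mirrors the real
payload; the values and variable names here are illustrative):
In [ ]:
# Toy stand-ins for the API response, the tweeted archive, and the queue.
fetched = [{"DatasetID": 1}, {"DatasetID": 2}, {"DatasetID": 3}]  # fresh API results
tweeted_ids = {2}                                                 # IDs already tweeted
queued = [{"DatasetID": 4}, {"DatasetID": 1}]                     # current queue

fetched_ids = {r["DatasetID"] for r in fetched}
# Keep fetched records that haven't been tweeted yet.
fresh = [r for r in fetched if r["DatasetID"] not in tweeted_ids]
# Carry over queued records that are neither tweeted nor re-fetched,
# keeping them at the front of the queue, as the bot does.
carryover = [r for r in queued
             if r["DatasetID"] not in tweeted_ids and r["DatasetID"] not in fetched_ids]
print(carryover + fresh)  # [{'DatasetID': 4}, {'DatasetID': 1}, {'DatasetID': 3}]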