
import cPickle
import nltk
import twitter

# Shared search client used for every query below.
# NOTE(review): this targets the "search.twitter.com" domain -- confirm that
# endpoint is still served before relying on this script.
t_search = twitter.Twitter(domain="search.twitter.com")


def _dump_pickle(obj, path):
    """Pickle *obj* to *path*, closing the file even if dumping fails."""
    with open(path, "wb") as handle:
        cPickle.dump(obj, handle)


def _collect_tweets(query, file_prefix, pages=5, per_page=100):
    """Search for *query*, report the word count and pickle the results.

    Requests result pages 1..*pages* (``rpp=per_page`` each) from the
    module-level ``t_search`` client, flattens every page's ``'results'``
    list, extracts each tweet's ``'text'`` and splits the texts on
    whitespace.  Three pickles are written next to the script:

    * ``<file_prefix>.tweets.pickle`` -- the flattened result entries
    * ``<file_prefix>.ttext.pickle``  -- the ``'text'`` of each entry
    * ``<file_prefix>.words.pickle``  -- the whitespace-separated words

    Returns the tuple ``(results, tweets, texts, words)`` where *results*
    is the list of raw per-page responses.
    """
    results = [t_search.search(q=query, rpp=per_page, page=page)
               for page in range(1, pages + 1)]

    tweets = [tweet for result in results for tweet in result['results']]
    texts = [tweet['text'] for tweet in tweets]

    words = []
    for text in texts:
        words.extend(text.split())

    # A single pre-formatted string prints identically whether ``print`` is
    # the Python 2 statement or the function.
    print("Number of words in %s related tweets: %d" % (query, len(words)))

    _dump_pickle(tweets, file_prefix + ".tweets.pickle")
    _dump_pickle(texts, file_prefix + ".ttext.pickle")
    _dump_pickle(words, file_prefix + ".words.pickle")

    return results, tweets, texts, words


madonna_results, mtweets, mttext, mwords = _collect_tweets(
    "Madonna", "versus.madonna")

elton_results, etweets, ettext, ewords = _collect_tweets(
    "Elton John", "versus.elton")

