This repository was archived by the owner on Nov 1, 2023. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathfetchTWEETS.py
72 lines (56 loc) · 2.33 KB
/
fetchTWEETS.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
# -*- coding: utf-8 -*-
"""
Created on Thu Dec 14 15:59:31 2017
@author: vase & satyam
"""
import sys
import tweepy
import time
process_status = 0
access_key = ""
access_secret = ""
consumer_key = ""
consumer_secret = ""
auth = tweepy.OAuthHandler(consumer_key, consumer_secret)
auth.set_access_token(access_key, access_secret)
api = tweepy.API(auth)
class CustomStreamListener(tweepy.StreamListener):
global i #variable for counting saved tweets
global err #variable for not USA countries
i = 0
err = 0
def on_status(self, status):
global i
global err
if i < 20000:
if status.lang == 'en': #we need only English language
if status.place.country == 'United States': #filter for USA
f = open("tweets.txt", "a")
try:
f.write((status.text.replace("\n", "")).encode("utf8")) #saving text parameter & stripping of \n which might have been added by the user
except AttributeError:
print ('error -- ') #Witnessed an instance of Attribute error, purposely declared to know it it existed
f.write("\n") #as we've already stripped of \n now adding \n to the end of each tweet (text)
f.close()
for hashtag in status.entities['hashtags']:
f = open("hashtags.txt", "a")
try:
f.write(hashtag['text'].encode("utf8")) #saving hashtags
except:
raise
f.write("\n")
f.close()
i = i + 1
else:
sys.exit()
def on_error(self, status_code):
print >> sys.stderr, 'Encountered error with status code:', status_code
return True #Don't kill the stream
def on_timeout(self):
print >> sys.stderr, 'Timeout...'
return True #Don't kill the stream
def testrun():
sapi = tweepy.streaming.Stream(auth, CustomStreamListener()) #create Stream
sapi.filter(locations=[-122.995004, 32.323198, -67.799695, 49.893813]) #limit only for USA
return true
process_status=1