У меня проблемы со сбором данных через Twitter API. Я использую правильные ключи и вызываю tweet = api.get_status(tweet_id, tweet_mode='extended'),
но всё равно получил только 886 записей вместо 2345. Вот мой код:
# Twitter API for more data (save to local file)
# Credentials are left blank here; fill them in before running.
consumer_key = ''
consumer_secret = ''
access_token = ''
access_secret = ''

# Authenticate with the consumer key/secret and the access token/secret.
auth = tweepy.OAuthHandler(consumer_key, consumer_secret)
auth.set_access_token(access_token, access_secret)

# Build the client that the download loop calls as `api`.
# wait_on_rate_limit=True makes tweepy sleep until the rate-limit window
# resets instead of raising, so a long run of lookups is not cut short.
# NOTE(review): the standard v1.1 limit for statuses/show is presumably
# 900 requests per 15-minute window, which would explain a run stopping at
# roughly 886 successful downloads -- confirm against the Twitter docs.
api = tweepy.API(auth, wait_on_rate_limit=True)
# Store data on tweet_json.txt: one JSON document per line.
# Ids whose lookup failed are collected in `failed_ids` (id -> exception) so
# they can be inspected or retried after the run.
failed_ids = {}
with open('tweet_json.txt', 'w') as outfile:
    for tweet_id in twitter_archive['tweet_id']:
        try:
            # Only the API call is guarded; a failure while writing the file
            # should surface instead of being reported as a tweet error.
            tweet = api.get_status(tweet_id, tweet_mode='extended')
        except Exception as err:
            # `Exception` (not a bare `except:`) keeps Ctrl-C / SystemExit
            # working. Printing the reason makes it possible to tell a
            # deleted tweet from a rate-limit or authentication failure.
            print('ERROR: Error on tweet id {}'.format(tweet_id))
            print('       reason: {!r}'.format(err))
            failed_ids[tweet_id] = err
            continue
        # Convert to JSON and write
        json.dump(tweet._json, outfile)
        outfile.write("\n")
# Keep only a few fields of each stored tweet and load them into a DataFrame.
elements_to_save = ['id', 'favorite_count', 'retweet_count']

# Build one reduced dict per line of tweet_json.txt (one JSON document per line).
data = []
with open('tweet_json.txt', 'r') as readfile:
    for raw_line in readfile:
        tweet_dict = json.loads(raw_line)
        # Project the full tweet down to the selected keys.
        data.append({key: tweet_dict[key] for key in elements_to_save})

# Convert the list of row dicts to a DataFrame.
df_tweet_info = pd.DataFrame.from_dict(data)