This repository was archived by the owner on Sep 8, 2023. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathutils.py
82 lines (64 loc) · 2.42 KB
/
utils.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
import requests
import time
import json
import redis
r = redis.Redis(host='localhost', port=6379, db=0)
API_KEY = 'a3706dc738a588bc685dc8acc648d076c7aeddf3'
headers = {
'Authorization': 'Token {API_KEY}'.format(API_KEY=API_KEY)
}
def split_list(a_list):
half = len(a_list)//2
return a_list[:half], a_list[half:]
def cache_data_save(key, data):
r.set(key, json.dumps(data))
def api_request(ids):
query_params = '?include_followers=1&twitter_ids={array}'.format(array=json.dumps(ids).replace(' ', ''))
batch_req = requests.get('https://api.hive.one/api/v1/influencers/batch/' + query_params, headers=headers)
return batch_req
def batch_request(ids):
batch_req = api_request(ids)
print(batch_req.url)
print(batch_req.status_code)
if batch_req.status_code == 200:
return batch_req.json()['data']['success']
elif batch_req.status_code == 504:
print("having to split chunks")
data = []
for chunk in split_list(ids):
batch_req = api_request(chunk)
data += batch_req.json()['data']['success']
return data
else:
raise Exception('ERROR')
def get_all_hive_profiles():
available_resp = requests.get('https://api.hive.one/api/v1/influencers/', headers)
available_array = available_resp.json()['data']['available']
available_chunks = [available_array[i:i + 20] for i in range(0, len(available_array), 20)]
iter = 0
for chunk in available_chunks:
chunk_start_time = time.time()
print("ITERATION", iter)
print((iter / len(available_chunks)) * 100, "%")
try:
try:
data = batch_request([int(item[0]) for item in chunk])
except Exception:
data = batch_request([int(item[0]) for item in chunk])
except:
pass
for profile in data:
key = '/api/v1/influencers/screen_name/{screen_name}/'.format(screen_name=profile['screenName'])
cache_data = {
"cached_on": int(time.time()),
"data": data
}
cache_data_save(key, cache_data)
print('Got data for chunk')
chunk_end_time = time.time()
chunk_time_taken = chunk_end_time - chunk_start_time
if chunk_time_taken < 0.5:
sleep_time = 0.5 - chunk_time_taken
print('sleeping for', sleep_time)
time.sleep(sleep_time)
iter += 1