-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathheliumapi.py
434 lines (357 loc) · 13.8 KB
/
heliumapi.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
import atexit
import json
import logging
import math
import sqlite3
import statistics
from datetime import date, datetime, timedelta, timezone
import requests
from dateutil.parser import parse as dateparse
# Module-wide logger, named after this module.
log = logging.getLogger(__name__)

# Cut-off dates used by this module (naive datetimes, no tzinfo attached).
# Rewards are not looked up before the chain start, and oracle prices before
# the oracle start are reported as 0.
HELIUM_BLOCKCHAIN_START = datetime(2017, 7, 29)
HELIUM_ORACLE_START = datetime(2020, 6, 10)

# Conversion factor between bones and HNT.
BONES_PER_HNT = 100_000_000

# Base URL every REST request in this module is built from.
API_URL = "https://api.helium.io/v1"

# Default User-Agent string.
# NOTE(review): the contact part reads "[email protected]", which looks like a
# redacted address -- confirm the intended value.
REQUESTS_USER_AGENT = "helium-dailypricer/1.0 (https://github.com/kellybyrd/helium-dailypricer) [email protected]"

# Connection to the sqlite cache (assigned during module init) and its file name.
_DB = None
_DB_FILE = "cache.sqlite"
def _close_db():
    """
    Close the module-level cache connection if one has been opened.

    Registered with atexit during module init so the connection is released
    when the interpreter exits.
    """
    if _DB is None:
        return
    _DB.close()
# MODULE INIT: runs at import time. Opens the sqlite cache file named by
# _DB_FILE and makes sure both cache tables exist.
_DB = sqlite3.connect(_DB_FILE)
cur = _DB.cursor()
# Oracle prices: one row per block (block is the primary key); price_bones
# defaults to 0 when not supplied.
cur.execute(
"CREATE TABLE IF NOT EXISTS OraclePrices ("
"block INTEGER PRIMARY KEY, "
"timestamp TEXT NOT NULL, "
"price_bones INTEGER DEFAULT 0);"
)
# Daily reward sums: at most one row per (timestamp, address) pair, enforced by
# the UNIQUE constraint.
cur.execute(
"CREATE TABLE IF NOT EXISTS DailyRewards ("
"timestamp TEXT NOT NULL, "
"address TEXT NOT NULL, "
"sum_bones INTEGER NOT NULL, "
"UNIQUE(timestamp, address) "
");"
)
# Close the connection when the interpreter exits.
atexit.register(_close_db)
# END MODULE INIT
def _daterange(start_date, end_date):
    """
    Yield consecutive days starting at start_date and stopping before end_date.

    Nothing is yielded when end_date is not after start_date.
    """
    total_days = int((end_date - start_date).days)
    offset = 0
    while offset < total_days:
        yield start_date + timedelta(offset)
        offset += 1
def _api_request(url, query_params, useragent):
    """
    Fetch JSON from a helium api URL, following paged results as described in
    the "Cursors" section here:
    https://docs.helium.com/api/blockchain/introduction

    Args:
        url: Full URL to GET.
        query_params: Dict of query parameters, or None. The dict is copied, so
            the caller's object is never modified.
        useragent: Value sent in the user-agent request header.

    Returns:
        * When the response's "data" is a JSON array: a list with the "data"
          items of every page merged together.
        * Otherwise: the "data" value of the response as-is (None when the key
          is missing).
        * If a request fails: whatever was collected so far, which is an empty
          list when the very first request fails.

    Note: This assumes the response json has "data" and optionally "cursor"
    top level keys. Errors are never raised to the caller; they are logged at
    debug level and end the paging loop.
    """
    # Work on a private copy so adding "cursor" never leaks into the caller's dict.
    params = dict() if query_params is None else dict(query_params)
    headers = {"user-agent": useragent}
    ret = list()
    cursor = None
    # repeat-until cursor is None
    while True:
        if cursor is not None:
            params["cursor"] = cursor
        try:
            resp = requests.get(url, params=params, headers=headers)
            resp.raise_for_status()
            # Named "payload" so the imported json module is not shadowed.
            payload = resp.json()
            data = payload.get("data")
            if isinstance(data, list):
                ret.extend(data)
                cursor = payload.get("cursor")
                log.debug(f"New cursor is : {cursor}")
            else:
                # Not a JSON array, so not a paged result
                ret = data
                cursor = None
        except Exception as ex:
            # Deliberately broad and best-effort: callers rely on a falsy result
            # for failures. This is debug level because sometimes we
            # intentionally expect 404.
            log.debug(f"Error: {ex}")
            # This will break us out of the while loop
            cursor = None
        if cursor is None:
            break
    return ret
def _cache_oracle_price(ts, useragent):
    """
    Fetch the oracle price in effect at ts from the API and store it in the DB.

    Two requests are made: one for the block height at ts, then one for the
    oracle price at that block. The price is saved under the timestamp ts.
    Any failure along the way is logged at error level and otherwise ignored.
    """
    height_url = f"{API_URL}/blocks/height"
    height_params = {"max_time": ts.isoformat()}
    try:
        log.debug(f"_cache_oracle_price: fetching block for {ts}")
        height_info = _api_request(height_url, height_params, useragent)
        log.debug(f"_cache_oracle_price: ret {height_info}")
        height = height_info["height"]

        log.debug(f"_cache_oracle_price: fetching price for {height}")
        price_info = _api_request(f"{API_URL}/oracle/prices/{height}", None, useragent)
        log.debug(f"_cache_oracle_price: caching price {price_info}")
        _db_price_put(price_info["block"], ts, price_info["price"])
    except Exception as ex:
        log.error(f"_cache_oracle_price: Error: {ex}")
def _db_price_at_time(as_of_time):
    """
    Look up the cached Oracle price whose stored timestamp equals as_of_time.

    Returns:
        A dict with "block", "timestamp" and "price" keys. The query is an
        aggregate, so a row always comes back; when nothing in the cache
        matches, all three values are None.
    """
    log.debug(f"_db_price_at_time: looking up record for {as_of_time}")
    cursor = _DB.cursor()
    cursor.execute(
        "SELECT block, max(timestamp), price_bones FROM OraclePrices WHERE timestamp = :time ",
        {"time": as_of_time},
    )
    row = cursor.fetchone()
    log.debug(f"_db_price_at_time: found {row}")
    return {"block": row[0], "timestamp": row[1], "price": row[2]}
def _db_price_put_many(prices):
    """
    Save several Oracle price records to the DB.

    Each record is a dict with "block", "timestamp" and "price" keys. Rows are
    written with REPLACE, so a block that is already cached is overwritten
    instead of tripping the primary-key constraint. Work is committed once per
    batch of CHUNK_SIZE rows rather than once per row.
    """
    CHUNK_SIZE = 50
    sql = "REPLACE INTO OraclePrices VALUES (:block, :timestamp, :price_bones)"
    cursor = _DB.cursor()
    # Walk the list in CHUNK_SIZE-sized windows.
    for first in range(0, len(prices), CHUNK_SIZE):
        for record in prices[first : first + CHUNK_SIZE]:
            row = {
                "block": record["block"],
                "timestamp": record["timestamp"],
                "price_bones": record["price"],
            }
            cursor.execute(sql, row)
        # commit per chunk, not per execute.
        _DB.commit()
def _db_price_put(block, timestamp, price):
    """
    Store one Oracle price row and commit.

    Uses REPLACE, so an existing row for the same block is overwritten.
    """
    sql = "REPLACE INTO OraclePrices VALUES (:block, :timestamp, :price_bones)"
    row = {"block": block, "timestamp": timestamp, "price_bones": price}
    cursor = _DB.cursor()
    cursor.execute(sql, row)
    _DB.commit()
def _db_price_max_time():
    """
    Return the date of the newest oracle price timestamp in the DB.

    Returns None when the OraclePrices table has no rows.
    """
    cursor = _DB.cursor()
    cursor.execute("SELECT MAX(timestamp) FROM OraclePrices;")
    newest = cursor.fetchone()[0]
    if newest is None:
        return None
    return dateparse(newest).date()
def _db_reward_fetch(address, start, stop):
    """
    Read cached daily rewards for address from the DB, oldest first.

    Only the cache is consulted here; nothing is requested from the REST API.
    Rows are selected where timestamp is BETWEEN the ISO strings of start and
    stop.

    Returns:
        A list of dicts with "timestamp", "address" and "sum" keys.
    """
    query = (
        "SELECT timestamp, address, sum_bones FROM DailyRewards "
        "WHERE address=:addr AND "
        "timestamp BETWEEN :start AND :stop "
        "ORDER BY timestamp ASC;"
    )
    cursor = _DB.cursor()
    cursor.execute(
        query,
        {"addr": address, "start": start.isoformat(), "stop": stop.isoformat()},
    )
    return [
        {"timestamp": row[0], "address": row[1], "sum": row[2]}
        for row in cursor.fetchall()
    ]
def _db_reward_put_many(address, rewards):
    """
    Save several daily reward records for address to the DB.

    Each record is a dict with "timestamp" and "sum" keys. Callers deliberately
    re-fetch periods that may already be cached, so rows are written with
    REPLACE to overwrite duplicates instead of violating the
    UNIQUE(timestamp, address) constraint. Work is committed once per batch of
    CHUNK_SIZE rows rather than once per row.
    """
    CHUNK_SIZE = 50
    sql = "REPLACE INTO DailyRewards VALUES (:timestamp, :address, :sum_bones)"
    cursor = _DB.cursor()
    # Walk the list in CHUNK_SIZE-sized windows.
    for first in range(0, len(rewards), CHUNK_SIZE):
        for record in rewards[first : first + CHUNK_SIZE]:
            row = {
                "timestamp": record["timestamp"],
                "address": address,
                "sum_bones": record["sum"],
            }
            cursor.execute(sql, row)
        # commit per chunk, not per execute.
        _DB.commit()
def _db_reward_put(timestamp, address, sum_bones):
    """
    Store one daily reward total and commit.

    Uses REPLACE so that a row already present for the same
    (timestamp, address) pair is overwritten rather than raising a constraint
    violation.
    """
    sql = "REPLACE INTO DailyRewards VALUES (:timestamp, :address, :sum_bones)"
    row = {"timestamp": timestamp, "address": address, "sum_bones": sum_bones}
    cursor = _DB.cursor()
    cursor.execute(sql, row)
    _DB.commit()
def is_validator(address, useragent):
    """
    Report whether the helium API returns validator data for the address.

    True when the /validators/<address> request yields a truthy result,
    False otherwise (including when the request fails).
    """
    lookup = _api_request(f"{API_URL}/validators/{address}", None, useragent)
    return bool(lookup)
def is_hotspot(address, useragent):
    """
    Report whether the helium API returns hotspot data for the address.

    True when the /hotspots/<address> request yields a truthy result,
    False otherwise (including when the request fails).
    """
    lookup = _api_request(f"{API_URL}/hotspots/{address}", None, useragent)
    return bool(lookup)
def _db_reward_max_min(address):
    """
    Find the oldest and newest cached reward dates for an address.

    Only rows with sum_bones > 0 are considered.

    Returns:
        A (oldest, newest) tuple of dates -- note the order is min first, then
        max. Each element is None when no qualifying row exists.
    """
    queries = (
        "SELECT MIN(timestamp) FROM DailyRewards "
        "WHERE address=:address AND sum_bones > 0;",
        "SELECT MAX(timestamp) FROM DailyRewards "
        "WHERE address=:address and sum_bones > 0;",
    )
    cursor = _DB.cursor()
    bounds = []
    for sql in queries:
        cursor.execute(sql, {"address": address})
        raw = cursor.fetchone()[0]
        bounds.append(None if raw is None else dateparse(raw).date())
    return (bounds[0], bounds[1])
def _api_reward_fetch(address, start, stop, useragent):
    """
    Fetch daily reward sums for address from the API and cache them in the DB.

    The address is first classified as a validator or a hotspot to pick the
    right rewards endpoint; paging is handled by _api_request.

    Args:
        address: Hotspot or validator address.
        start: Start of the range; its isoformat() is sent as min_time.
        stop: End of the range; its isoformat() is sent as max_time.
        useragent: Value sent in the user-agent request header.

    Returns:
        The list of reward records that was written to the DB. Empty when the
        address is neither a validator nor a hotspot, or when the request
        failed or did not produce a list.
    """
    if is_validator(address, useragent):
        url = f"{API_URL}/validators/{address}/rewards/sum"
    elif is_hotspot(address, useragent):
        url = f"{API_URL}/hotspots/{address}/rewards/sum"
    else:
        log.error("Address is not a hotspot or validator")
        return list()

    params = {
        "max_time": stop.isoformat(),
        "min_time": start.isoformat(),
        "bucket": "day",
    }
    log.debug(f"_api_request: {url} {params} {useragent}")

    try:
        ret = _api_request(url, params, useragent)
    except Exception as ex:
        # Stay best-effort, but don't swallow KeyboardInterrupt/SystemExit the
        # way a bare except would, and leave a trace of what went wrong.
        log.error(f"_api_reward_fetch: Error: {ex}")
        ret = list()

    # _api_request hands back the raw "data" value (possibly None or a dict)
    # when the response is not a JSON array; only a list can be cached.
    if not isinstance(ret, list):
        log.error(f"_api_reward_fetch: unexpected non-list result: {ret}")
        ret = list()

    log.debug(f"_api_reward_fetch: putting {len(ret)} records in the DB")
    _db_reward_put_many(address, ret)
    return ret
def oracle_price_for_day(day, useragent):
    """
    Return the closing Helium oracle price for a given day, i.e. the price in
    effect one microsecond before the following midnight. Ex:
        If day is 2021-03-27, the lookup time is 2021-03-27T23:59:59.999999

    The value is read from the DB cache (the price_bones column). On a cache
    miss it is fetched through the API, cached, and read again. 0 is returned
    for days before the oracles started and when no price could be obtained.
    """
    END_OF_DAY = timedelta(days=1, microseconds=-1)

    # The oracle price API is keyed by block rather than by time range, so a
    # miss is resolved by finding the block for this time and then asking for
    # the oracle price at that block. The DB is always tried first.
    closing_ts = datetime.combine(day, datetime.min.time()) + END_OF_DAY

    # All prices before the start of the oracles are 0
    if closing_ts < HELIUM_ORACLE_START:
        return 0

    log.debug(f"oracle_price_for_day: Looking in DB for price at {closing_ts}")
    price = _db_price_at_time(closing_ts)["price"]

    if price is None:
        log.debug(f"oracle_price_for_day: {closing_ts} Not found in DB, fetching")
        _cache_oracle_price(closing_ts, useragent)
        log.debug(f"oracle_price_for_day: {closing_ts} fetched, looking up again")
        price = _db_price_at_time(closing_ts)["price"]
        log.debug(f"oracle_price_for_day: ret {price} in db")

    if price is None:
        log.debug(f"oracle_price_for_day: ret is none returning 0")
        price = 0

    log.debug(f"oracle_price_for_day: returning {price}")
    return price
def earnings(address, start, stop, useragent):
    """
    Get the daily earnings between start and stop for the given
    hotspot/validator address.

    Args:
        address: Hotspot or validator address.
        start: First day wanted, as a date. Clamped to the start of the chain.
        stop: End of the range, as a date.
        useragent: Value sent in the user-agent header of API requests.

    Returns
        A list of dicts, one dict for each cached daily reward row.
        Will return an empty list if the address is not found or no earnings
        were found.

    NOTE(review): the range is intended as [start, stop); the final read uses
    the cache's BETWEEN query on ISO date strings -- confirm the boundary
    behaviour against the stored timestamp format.
    """
    # Don't bother with earnings before the start of the chain
    start = max(start, HELIUM_BLOCKCHAIN_START.date())

    # Overlap applied to API fetch ranges so they reach into what is already
    # cached. The cached bounds are dates, and date +/- timedelta ignores
    # anything smaller than a day, so the overlap has to be a whole day to
    # have any effect. Re-fetched days are harmless: rows are written with
    # REPLACE.
    OVERLAP = timedelta(days=1)

    # The overall strategy is to ensure no holes in the date range of the db cache.
    # To do this we always try to extend the cache, even if the start/stop params do
    # not overlap with the cached data.
    # * Get db_min and db_max
    # * If start < db_min: api_fetch for start to db_min(+overlap)
    #   Insert these into db. At this point db range is start to db_max
    # * If stop > db_max: api_fetch for db_max(-overlap) to stop
    #   Insert these into db. At this point db range will be at least start to stop.
    # * Read start to stop from DB
    (db_min_ts, db_max_ts) = _db_reward_max_min(address)
    if db_min_ts is None:
        # Nothing in the DB yet
        log.debug(f"DB: rewards empty {start} - {stop} ")
        _api_reward_fetch(address, start, stop, useragent)
    else:
        if start < db_min_ts:
            # Need data earlier than range in db
            fetch_stop = db_min_ts + OVERLAP
            log.debug(f"DB: rewards fetch before {start} - {fetch_stop}")
            _api_reward_fetch(address, start, fetch_stop, useragent)
        if stop > db_max_ts:
            # Need data later than range in db
            fetch_start = db_max_ts - OVERLAP
            log.debug(f"DB: rewards fetch after {fetch_start} - {stop}")
            _api_reward_fetch(address, fetch_start, stop, useragent)

    # The DB now covers the time range we need, so fetch it from there.
    return _db_reward_fetch(address, start, stop)