-
Notifications
You must be signed in to change notification settings - Fork 2
/
data_collector.py
102 lines (65 loc) · 2.75 KB
/
data_collector.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
import typing
import logging
import time
from database import Hdf5Client
from utils import *
from exchanges.binance import BinanceClient
from exchanges.ftx import FtxClient
logger = logging.getLogger()
def collect_all(client: typing.Union[BinanceClient, FtxClient], exchange: str, symbol: str):
h5_db = Hdf5Client(exchange)
h5_db.create_dataset(symbol)
oldest_ts, most_recent_ts = h5_db.get_first_last_timestamp(symbol)
# Initial Request
if oldest_ts is None:
data = client.get_historical_data(symbol, end_time=int(time.time() * 1000) - 60000)
if len(data) == 0:
logger.warning("%s %s: no initial data found", exchange, symbol)
return
else:
logger.info("%s %s: Collected %s initial data from %s to %s", exchange, symbol, len(data),
ms_to_dt(data[0][0]), ms_to_dt(data[-1][0]))
oldest_ts = data[0][0]
most_recent_ts = data[-1][0]
h5_db.write_data(symbol, data)
data_to_insert = []
# Most recent data
while True:
data = client.get_historical_data(symbol, start_time=int(most_recent_ts + 60000))
if data is None:
time.sleep(4) # Pause in case an error occurs during the request
continue
if len(data) < 2:
break
data = data[:-1]
data_to_insert = data_to_insert + data
if len(data_to_insert) > 10000:
h5_db.write_data(symbol, data_to_insert)
data_to_insert.clear()
if data[-1][0] > most_recent_ts:
most_recent_ts = data[-1][0]
logger.info("%s %s: Collected %s recent data from %s to %s", exchange, symbol, len(data),
ms_to_dt(data[0][0]), ms_to_dt(data[-1][0]))
time.sleep(1.1)
h5_db.write_data(symbol, data_to_insert)
data_to_insert.clear()
# Older data
while True:
data = client.get_historical_data(symbol, end_time=int(oldest_ts - 60000))
if data is None:
time.sleep(4) # Pause in case an error occurs during the request
continue
if len(data) == 0:
logger.info("%s %s: Stopped older data collection because no data was found before %s", exchange, symbol,
ms_to_dt(oldest_ts))
break
data_to_insert = data_to_insert + data
if len(data_to_insert) > 10000:
h5_db.write_data(symbol, data_to_insert)
data_to_insert.clear()
if data[0][0] < oldest_ts:
oldest_ts = data[0][0]
logger.info("%s %s: Collected %s older data from %s to %s", exchange, symbol, len(data),
ms_to_dt(data[0][0]), ms_to_dt(data[-1][0]))
time.sleep(1.1)
h5_db.write_data(symbol, data_to_insert)