-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathconverter.py
65 lines (43 loc) · 1.53 KB
/
converter.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
from glob import glob
from itertools import permutations
from multiprocessing import Pool
from os import listdir, remove
from os.path import basename, join, splitext

from pandas import read_csv, to_datetime
# Currencies of interest; get_ticker_names() pairs them up into ticker names.
CURRENCIES = [
    'btc', 'eth', 'bnb', 'usdt', 'xrp',
    'xlm', 'ada', 'ltc', 'dash', 'xmr',
    'zec', 'etc', 'neo', 'doge', 'mkr',
    'omg', 'zrx', 'dcr', 'qtum',
]
def get_ticker_names(currencies=CURRENCIES):
    """Return all 2-permutations of ``currencies`` as concatenated strings.

    For ``['a', 'b']`` the result is ``['ab', 'ba']``; the order is the one
    produced by ``itertools.permutations``.
    """
    ordered_pairs = permutations(currencies, 2)
    return list(map(''.join, ordered_pairs))
def get_csv_files(tickers):
    """Select the entries of ``data/csv/`` whose ticker name is in ``tickers``.

    Args:
        tickers: Iterable of hashable ticker names (e.g. ``'btceth'``).

    Returns:
        A lazy ``filter`` iterator over the matching names returned by
        ``listdir('data/csv/')`` -- bare file names, not full paths.
    """
    # Snapshot once: membership becomes O(1) per file, and a one-shot
    # iterator passed as ``tickers`` is no longer consumed by the first test.
    wanted = set(tickers)
    return filter(lambda file: tickername(file) in wanted,
                  listdir('data/csv/'))
def tickername(file):
    """Return the base name of ``file`` with its last extension removed."""
    stem, _extension = splitext(basename(file))
    return stem
def pluck_ticker_dataframe(csv):
    """Load the ``Close`` column of one CSV file, indexed by timestamp.

    Args:
        csv: File name inside ``data/csv/``. The file must have ``Date``,
            ``Time`` and ``Close`` columns; other columns are ignored.

    Returns:
        The ``Close`` column as a Series whose index, named ``Date_Time``,
        is built from ``"<Date> <Time>"`` parsed as datetimes.

    Raises:
        ValueError: If a required column is missing or the combined
            date/time text cannot be parsed.
    """
    # Read the two date parts as plain text so they can be concatenated
    # exactly as written in the file.
    frame = read_csv(
        f"data/csv/{csv}", usecols=['Date', 'Time', 'Close'],
        dtype={'Date': str, 'Time': str})
    # Combine the columns explicitly: passing a nested list to
    # ``parse_dates`` is deprecated since pandas 2.2 and slated for removal.
    timestamps = to_datetime(frame['Date'] + ' ' + frame['Time'])
    # Keep the index name the nested ``parse_dates`` form used to produce.
    frame = frame.set_index(timestamps.rename('Date_Time'))
    return frame['Close']
def to_dataframe(csv):
    """Load the closing prices from ``csv`` and name them after its ticker.

    Despite the function name, the object returned is whatever
    ``pluck_ticker_dataframe`` produces (the ``Close`` column), with its
    ``name`` set to ``tickername(csv)``.
    """
    closes = pluck_ticker_dataframe(csv)
    # save_hdf() uses this name for both the output file and the HDF key.
    closes.name = tickername(csv)
    return closes
def save_hdf(dataframe):
    """Write ``dataframe`` to ``data/hdf/<name>.hdf`` under the key ``<name>``.

    ``<name>`` is ``dataframe.name``. The file is opened with ``mode='w'``
    and zlib is requested as the compression library.
    """
    ticker = dataframe.name
    target = f"data/hdf/{ticker}.hdf"
    dataframe.to_hdf(target, key=ticker, mode='w', complib='zlib')
def convert(csv):
    """Convert one CSV file from ``data/csv/`` into an HDF file in ``data/hdf/``."""
    save_hdf(to_dataframe(csv))
def clean(path):
    """Delete every file directly inside the directory ``path``.

    Args:
        path: Directory to empty, with or without a trailing separator.

    Raises:
        OSError: If ``path`` cannot be listed or an entry cannot be removed
            (``os.remove`` does not delete directories).
    """
    # join() supplies the separator when ``path`` lacks one; plain string
    # concatenation turned 'data/hdf' + 'x.hdf' into 'data/hdfx.hdf'.
    for entry in listdir(path):
        remove(join(path, entry))
def run():
    """Rebuild ``data/hdf/`` from the ticker CSV files in ``data/csv/``.

    Empties ``data/hdf/``, selects the CSV files whose names match a known
    ticker, and converts them in a pool of worker processes.
    """
    clean('data/hdf/')
    ticker_names = get_ticker_names()
    csv_files = get_csv_files(ticker_names)
    # The context manager shuts the pool down once map() has returned; a
    # bare Pool() would leave its worker processes to garbage collection.
    with Pool() as pool:
        pool.map(convert, csv_files)
# Start the conversion only when executed as a script; importing this module
# (as multiprocessing worker processes may do) must not trigger another run.
if __name__ == "__main__":
    run()