2017-11-25 00:04:11 +00:00
|
|
|
# pragma pylint: disable=missing-docstring
|
|
|
|
|
2018-03-17 21:44:47 +00:00
|
|
|
import gzip
|
2017-11-25 00:04:11 +00:00
|
|
|
import json
|
2018-03-25 19:37:14 +00:00
|
|
|
import logging
|
2017-11-25 00:04:11 +00:00
|
|
|
import os
|
2018-04-27 21:16:34 +00:00
|
|
|
import arrow
|
2018-03-17 21:43:36 +00:00
|
|
|
from typing import Optional, List, Dict, Tuple
|
2018-01-18 07:10:48 +00:00
|
|
|
|
2018-05-04 10:38:51 +00:00
|
|
|
from freqtrade import misc, constants
|
2018-03-17 21:44:47 +00:00
|
|
|
from freqtrade.exchange import get_ticker_history
|
2018-04-27 21:16:34 +00:00
|
|
|
|
2018-01-18 07:10:48 +00:00
|
|
|
from user_data.hyperopt_conf import hyperopt_optimize_conf
|
2017-11-25 00:04:11 +00:00
|
|
|
|
2018-03-25 19:37:14 +00:00
|
|
|
logger = logging.getLogger(__name__)
|
2017-12-16 14:42:28 +00:00
|
|
|
|
2017-11-25 00:04:11 +00:00
|
|
|
|
2018-06-01 15:21:45 +00:00
|
|
|
def sanitize_start_stop_date(tickerlist: List[Dict], timerange, pair):
|
|
|
|
"""
|
|
|
|
This function is called when either timerange start or stop are type date
|
|
|
|
-
|
|
|
|
Prevent index out or range error in trim_tickerlist, which occurs when trying
|
|
|
|
to process a stop or start range outside that in the cached data
|
|
|
|
returns (start, stop, nothing_to_trim)
|
|
|
|
nothing_to_trim > 0 is a flag to later not send the pair data to trim_tickerlist
|
|
|
|
-
|
|
|
|
Function Logic:
|
|
|
|
- if cache records begin after timerange start - reset start to first record
|
|
|
|
- if cache records end before timerange stop - reset stop to last record
|
|
|
|
- if start or stop are fully after or before cache records - return, nothing_to_trim.
|
|
|
|
- if only 1 of stop or start are set in timerange use the first or last
|
|
|
|
record appropriately from the cache as the unset value
|
|
|
|
"""
|
|
|
|
|
|
|
|
# Do nothing if timerange does not contain a type date.
|
|
|
|
stype, start, stop = timerange
|
|
|
|
nothing_to_trim = 0
|
|
|
|
if stype[0] != 'date' or stype[1] != 'date':
|
|
|
|
sanitized_dates = [start, stop, nothing_to_trim]
|
|
|
|
return sanitized_dates
|
|
|
|
|
|
|
|
# If no arg for stop or start then set to the first or last record in the cache
|
|
|
|
stop = stop if stype[1] == 'date' else int(((tickerlist[(len(tickerlist) - 1)][0]) / 1000))
|
|
|
|
start = start if stype[0] == 'date' else int(((tickerlist[0][0]) / 1000))
|
|
|
|
|
|
|
|
# If requested range start is after cache records end - no data to be trimmed
|
|
|
|
# If requested start range is before start of cache, move it to first nearest record
|
|
|
|
if stype[0] == 'date':
|
|
|
|
if (tickerlist[0][0]) > (stop * 1000):
|
|
|
|
logger.warn('No data for %s timerange in cache, update cache ', pair)
|
|
|
|
nothing_to_trim = nothing_to_trim + 1
|
|
|
|
elif (tickerlist[0][0]) > (start * 1000):
|
|
|
|
start = (tickerlist[0][0] / 1000)
|
|
|
|
logger.warn('Requested start timerange for %s not in cache, update cache ', pair)
|
|
|
|
|
|
|
|
# If requested range stop is before cache records begin - no data to be trimmed
|
|
|
|
# If requested stop range is after end of cache, move it to last nearest record
|
|
|
|
if stype[1] == 'date':
|
|
|
|
if (tickerlist[(len(tickerlist) - 1)][0]) < (start * 1000):
|
|
|
|
logger.warn('No data for %s timerange in cache, update cache ', pair)
|
|
|
|
nothing_to_trim = nothing_to_trim + 2
|
|
|
|
elif (tickerlist[(len(tickerlist) - 1)][0]) < (stop * 1000):
|
|
|
|
stop = (tickerlist[(len(tickerlist) - 1)][0] / 1000)
|
|
|
|
logger.warn('Requested stop timerange for %s not in cache, update cache ', pair)
|
|
|
|
|
|
|
|
# Impossible range, nothing to trim.
|
|
|
|
if start > stop:
|
|
|
|
nothing_to_trim = nothing_to_trim + 4
|
|
|
|
logger.warn('Check timerange for %s', pair)
|
|
|
|
|
|
|
|
sanitized_dates = [start, stop, nothing_to_trim]
|
|
|
|
return sanitized_dates
|
|
|
|
|
|
|
|
|
2018-03-17 21:43:36 +00:00
|
|
|
def trim_tickerlist(tickerlist: List[Dict], timerange: Tuple[Tuple, int, int]) -> List[Dict]:
|
2018-04-27 22:40:48 +00:00
|
|
|
if not tickerlist:
|
|
|
|
return tickerlist
|
|
|
|
|
2018-03-17 21:43:36 +00:00
|
|
|
stype, start, stop = timerange
|
2018-01-26 16:41:41 +00:00
|
|
|
|
2018-04-27 21:16:34 +00:00
|
|
|
start_index = 0
|
|
|
|
stop_index = len(tickerlist)
|
|
|
|
if stype[0] == 'line':
|
|
|
|
stop_index = start
|
|
|
|
if stype[0] == 'index':
|
|
|
|
start_index = start
|
|
|
|
elif stype[0] == 'date':
|
2018-05-21 19:31:08 +00:00
|
|
|
while start_index < len(tickerlist) and tickerlist[start_index][0] < start * 1000:
|
2018-04-27 21:16:34 +00:00
|
|
|
start_index += 1
|
|
|
|
|
|
|
|
if stype[1] == 'line':
|
|
|
|
start_index = len(tickerlist) + stop
|
|
|
|
if stype[1] == 'index':
|
|
|
|
stop_index = stop
|
|
|
|
elif stype[1] == 'date':
|
2018-05-21 19:31:08 +00:00
|
|
|
while stop_index > 0 and tickerlist[stop_index-1][0] > stop * 1000:
|
2018-04-27 21:16:34 +00:00
|
|
|
stop_index -= 1
|
|
|
|
|
|
|
|
if start_index > stop_index:
|
|
|
|
raise ValueError(f'The timerange [{start},{stop}] is incorrect')
|
|
|
|
|
|
|
|
return tickerlist[start_index:stop_index]
|
2018-01-15 21:25:02 +00:00
|
|
|
|
|
|
|
|
2018-03-17 21:43:36 +00:00
|
|
|
def load_tickerdata_file(
|
|
|
|
datadir: str, pair: str,
|
2018-03-24 09:21:59 +00:00
|
|
|
ticker_interval: str,
|
2018-03-17 21:43:36 +00:00
|
|
|
timerange: Optional[Tuple[Tuple, int, int]] = None) -> Optional[List[Dict]]:
|
2018-01-05 09:20:48 +00:00
|
|
|
"""
|
|
|
|
Load a pair from file,
|
|
|
|
:return dict OR empty if unsuccesful
|
|
|
|
"""
|
2018-01-06 22:24:35 +00:00
|
|
|
path = make_testdata_path(datadir)
|
2018-02-03 16:15:40 +00:00
|
|
|
pair_file_string = pair.replace('/', '_')
|
2018-02-15 06:56:13 +00:00
|
|
|
file = os.path.join(path, '{pair}-{ticker_interval}.json'.format(
|
2018-02-03 16:15:40 +00:00
|
|
|
pair=pair_file_string,
|
2018-01-05 09:20:48 +00:00
|
|
|
ticker_interval=ticker_interval,
|
2018-02-15 06:56:13 +00:00
|
|
|
))
|
2018-01-28 13:52:27 +00:00
|
|
|
gzipfile = file + '.gz'
|
|
|
|
|
2018-01-28 13:57:25 +00:00
|
|
|
# If the file does not exist we download it when None is returned.
|
2018-01-28 13:52:27 +00:00
|
|
|
# If file exists, read the file, load the json
|
|
|
|
if os.path.isfile(gzipfile):
|
2018-02-15 06:56:13 +00:00
|
|
|
logger.debug('Loading ticker data from file %s', gzipfile)
|
2018-01-28 13:52:27 +00:00
|
|
|
with gzip.open(gzipfile) as tickerdata:
|
|
|
|
pairdata = json.load(tickerdata)
|
|
|
|
elif os.path.isfile(file):
|
2018-02-15 06:56:13 +00:00
|
|
|
logger.debug('Loading ticker data from file %s', file)
|
2018-01-28 13:52:27 +00:00
|
|
|
with open(file) as tickerdata:
|
|
|
|
pairdata = json.load(tickerdata)
|
|
|
|
else:
|
2018-01-05 09:20:48 +00:00
|
|
|
return None
|
2018-06-01 15:21:45 +00:00
|
|
|
|
Test if timerange in json file before trimming.
trim_tickerlist throws an index out of range error when parsing a json file for a timerange outside its current contents.
This patch test for that condition and returns the the file as-is with a log warning to refresh-cache on fail
Here is an example of the error prior to path and after patching.
This is from binannce using the pair "ZEN/BTC" and timerange "20180522-20180523"
"""
File "/Users/creslin/PycharmProjects/freqtrade/freqtrade/optimize/__init__.py", line 107, in load_data
pairdata = load_tickerdata_file(datadir, pair, ticker_interval, timerange=timerange)
File "/Users/creslin/PycharmProjects/freqtrade/freqtrade/optimize/__init__.py", line 84, in load_tickerdata_file
pairdata = trim_tickerlist(pairdata, timerange)
File "/Users/creslin/PycharmProjects/freqtrade/freqtrade/optimize/__init__.py", line 36, in trim_tickerlist
while tickerlist[start_index][0] < start * 1000:
IndexError: list index out of range
""""
"""
2018-05-31 22:01:07,060 - freqtrade.configuration - INFO - Parameter --timerange detected: 20180522-20180523 ...
2018-05-31 22:01:07,060 - freqtrade.configuration - INFO - Parameter --datadir detected: freqtrade/tests/testdata ...
2018-05-31 22:01:13,168 - freqtrade.optimize - WARNING - start timerange for ZEN/BTC not in cache, to update cache use
2018-05-31 22:01:13,168 - freqtrade.optimize - INFO - --refresh-pairs-cached. *Nb The coin may be newer to the exchange
"""
2018-05-31 19:22:51 +00:00
|
|
|
"""
|
2018-06-01 15:21:45 +00:00
|
|
|
Call to function to catch if a start or stop date from timerange is outside
|
|
|
|
range of records in the cached ticker list.
|
|
|
|
This prevents "index out of range" error.
|
Test if timerange in json file before trimming.
trim_tickerlist throws an index out of range error when parsing a json file for a timerange outside its current contents.
This patch test for that condition and returns the the file as-is with a log warning to refresh-cache on fail
Here is an example of the error prior to path and after patching.
This is from binannce using the pair "ZEN/BTC" and timerange "20180522-20180523"
"""
File "/Users/creslin/PycharmProjects/freqtrade/freqtrade/optimize/__init__.py", line 107, in load_data
pairdata = load_tickerdata_file(datadir, pair, ticker_interval, timerange=timerange)
File "/Users/creslin/PycharmProjects/freqtrade/freqtrade/optimize/__init__.py", line 84, in load_tickerdata_file
pairdata = trim_tickerlist(pairdata, timerange)
File "/Users/creslin/PycharmProjects/freqtrade/freqtrade/optimize/__init__.py", line 36, in trim_tickerlist
while tickerlist[start_index][0] < start * 1000:
IndexError: list index out of range
""""
"""
2018-05-31 22:01:07,060 - freqtrade.configuration - INFO - Parameter --timerange detected: 20180522-20180523 ...
2018-05-31 22:01:07,060 - freqtrade.configuration - INFO - Parameter --datadir detected: freqtrade/tests/testdata ...
2018-05-31 22:01:13,168 - freqtrade.optimize - WARNING - start timerange for ZEN/BTC not in cache, to update cache use
2018-05-31 22:01:13,168 - freqtrade.optimize - INFO - --refresh-pairs-cached. *Nb The coin may be newer to the exchange
"""
2018-05-31 19:22:51 +00:00
|
|
|
"""
|
|
|
|
if timerange:
|
|
|
|
stype, start, stop = timerange
|
2018-06-01 15:21:45 +00:00
|
|
|
if stype[0] == 'date' or stype[1] == 'date':
|
|
|
|
sanitized_dates = sanitize_start_stop_date(pairdata, timerange, pair)
|
|
|
|
timerange = (('date', 'date'), int(sanitized_dates[0]), int(sanitized_dates[1]))
|
|
|
|
# If no overlap of timerange to cache data return pairdata, do not call trim_tickerlist
|
|
|
|
if sanitized_dates[2] > 0:
|
Test if timerange in json file before trimming.
trim_tickerlist throws an index out of range error when parsing a json file for a timerange outside its current contents.
This patch test for that condition and returns the the file as-is with a log warning to refresh-cache on fail
Here is an example of the error prior to path and after patching.
This is from binannce using the pair "ZEN/BTC" and timerange "20180522-20180523"
"""
File "/Users/creslin/PycharmProjects/freqtrade/freqtrade/optimize/__init__.py", line 107, in load_data
pairdata = load_tickerdata_file(datadir, pair, ticker_interval, timerange=timerange)
File "/Users/creslin/PycharmProjects/freqtrade/freqtrade/optimize/__init__.py", line 84, in load_tickerdata_file
pairdata = trim_tickerlist(pairdata, timerange)
File "/Users/creslin/PycharmProjects/freqtrade/freqtrade/optimize/__init__.py", line 36, in trim_tickerlist
while tickerlist[start_index][0] < start * 1000:
IndexError: list index out of range
""""
"""
2018-05-31 22:01:07,060 - freqtrade.configuration - INFO - Parameter --timerange detected: 20180522-20180523 ...
2018-05-31 22:01:07,060 - freqtrade.configuration - INFO - Parameter --datadir detected: freqtrade/tests/testdata ...
2018-05-31 22:01:13,168 - freqtrade.optimize - WARNING - start timerange for ZEN/BTC not in cache, to update cache use
2018-05-31 22:01:13,168 - freqtrade.optimize - INFO - --refresh-pairs-cached. *Nb The coin may be newer to the exchange
"""
2018-05-31 19:22:51 +00:00
|
|
|
return pairdata
|
2018-01-05 09:20:48 +00:00
|
|
|
|
2018-01-15 21:25:02 +00:00
|
|
|
if timerange:
|
|
|
|
pairdata = trim_tickerlist(pairdata, timerange)
|
2018-01-05 09:20:48 +00:00
|
|
|
return pairdata
|
|
|
|
|
|
|
|
|
2018-03-24 09:21:59 +00:00
|
|
|
def load_data(datadir: str,
|
|
|
|
ticker_interval: str,
|
2018-03-17 21:43:36 +00:00
|
|
|
pairs: Optional[List[str]] = None,
|
|
|
|
refresh_pairs: Optional[bool] = False,
|
|
|
|
timerange: Optional[Tuple[Tuple, int, int]] = None) -> Dict[str, List]:
|
2017-11-25 00:04:11 +00:00
|
|
|
"""
|
|
|
|
Loads ticker history data for the given parameters
|
|
|
|
:return: dict
|
|
|
|
"""
|
|
|
|
result = {}
|
2017-12-16 14:42:28 +00:00
|
|
|
|
2017-12-21 07:31:26 +00:00
|
|
|
_pairs = pairs or hyperopt_optimize_conf()['exchange']['pair_whitelist']
|
|
|
|
|
2017-12-16 14:42:28 +00:00
|
|
|
# If the user force the refresh of pairs
|
|
|
|
if refresh_pairs:
|
2018-01-06 22:24:35 +00:00
|
|
|
logger.info('Download data for all pairs and store them in %s', datadir)
|
2018-04-27 21:16:34 +00:00
|
|
|
download_pairs(datadir, _pairs, ticker_interval, timerange=timerange)
|
2017-12-16 14:42:28 +00:00
|
|
|
|
2017-12-21 07:31:26 +00:00
|
|
|
for pair in _pairs:
|
2018-01-15 21:25:02 +00:00
|
|
|
pairdata = load_tickerdata_file(datadir, pair, ticker_interval, timerange=timerange)
|
2018-05-21 19:31:08 +00:00
|
|
|
if pairdata:
|
|
|
|
result[pair] = pairdata
|
|
|
|
else:
|
|
|
|
logger.warn('No data for pair %s, use --update-pairs-cached to download the data', pair)
|
2018-05-21 20:15:01 +00:00
|
|
|
|
2017-11-25 00:04:11 +00:00
|
|
|
return result
|
|
|
|
|
|
|
|
|
2018-01-06 22:24:35 +00:00
|
|
|
def make_testdata_path(datadir: str) -> str:
|
2017-12-16 14:42:28 +00:00
|
|
|
"""Return the path where testdata files are stored"""
|
2018-02-09 07:35:38 +00:00
|
|
|
return datadir or os.path.abspath(
|
|
|
|
os.path.join(
|
|
|
|
os.path.dirname(__file__), '..', 'tests', 'testdata'
|
|
|
|
)
|
|
|
|
)
|
2017-12-16 14:42:28 +00:00
|
|
|
|
|
|
|
|
2018-04-27 21:16:34 +00:00
|
|
|
def download_pairs(datadir, pairs: List[str],
|
|
|
|
ticker_interval: str,
|
|
|
|
timerange: Optional[Tuple[Tuple, int, int]] = None) -> bool:
|
2018-01-13 07:32:44 +00:00
|
|
|
"""For each pairs passed in parameters, download the ticker intervals"""
|
2017-12-16 14:42:28 +00:00
|
|
|
for pair in pairs:
|
|
|
|
try:
|
2018-04-27 21:30:42 +00:00
|
|
|
download_backtesting_testdata(datadir,
|
|
|
|
pair=pair,
|
2018-04-30 21:27:05 +00:00
|
|
|
tick_interval=ticker_interval,
|
2018-04-27 21:30:42 +00:00
|
|
|
timerange=timerange)
|
2017-12-16 14:42:28 +00:00
|
|
|
except BaseException:
|
2018-03-02 15:22:00 +00:00
|
|
|
logger.info(
|
2018-03-24 09:21:59 +00:00
|
|
|
'Failed to download the pair: "%s", Interval: %s',
|
2018-03-02 15:22:00 +00:00
|
|
|
pair,
|
|
|
|
ticker_interval
|
|
|
|
)
|
2017-12-16 14:42:28 +00:00
|
|
|
return False
|
|
|
|
return True
|
|
|
|
|
|
|
|
|
2018-04-30 21:27:05 +00:00
|
|
|
def load_cached_data_for_updating(filename: str,
|
|
|
|
tick_interval: str,
|
|
|
|
timerange: Optional[Tuple[Tuple, int, int]]) -> Tuple[list, int]:
|
|
|
|
"""
|
|
|
|
Load cached data and choose what part of the data should be updated
|
|
|
|
"""
|
|
|
|
|
|
|
|
since_ms = None
|
|
|
|
|
|
|
|
# user sets timerange, so find the start time
|
|
|
|
if timerange:
|
|
|
|
if timerange[0][0] == 'date':
|
|
|
|
since_ms = timerange[1] * 1000
|
|
|
|
elif timerange[0][1] == 'line':
|
2018-05-04 10:38:51 +00:00
|
|
|
num_minutes = timerange[2] * constants.TICKER_INTERVAL_MINUTES[tick_interval]
|
2018-04-30 21:27:05 +00:00
|
|
|
since_ms = arrow.utcnow().shift(minutes=num_minutes).timestamp * 1000
|
2018-04-27 21:16:34 +00:00
|
|
|
|
2018-04-30 21:27:05 +00:00
|
|
|
# read the cached file
|
|
|
|
if os.path.isfile(filename):
|
|
|
|
with open(filename, "rt") as file:
|
|
|
|
data = json.load(file)
|
|
|
|
# remove the last item, because we are not sure if it is correct
|
|
|
|
# it could be fetched when the candle was incompleted
|
|
|
|
if data:
|
|
|
|
data.pop()
|
|
|
|
else:
|
|
|
|
data = []
|
2018-04-27 21:30:42 +00:00
|
|
|
|
2018-04-30 21:27:05 +00:00
|
|
|
if data:
|
|
|
|
if since_ms and since_ms < data[0][0]:
|
|
|
|
# the data is requested for earlier period than the cache has
|
|
|
|
# so fully redownload all the data
|
|
|
|
data = []
|
|
|
|
else:
|
|
|
|
# a part of the data was already downloaded, so
|
|
|
|
# download unexist data only
|
|
|
|
since_ms = data[-1][0] + 1
|
2018-04-27 21:16:34 +00:00
|
|
|
|
2018-04-30 21:27:05 +00:00
|
|
|
return (data, since_ms)
|
2018-04-27 21:16:34 +00:00
|
|
|
|
|
|
|
|
|
|
|
def download_backtesting_testdata(datadir: str,
|
|
|
|
pair: str,
|
2018-04-30 21:27:05 +00:00
|
|
|
tick_interval: str = '5m',
|
2018-05-03 08:16:29 +00:00
|
|
|
timerange: Optional[Tuple[Tuple, int, int]] = None) -> None:
|
|
|
|
|
2017-12-16 14:42:28 +00:00
|
|
|
"""
|
2018-04-27 21:16:34 +00:00
|
|
|
Download the latest ticker intervals from the exchange for the pairs passed in parameters
|
2018-04-30 21:27:05 +00:00
|
|
|
The data is downloaded starting from the last correct ticker interval data that
|
|
|
|
esists in a cache. If timerange starts earlier than the data in the cache,
|
|
|
|
the full data will be redownloaded
|
|
|
|
|
2017-12-16 14:42:28 +00:00
|
|
|
Based on @Rybolov work: https://github.com/rybolov/freqtrade-data
|
|
|
|
:param pairs: list of pairs to download
|
2018-04-30 21:27:05 +00:00
|
|
|
:param tick_interval: ticker interval
|
2018-04-27 21:16:34 +00:00
|
|
|
:param timerange: range of time to download
|
2018-05-03 08:16:29 +00:00
|
|
|
:return: None
|
|
|
|
|
2017-12-16 14:42:28 +00:00
|
|
|
"""
|
|
|
|
|
2018-01-06 22:24:35 +00:00
|
|
|
path = make_testdata_path(datadir)
|
2018-04-30 21:27:05 +00:00
|
|
|
filepair = pair.replace("/", "_")
|
|
|
|
filename = os.path.join(path, f'{filepair}-{tick_interval}.json')
|
|
|
|
|
2018-03-02 15:22:00 +00:00
|
|
|
logger.info(
|
2018-03-24 09:21:59 +00:00
|
|
|
'Download the pair: "%s", Interval: %s',
|
2018-03-02 15:22:00 +00:00
|
|
|
pair,
|
2018-04-30 21:27:05 +00:00
|
|
|
tick_interval
|
2018-03-02 15:22:00 +00:00
|
|
|
)
|
2017-12-16 14:42:28 +00:00
|
|
|
|
2018-04-30 21:27:05 +00:00
|
|
|
data, since_ms = load_cached_data_for_updating(filename, tick_interval, timerange)
|
2017-12-16 14:42:28 +00:00
|
|
|
|
2018-04-27 21:16:34 +00:00
|
|
|
logger.debug("Current Start: %s", misc.format_ms_time(data[1][0]) if data else 'None')
|
|
|
|
logger.debug("Current End: %s", misc.format_ms_time(data[-1][0]) if data else 'None')
|
|
|
|
|
2018-04-30 21:27:05 +00:00
|
|
|
new_data = get_ticker_history(pair=pair, tick_interval=tick_interval, since_ms=since_ms)
|
2018-04-27 21:16:34 +00:00
|
|
|
data.extend(new_data)
|
|
|
|
|
2018-03-25 11:38:17 +00:00
|
|
|
logger.debug("New Start: %s", misc.format_ms_time(data[0][0]))
|
2018-04-27 21:16:34 +00:00
|
|
|
logger.debug("New End: %s", misc.format_ms_time(data[-1][0]))
|
2017-12-16 14:42:28 +00:00
|
|
|
|
2018-01-11 14:49:04 +00:00
|
|
|
misc.file_dump_json(filename, data)
|