stable/freqtrade/optimize/backtesting.py

522 lines
22 KiB
Python
Raw Normal View History

# pragma pylint: disable=missing-docstring, W0212, too-many-arguments
2017-11-14 21:15:24 +00:00
"""
This module contains the backtesting logic
"""
2018-03-25 19:37:14 +00:00
import logging
2018-03-17 21:43:36 +00:00
from argparse import Namespace
2018-07-27 21:01:52 +00:00
from copy import deepcopy
2018-07-18 18:08:55 +00:00
from datetime import datetime, timedelta
from pathlib import Path
from typing import Any, Dict, List, NamedTuple, Optional
2018-03-17 21:44:47 +00:00
2018-03-29 18:16:25 +00:00
from pandas import DataFrame
from tabulate import tabulate
2017-09-28 21:26:28 +00:00
from freqtrade import optimize
2018-07-04 07:31:35 +00:00
from freqtrade import DependencyException, constants
2018-03-17 21:44:47 +00:00
from freqtrade.arguments import Arguments
from freqtrade.configuration import Configuration
2018-12-13 05:34:10 +00:00
from freqtrade.data import history
from freqtrade.data.dataprovider import DataProvider
from freqtrade.misc import file_dump_json, timeframe_to_minutes
2017-09-28 21:26:28 +00:00
from freqtrade.persistence import Trade
from freqtrade.resolvers import ExchangeResolver, StrategyResolver
from freqtrade.state import RunMode
from freqtrade.strategy.interface import SellType, IStrategy
2018-03-25 19:37:14 +00:00
logger = logging.getLogger(__name__)
2018-06-10 11:15:25 +00:00
class BacktestResult(NamedTuple):
"""
NamedTuple Defining BacktestResults inputs.
"""
pair: str
profit_percent: float
profit_abs: float
2018-06-10 11:32:07 +00:00
open_time: datetime
close_time: datetime
2018-06-10 18:52:42 +00:00
open_index: int
close_index: int
2018-06-10 11:15:25 +00:00
trade_duration: float
2018-06-10 11:37:53 +00:00
open_at_end: bool
open_rate: float
close_rate: float
2018-07-11 18:03:40 +00:00
sell_reason: SellType
2018-06-10 11:15:25 +00:00
class Backtesting(object):
"""
Backtesting class, this class contains all the logic to run a backtest
To run a backtest:
backtesting = Backtesting(config)
backtesting.start()
"""
2018-07-28 05:00:58 +00:00
def __init__(self, config: Dict[str, Any]) -> None:
self.config = config
# Reset keys for backtesting
2018-03-24 18:45:23 +00:00
self.config['exchange']['key'] = ''
self.config['exchange']['secret'] = ''
self.config['exchange']['password'] = ''
self.config['exchange']['uid'] = ''
self.config['dry_run'] = True
2018-07-28 05:41:38 +00:00
self.strategylist: List[IStrategy] = []
exchange_name = self.config.get('exchange', {}).get('name').title()
self.exchange = ExchangeResolver(exchange_name, self.config).exchange
self.fee = self.exchange.get_fee()
if self.config.get('runmode') != RunMode.HYPEROPT:
self.dataprovider = DataProvider(self.config, self.exchange)
IStrategy.dp = self.dataprovider
2018-07-28 05:41:38 +00:00
if self.config.get('strategy_list', None):
# Force one interval
2018-07-28 05:55:59 +00:00
self.ticker_interval = str(self.config.get('ticker_interval'))
self.ticker_interval_mins = timeframe_to_minutes(self.ticker_interval)
2018-07-28 05:55:59 +00:00
for strat in list(self.config['strategy_list']):
2018-07-28 05:41:38 +00:00
stratconf = deepcopy(self.config)
stratconf['strategy'] = strat
self.strategylist.append(StrategyResolver(stratconf).strategy)
else:
# only one strategy
self.strategylist.append(StrategyResolver(self.config).strategy)
# Load one strategy
self._set_strategy(self.strategylist[0])
2018-07-28 05:00:58 +00:00
def _set_strategy(self, strategy):
2018-07-28 04:54:33 +00:00
"""
Load strategy into backtesting
"""
self.strategy = strategy
2018-07-28 04:54:33 +00:00
self.ticker_interval = self.config.get('ticker_interval')
self.ticker_interval_mins = timeframe_to_minutes(self.ticker_interval)
self.tickerdata_to_dataframe = strategy.tickerdata_to_dataframe
2018-07-31 19:08:03 +00:00
self.advise_buy = strategy.advise_buy
self.advise_sell = strategy.advise_sell
# Set stoploss_on_exchange to false for backtesting,
# since a "perfect" stoploss-sell is assumed anyway
# And the regular "stoploss" function would not apply to that case
self.strategy.order_types['stoploss_on_exchange'] = False
2018-07-28 04:54:33 +00:00
def _generate_text_table(self, data: Dict[str, Dict], results: DataFrame,
skip_nan: bool = False) -> str:
"""
Generates and returns a text table for the given backtest data and the results dataframe
:return: pretty printed table with tabulate as str
"""
2018-06-02 11:43:51 +00:00
stake_currency = str(self.config.get('stake_currency'))
max_open_trades = self.config.get('max_open_trades')
floatfmt = ('s', 'd', '.2f', '.2f', '.8f', '.2f', 'd', '.1f', '.1f')
tabular_data = []
2018-07-08 17:55:04 +00:00
headers = ['pair', 'buy count', 'avg profit %', 'cum profit %',
'tot profit ' + stake_currency, 'tot profit %', 'avg duration',
'profit', 'loss']
for pair in data:
2018-06-10 11:15:25 +00:00
result = results[results.pair == pair]
if skip_nan and result.profit_abs.isnull().all():
continue
tabular_data.append([
pair,
len(result.index),
result.profit_percent.mean() * 100.0,
2018-07-08 17:55:04 +00:00
result.profit_percent.sum() * 100.0,
2018-06-10 11:15:25 +00:00
result.profit_abs.sum(),
result.profit_percent.sum() * 100.0 / max_open_trades,
2018-07-18 18:08:55 +00:00
str(timedelta(
minutes=round(result.trade_duration.mean()))) if not result.empty else '0:00',
2018-06-10 11:15:25 +00:00
len(result[result.profit_abs > 0]),
len(result[result.profit_abs < 0])
])
# Append Total
tabular_data.append([
'TOTAL',
len(results.index),
results.profit_percent.mean() * 100.0,
2018-07-11 12:50:04 +00:00
results.profit_percent.sum() * 100.0,
2018-06-10 11:15:25 +00:00
results.profit_abs.sum(),
results.profit_percent.sum() * 100.0 / max_open_trades,
2018-07-18 18:08:55 +00:00
str(timedelta(
minutes=round(results.trade_duration.mean()))) if not results.empty else '0:00',
2018-06-10 11:15:25 +00:00
len(results[results.profit_abs > 0]),
len(results[results.profit_abs < 0])
])
# Ignore type as floatfmt does allow tuples but mypy does not know that
return tabulate(tabular_data, headers=headers, # type: ignore
floatfmt=floatfmt, tablefmt="pipe")
2018-07-12 19:19:43 +00:00
def _generate_text_table_sell_reason(self, data: Dict[str, Dict], results: DataFrame) -> str:
"""
Generate small table outlining Backtest results
"""
tabular_data = []
headers = ['Sell Reason', 'Count']
for reason, count in results['sell_reason'].value_counts().iteritems():
tabular_data.append([reason.value, count])
return tabulate(tabular_data, headers=headers, tablefmt="pipe")
2018-07-29 11:07:11 +00:00
def _generate_text_table_strategy(self, all_results: dict) -> str:
"""
Generate summary table per strategy
"""
stake_currency = str(self.config.get('stake_currency'))
max_open_trades = self.config.get('max_open_trades')
2018-07-29 11:07:11 +00:00
floatfmt = ('s', 'd', '.2f', '.2f', '.8f', '.2f', 'd', '.1f', '.1f')
2018-07-29 11:07:11 +00:00
tabular_data = []
headers = ['Strategy', 'buy count', 'avg profit %', 'cum profit %',
'tot profit ' + stake_currency, 'tot profit %', 'avg duration',
'profit', 'loss']
2018-07-29 11:07:11 +00:00
for strategy, results in all_results.items():
tabular_data.append([
strategy,
len(results.index),
results.profit_percent.mean() * 100.0,
results.profit_percent.sum() * 100.0,
results.profit_abs.sum(),
results.profit_percent.sum() * 100.0 / max_open_trades,
2018-07-29 11:07:11 +00:00
str(timedelta(
minutes=round(results.trade_duration.mean()))) if not results.empty else '0:00',
len(results[results.profit_abs > 0]),
len(results[results.profit_abs < 0])
])
# Ignore type as floatfmt does allow tuples but mypy does not know that
return tabulate(tabular_data, headers=headers, # type: ignore
floatfmt=floatfmt, tablefmt="pipe")
2018-07-29 11:07:11 +00:00
def _store_backtest_result(self, recordfilename: str, results: DataFrame,
strategyname: Optional[str] = None) -> None:
2018-06-12 20:29:30 +00:00
records = [(t.pair, t.profit_percent, t.open_time.timestamp(),
t.close_time.timestamp(), t.open_index - 1, t.trade_duration,
2018-07-11 18:32:56 +00:00
t.open_rate, t.close_rate, t.open_at_end, t.sell_reason.value)
for index, t in results.iterrows()]
2018-06-12 20:29:30 +00:00
if records:
if strategyname:
# Inject strategyname to filename
recname = Path(recordfilename)
recordfilename = str(Path.joinpath(
recname.parent, f'{recname.stem}-{strategyname}').with_suffix(recname.suffix))
2018-06-12 20:29:30 +00:00
logger.info('Dumping backtest results to %s', recordfilename)
file_dump_json(recordfilename, records)
def _get_ticker_list(self, processed) -> Dict[str, DataFrame]:
"""
Helper function to convert a processed tickerlist into a list for performance reasons.
Used by backtest() - so keep this optimized for performance.
"""
headers = ['date', 'buy', 'open', 'close', 'sell', 'low', 'high']
ticker: Dict = {}
# Create ticker dict
for pair, pair_data in processed.items():
pair_data['buy'], pair_data['sell'] = 0, 0 # cleanup from previous run
ticker_data = self.advise_sell(
self.advise_buy(pair_data, {'pair': pair}), {'pair': pair})[headers].copy()
# to avoid using data from future, we buy/sell with signal from previous candle
ticker_data.loc[:, 'buy'] = ticker_data['buy'].shift(1)
ticker_data.loc[:, 'sell'] = ticker_data['sell'].shift(1)
ticker_data.drop(ticker_data.head(1).index, inplace=True)
# Convert from Pandas to list for performance reasons
# (Looping Pandas is slow.)
ticker[pair] = [x for x in ticker_data.itertuples()]
return ticker
2018-03-17 21:43:36 +00:00
def _get_sell_trade_entry(
self, pair: str, buy_row: DataFrame,
2018-06-10 11:15:25 +00:00
partial_ticker: List, trade_count_lock: Dict, args: Dict) -> Optional[BacktestResult]:
2018-03-17 21:43:36 +00:00
stake_amount = args['stake_amount']
max_open_trades = args.get('max_open_trades', 0)
trade = Trade(
2018-07-05 18:20:52 +00:00
open_rate=buy_row.open,
open_date=buy_row.date,
stake_amount=stake_amount,
amount=stake_amount / buy_row.open,
fee_open=self.fee,
fee_close=self.fee
)
# calculate win/lose forwards from buy point
for sell_row in partial_ticker:
if max_open_trades > 0:
# Increase trade_count_lock for every iteration
trade_count_lock[sell_row.date] = trade_count_lock.get(sell_row.date, 0) + 1
buy_signal = sell_row.buy
2018-07-11 18:03:40 +00:00
sell = self.strategy.should_sell(trade, sell_row.open, sell_row.date, buy_signal,
sell_row.sell, low=sell_row.low, high=sell_row.high)
2018-07-12 20:21:52 +00:00
if sell.sell_flag:
2018-10-30 19:02:31 +00:00
2018-08-17 05:07:50 +00:00
trade_dur = int((sell_row.date - buy_row.date).total_seconds() // 60)
2018-10-30 19:02:31 +00:00
# Special handling if high or low hit STOP_LOSS or ROI
if sell.sell_type in (SellType.STOP_LOSS, SellType.TRAILING_STOP_LOSS):
# Set close_rate to stoploss
closerate = trade.stop_loss
elif sell.sell_type == (SellType.ROI):
# get next entry in min_roi > to trade duration
# Interface.py skips on trade_duration <= duration
roi_entry = max(list(filter(lambda x: trade_dur >= x,
2018-10-30 19:23:31 +00:00
self.strategy.minimal_roi.keys())))
roi = self.strategy.minimal_roi[roi_entry]
# - (Expected abs profit + open_rate + open_fee) / (fee_close -1)
closerate = - (trade.open_rate * roi + trade.open_rate *
(1 + trade.fee_open)) / (trade.fee_close - 1)
else:
closerate = sell_row.open
2018-06-10 11:15:25 +00:00
return BacktestResult(pair=pair,
profit_percent=trade.calc_profit_percent(rate=closerate),
profit_abs=trade.calc_profit(rate=closerate),
2018-06-10 11:15:25 +00:00
open_time=buy_row.date,
close_time=sell_row.date,
2018-08-17 05:07:50 +00:00
trade_duration=trade_dur,
2018-06-12 20:29:30 +00:00
open_index=buy_row.Index,
close_index=sell_row.Index,
open_at_end=False,
2018-07-05 18:20:52 +00:00
open_rate=buy_row.open,
close_rate=closerate,
2018-07-12 20:21:52 +00:00
sell_reason=sell.sell_type
2018-06-10 11:15:25 +00:00
)
if partial_ticker:
# no sell condition found - trade stil open at end of backtest period
sell_row = partial_ticker[-1]
2018-06-10 11:15:25 +00:00
btr = BacktestResult(pair=pair,
2018-07-05 18:20:52 +00:00
profit_percent=trade.calc_profit_percent(rate=sell_row.open),
profit_abs=trade.calc_profit(rate=sell_row.open),
2018-06-10 11:15:25 +00:00
open_time=buy_row.date,
close_time=sell_row.date,
2018-07-18 07:29:51 +00:00
trade_duration=int((
sell_row.date - buy_row.date).total_seconds() // 60),
2018-06-12 20:29:30 +00:00
open_index=buy_row.Index,
close_index=sell_row.Index,
open_at_end=True,
2018-07-05 18:20:52 +00:00
open_rate=buy_row.open,
2018-07-11 18:03:40 +00:00
close_rate=sell_row.open,
sell_reason=SellType.FORCE_SELL
2018-06-10 11:15:25 +00:00
)
2018-06-13 17:43:33 +00:00
logger.debug('Force_selling still open trade %s with %s perc - %s', btr.pair,
btr.profit_percent, btr.profit_abs)
2018-06-10 11:15:25 +00:00
return btr
return None
2018-03-17 21:43:36 +00:00
def backtest(self, args: Dict) -> DataFrame:
"""
Implements backtesting functionality
NOTE: This method is used by Hyperopt at each iteration. Please keep it optimized.
Of course try to not have ugly code. By some accessor are sometime slower than functions.
Avoid, logging on this method
:param args: a dict containing:
stake_amount: btc amount to use for each trade
processed: a processed dictionary with format {pair, data}
max_open_trades: maximum number of concurrent trades (default: 0, disabled)
position_stacking: do we allow position stacking? (default: False)
:return: DataFrame
"""
processed = args['processed']
max_open_trades = args.get('max_open_trades', 0)
position_stacking = args.get('position_stacking', False)
start_date = args['start_date']
end_date = args['end_date']
trades = []
2018-06-02 11:43:51 +00:00
trade_count_lock: Dict = {}
# Dict of ticker-lists for performance (looping lists is a lot faster than dataframes)
ticker: Dict = self._get_ticker_list(processed)
lock_pair_until: Dict = {}
2019-04-04 18:23:10 +00:00
# Indexes per pair, so some pairs are allowed to have a missing start.
2019-03-20 17:38:10 +00:00
indexes: Dict = {}
tmp = start_date + timedelta(minutes=self.ticker_interval_mins)
2019-03-20 17:38:10 +00:00
2019-04-04 18:23:10 +00:00
# Loop timerange and get candle for each pair at that point in time
while tmp < end_date:
2019-03-20 17:38:10 +00:00
for i, pair in enumerate(ticker):
2019-03-20 17:38:10 +00:00
if pair not in indexes:
indexes[pair] = 0
try:
2019-03-20 17:38:10 +00:00
row = ticker[pair][indexes[pair]]
except IndexError:
# missing Data for one pair at the end.
2018-11-04 12:45:22 +00:00
# Warnings for this are shown by `validate_backtest_data`
continue
# Waits until the time-counter reaches the start of the data for this pair.
2019-03-20 18:44:59 +00:00
if row.date > tmp.datetime:
2019-03-20 17:38:10 +00:00
continue
indexes[pair] += 1
if row.buy == 0 or row.sell == 1:
continue # skip rows where no buy signal or that would immediately sell off
if (not position_stacking and pair in lock_pair_until
and row.date <= lock_pair_until[pair]):
# without positionstacking, we can only have one open trade per pair.
continue
if max_open_trades > 0:
# Check if max_open_trades has already been reached for the given date
if not trade_count_lock.get(row.date, 0) < max_open_trades:
continue
trade_count_lock[row.date] = trade_count_lock.get(row.date, 0) + 1
2019-03-20 17:38:10 +00:00
trade_entry = self._get_sell_trade_entry(pair, row, ticker[pair][indexes[pair]:],
2018-06-10 11:15:25 +00:00
trade_count_lock, args)
2018-06-10 11:15:25 +00:00
if trade_entry:
lock_pair_until[pair] = trade_entry.close_time
trades.append(trade_entry)
else:
# Set lock_pair_until to end of testing period if trade could not be closed
2019-03-20 18:44:59 +00:00
lock_pair_until[pair] = end_date.datetime
# Move time one configured time_interval ahead.
tmp += timedelta(minutes=self.ticker_interval_mins)
2018-06-10 11:15:25 +00:00
return DataFrame.from_records(trades, columns=BacktestResult._fields)
def start(self) -> None:
"""
Run a backtesting end-to-end
:return: None
"""
data: Dict[str, Any] = {}
pairs = self.config['exchange']['pair_whitelist']
2018-03-25 19:37:14 +00:00
logger.info('Using stake_currency: %s ...', self.config['stake_currency'])
logger.info('Using stake_amount: %s ...', self.config['stake_amount'])
if self.config.get('live'):
2018-03-25 19:37:14 +00:00
logger.info('Downloading data for all pairs in whitelist ...')
self.exchange.refresh_latest_ohlcv([(pair, self.ticker_interval) for pair in pairs])
data = {key[0]: value for key, value in self.exchange._klines.items()}
else:
2018-03-25 19:37:14 +00:00
logger.info('Using local backtesting data (using whitelist in given config) ...')
2018-06-02 12:07:54 +00:00
timerange = Arguments.parse_timerange(None if self.config.get(
'timerange') is None else str(self.config.get('timerange')))
2018-12-13 05:34:10 +00:00
data = history.load_data(
2018-12-15 19:14:13 +00:00
datadir=Path(self.config['datadir']) if self.config.get('datadir') else None,
pairs=pairs,
ticker_interval=self.ticker_interval,
refresh_pairs=self.config.get('refresh_pairs', False),
exchange=self.exchange,
timerange=timerange
)
if not data:
logger.critical("No data found. Terminating.")
return
2018-07-17 19:05:03 +00:00
# Use max_open_trades in backtesting, except --disable-max-market-positions is set
if self.config.get('use_max_market_positions', True):
max_open_trades = self.config['max_open_trades']
else:
2018-07-17 19:05:03 +00:00
logger.info('Ignoring max_open_trades (--disable-max-market-positions was used) ...')
max_open_trades = 0
2018-07-28 04:54:33 +00:00
all_results = {}
2018-07-28 05:41:38 +00:00
for strat in self.strategylist:
2018-07-28 04:54:33 +00:00
logger.info("Running backtesting for Strategy %s", strat.get_strategy_name())
2018-07-28 05:00:58 +00:00
self._set_strategy(strat)
2018-07-27 21:01:52 +00:00
min_date, max_date = optimize.get_timeframe(data)
# Validate dataframe for missing values (mainly at start and end, as fillup is called)
optimize.validate_backtest_data(data, min_date, max_date,
timeframe_to_minutes(self.ticker_interval))
2018-07-27 21:01:52 +00:00
logger.info(
'Measuring data from %s up to %s (%s days)..',
min_date.isoformat(),
max_date.isoformat(),
(max_date - min_date).days
)
# need to reprocess data every time to populate signals
preprocessed = self.strategy.tickerdata_to_dataframe(data)
2018-07-27 21:01:52 +00:00
# Execute backtest and print results
2018-07-28 04:54:33 +00:00
all_results[self.strategy.get_strategy_name()] = self.backtest(
2018-07-27 21:01:52 +00:00
{
'stake_amount': self.config.get('stake_amount'),
'processed': preprocessed,
'max_open_trades': max_open_trades,
'position_stacking': self.config.get('position_stacking', False),
'start_date': min_date,
'end_date': max_date,
2018-07-27 21:01:52 +00:00
}
)
2018-07-28 04:54:33 +00:00
for strategy, results in all_results.items():
2018-06-12 20:29:30 +00:00
2018-07-27 21:01:52 +00:00
if self.config.get('export', False):
self._store_backtest_result(self.config['exportfilename'], results,
strategy if len(self.strategylist) > 1 else None)
print(f"Result for strategy {strategy}")
print(' BACKTESTING REPORT '.center(133, '='))
print(self._generate_text_table(data, results))
2018-07-12 19:19:43 +00:00
print(' SELL REASON STATS '.center(133, '='))
print(self._generate_text_table_sell_reason(data, results))
print(' LEFT OPEN TRADES REPORT '.center(133, '='))
print(self._generate_text_table(data, results.loc[results.open_at_end], True))
print()
2018-07-29 11:07:11 +00:00
if len(all_results) > 1:
# Print Strategy summary table
print(' Strategy Summary '.center(133, '='))
print(self._generate_text_table_strategy(all_results))
print('\nFor more details, please look at the detail tables above')
2018-03-17 21:43:36 +00:00
def setup_configuration(args: Namespace) -> Dict[str, Any]:
2017-11-22 23:25:06 +00:00
"""
Prepare the configuration for the backtesting
:param args: Cli args from Arguments()
:return: Configuration
"""
configuration = Configuration(args, RunMode.BACKTEST)
config = configuration.get_config()
# Ensure we do not use Exchange credentials
config['exchange']['key'] = ''
config['exchange']['secret'] = ''
2018-05-25 14:04:08 +00:00
if config['stake_amount'] == constants.UNLIMITED_STAKE_AMOUNT:
raise DependencyException('stake amount could not be "%s" for backtesting' %
constants.UNLIMITED_STAKE_AMOUNT)
return config
2018-03-17 21:43:36 +00:00
def start(args: Namespace) -> None:
"""
Start Backtesting script
:param args: Cli args from Arguments()
:return: None
2017-11-22 23:25:06 +00:00
"""
# Initialize configuration
config = setup_configuration(args)
2018-03-25 19:41:25 +00:00
logger.info('Starting freqtrade in Backtesting mode')
# Initialize backtesting object
backtesting = Backtesting(config)
backtesting.start()