# Heikin-Ashi backtest.py (forked from je-suis-tm/quant-trading)
# -*- coding: utf-8 -*-
"""
Created on Thu Feb 15 20:48:35 2018
@author: Administrator
"""
# In[1]:
#heikin ashi is a Japanese candlestick technique that filters out the noise for momentum trading
#it helps to avoid getting whipsawed by sideways chop
#basically we do a few transformations on four key price series - Open, Close, High, Low
#then apply some rules on ha Open, Close, High, Low to trade
#details of heikin ashi indicators and rules can be found in the following link
# https://quantiacs.com/Blog/Intro-to-Algorithmic-Trading-with-Heikin-Ashi.aspx
#the fix_yahoo_finance package needs to be installed first
#candlestick has been removed from matplotlib
#need to install mpl_finance instead
# In[2]:
import pandas as pd
import matplotlib.pyplot as plt
import fix_yahoo_finance as yf
import mpl_finance as mpf
import numpy as np
from scipy import integrate
from scipy.stats import t
# In[3]:
#Heikin Ashi has a unique method to filter out the noise
#its open, close, high, low require a different calculation approach
#please refer to the website mentioned above
def heikin_ashi(df1):
    """Return a copy of *df1* extended with Heikin-Ashi candle columns.

    The input must provide 'Open', 'Close', 'High' and 'Low' columns.
    Its index is moved into a regular column by ``reset_index`` so the
    result is addressed by position 0..n-1.

    Added columns:
      'HA close' - mean of Open, Close, High and Low of the same row
      'HA open'  - first row: the raw Open; afterwards the midpoint of the
                   previous row's 'HA open' and 'HA close'
      'HA high'  - row-wise max of HA open, HA close, Low, High
      'HA low'   - row-wise min of HA open, HA close, Low, High

    'Adj Close' and 'Volume' are dropped when present. The caller's frame
    is left untouched; use the returned frame.
    """
    data = df1.reset_index()
    data['HA close'] = (data['Open'] + data['Close'] + data['High'] + data['Low']) / 4

    # HA open is recursive (it depends on the previous HA open), so it is
    # filled sequentially into a plain array and assigned once. This avoids
    # chained assignment on the frame, which pandas does not guarantee to
    # write through.
    ha_close = data['HA close'].to_numpy(dtype=float)
    ha_open = np.zeros(len(data), dtype=float)
    if len(data):
        ha_open[0] = data['Open'].iloc[0]
    for n in range(1, len(data)):
        ha_open[n] = (ha_open[n - 1] + ha_close[n - 1]) / 2
    data['HA open'] = ha_open

    candle = data[['HA open', 'HA close', 'Low', 'High']]
    data['HA high'] = candle.max(axis=1)
    data['HA low'] = candle.min(axis=1)

    # some downloads carry no 'Adj Close' column, so dropping is best-effort
    return data.drop(columns=['Adj Close', 'Volume'], errors='ignore')
# In[4]:
#setting up signal generations
#trigger conditions can be found from the website mentioned above
#they kinda look like marubozu candles
#there should also be a short strategy
#as i am an individual investor, i only use long strategies
#the trigger condition of short strategy is the reverse of long strategy
#you have to satisfy all four conditions to long/short
#nevertheless, the exit signal only has three conditions
def signal_generation(df, method, stls=None):
    """Attach trading signals to the frame produced by ``method(df)``.

    Parameters
    ----------
    df : price data handed to *method* unchanged.
    method : callable returning a frame with 'HA open', 'HA close',
        'HA high' and 'HA low' columns.
    stls : maximum number of long positions held at once. When omitted,
        a module-level ``stls`` is used if one exists, otherwise 3.

    Returns
    -------
    The frame from *method* with two added columns:
      'signals' - 1 opens one long, a negative value closes that many
                  longs at once, 0 means no trade
      'cumsum'  - running sum of 'signals', i.e. longs held after each row

    Entry fires at row n when all four hold: HA open > HA close,
    HA open == HA high, the open/close gap is wider than on the previous
    row, and the previous row also had HA open > HA close.
    Exit fires when all three hold: HA open < HA close, HA open == HA low,
    and the previous row also had HA open < HA close.
    """
    if stls is None:
        # keep scripts working that define the limit as a module global
        stls = globals().get('stls', 3)

    df1 = method(df)

    ha_open = df1['HA open'].to_numpy()
    ha_close = df1['HA close'].to_numpy()
    ha_high = df1['HA high'].to_numpy()
    ha_low = df1['HA low'].to_numpy()

    signals = np.zeros(len(df1), dtype=int)

    # number of longs currently held; a running counter replaces
    # recomputing the whole cumulative sum on every signal
    held = 0

    for n in range(1, len(df1)):
        body = ha_open[n] - ha_close[n]
        prev_body = ha_open[n - 1] - ha_close[n - 1]

        if (body > 0 and ha_open[n] == ha_high[n]
                and abs(body) > abs(prev_body) and prev_body > 0):
            # stop adding longs once the limit is reached
            if held < stls:
                signals[n] = 1
                held += 1

        elif body < 0 and ha_open[n] == ha_low[n] and prev_body < 0:
            # clear every held position at once;
            # with nothing held the exit signal is ignored
            if held > 0:
                signals[n] = -held
                held = 0

    df1['signals'] = signals
    # computed once from the final signals so the two columns always agree
    df1['cumsum'] = df1['signals'].cumsum()

    return df1
# In[5]:
#plotting the backtesting result
def plot(df1, ticker):
    """Draw the Heikin-Ashi candles and the close price with trade markers.

    *df1* needs 'Date', 'Close', 'signals' and the four 'HA ...' columns.
    Its index is replaced in place by the 'Date' values. *ticker* is used
    as the legend label of the close price line.
    """
    df1.set_index(df1['Date'], inplace=True)

    #upper panel: Heikin-Ashi candlesticks fed with HA open, close, high, low
    candle_ax = plt.subplot2grid((200, 1), (0, 0), rowspan=120, ylabel='HA price')
    mpf.candlestick2_ochl(
        candle_ax,
        df1['HA open'],
        df1['HA close'],
        df1['HA high'],
        df1['HA low'],
        width=1,
        colorup='g',
        colordown='r',
    )
    plt.grid(True)
    plt.xticks([])
    plt.title('Heikin-Ashi')

    #lower panel: actual close price, entries as up arrows, exits as down arrows
    price_ax = plt.subplot2grid((200, 1), (120, 0), rowspan=80, ylabel='price', xlabel='')
    close = df1['Close']
    close.plot(ax=price_ax, label=ticker)

    entries = df1['signals'] == 1
    exits = df1['signals'] < 0

    #line width is zero so only the markers are visible
    price_ax.plot(df1.loc[entries].index, close[entries],
                  marker='^', lw=0, c='g', label='long')
    price_ax.plot(df1.loc[exits].index, close[exits],
                  marker='v', lw=0, c='r', label='short')

    plt.grid(True)
    plt.legend(loc='best')
    plt.show()
# In[6]:
#backtesting
def portfolio(df1, capital0=10000, positions=100):
    """Build the backtest ledger from a frame of signals.

    Parameters
    ----------
    df1 : frame with 'signals', 'Close' and 'Date' columns. It is only
        read; no column is added to it.
    capital0 : initial capital used to calculate the actual pnl.
    positions : shares traded per unit of signal.

    Returns
    -------
    DataFrame indexed by 'date' with columns
      'holdings'    - held units (running sum of signals) * Close * positions
      'cash'        - capital0 minus the cumulative cost of all trades
      'total asset' - holdings + cash
      'return'      - percentage change of total asset between rows
      'signals'     - copied from *df1*
    """
    signals = df1['signals']
    close = df1['Close']

    #running sum of signals is the number of units held after each row;
    #kept local so the caller's frame is not modified
    held = signals.cumsum()

    ledger = pd.DataFrame()
    ledger['holdings'] = held * close * positions
    ledger['cash'] = capital0 - (signals * close * positions).cumsum()
    ledger['total asset'] = ledger['holdings'] + ledger['cash']
    ledger['return'] = ledger['total asset'].pct_change()
    ledger['signals'] = signals
    ledger['date'] = df1['Date']
    ledger.set_index('date', inplace=True)

    return ledger
# In[7]:
#plotting the asset value change of the portfolio
def profit(portfolio):
    """Plot the total asset value over time with trade markers.

    *portfolio* needs 'total asset' and 'signals' columns; its index is
    used as the x axis.
    """
    figure = plt.figure()
    axis = figure.add_subplot(111)

    assets = portfolio['total asset']
    flags = portfolio['signals']

    assets.plot(label='Total Asset')

    #same marker mechanism as the price chart,
    #with total asset value in place of the close price
    bought = flags == 1
    sold = flags < 0
    axis.plot(flags.loc[bought].index, assets[bought],
              lw=0, marker='^', c='g', label='long')
    axis.plot(flags.loc[sold].index, assets[sold],
              lw=0, marker='v', c='r', label='short')

    plt.legend(loc='best')
    plt.grid(True)
    plt.xlabel('Date')
    plt.ylabel('Asset Value')
    plt.title('Total Asset')
    plt.show()
# In[8]:
#omega ratio is a variation of sharpe ratio
#the risk free return is replaced by a given threshold
#in this case, the return of benchmark
#integration is needed to calculate the return above and below the threshold
#it is a more reasonable ratio to measure the risk adjusted return
#normal distribution doesnt explain the fat tail of returns
#so i use the student T cumulative distribution function instead
#for reasons of simplicity, i do not use the empirical distribution
#the cdf of the empirical distribution is much more complex
def omega(risk_free, degree_of_freedom, maximum, minimum):
    """Return the omega ratio under a Student t distribution.

    The numerator integrates ``1 - cdf`` from *risk_free* (the threshold)
    up to *maximum*; the denominator integrates ``cdf`` from *minimum* up
    to *risk_free*. Both use ``t.cdf`` with *degree_of_freedom*.
    """
    def above_threshold(r):
        return 1 - t.cdf(r, degree_of_freedom)

    def below_threshold(r):
        return t.cdf(r, degree_of_freedom)

    #quad returns (value, error estimate); only the value is used
    upside, _ = integrate.quad(above_threshold, risk_free, maximum)
    downside, _ = integrate.quad(below_threshold, minimum, risk_free)

    return upside / downside
#sortino ratio is another variation of sharpe ratio
#the standard deviation of all returns is substituted with standard deviation of negative returns
#sortino ratio measures the impact of negative return on return
#i am also using student T probability distribution function instead of normal distribution
def sortino(risk_free, degree_of_freedom, growth_rate, minimum):
    """Return the sortino ratio under a Student t distribution.

    The denominator is the square root of the absolute value of the
    integral of ``(risk_free - g)**2 * t.pdf(g, degree_of_freedom)`` taken
    from *risk_free* to *minimum*; the numerator is
    ``growth_rate - risk_free``.
    """
    def squared_shortfall(r):
        return ((risk_free - r) ** 2) * t.pdf(r, degree_of_freedom)

    #limits run from the threshold down to the minimum, so the raw
    #integral may be negative; its magnitude is what matters
    integral, _ = integrate.quad(squared_shortfall, risk_free, minimum)
    downside_deviation = np.sqrt(np.abs(integral))

    return (growth_rate - risk_free) / downside_deviation
#i use a function to calculate maximum drawdown
#the idea is simple
#for every day, we take the current asset value
#to compare with the previous highest asset value
#we get our daily drawdown
#it is supposed to be negative if it is not the maximum for this period so far
#we implement a temporary variable to store the minimum value
#which is called maximum drawdown
#for each daily drawdown that is smaller than our temporary value
#we update the temp until we finish our traversal
#in the end we return the maximum drawdown
def mdd(series):
    """Return the maximum drawdown of *series* as a non-positive fraction.

    For every value after the first, the drawdown is the value divided by
    the highest earlier value, minus one. The most negative drawdown is
    returned; 0 is returned when the series never falls below an earlier
    peak, or has fewer than two values.

    *series* may be any iterable of numbers. Values are consumed in
    iteration order, so a pandas Series works whatever its index is.
    """
    values = iter(series)
    missing = object()
    peak = next(values, missing)
    if peak is missing:
        return 0

    worst = 0
    for value in values:
        drawdown = value / peak - 1
        if drawdown < worst:
            worst = drawdown
        #the running peak replaces rescanning all earlier values each step
        if value > peak:
            peak = value

    return worst
# In[9]:
#stats calculation
def stats(portfolio, df1, stdate, eddate, capital0=10000):
    """Print a one-row table of backtest statistics.

    Parameters
    ----------
    portfolio : frame with 'return' and 'total asset' columns.
    df1 : frame with 'signals' and 'cumsum' columns; its length is the
        number of periods used for every geometric average below.
    stdate, eddate : date range passed to the S&P500 benchmark download.
    capital0 : initial capital the final asset value is compared with.

    Ratios whose denominator is zero (no trades, zero deviation, no
    drawdown) are reported as NaN.

    NOTE(review): the period count is len(df1) while *portfolio* may cover
    only a slice of df1 - confirm this is intended.
    """
    def ratio(numerator, denominator):
        #undefined ratios become NaN instead of raising
        return numerator / denominator if denominator else np.nan

    periods = len(df1)

    #get the min and max of return
    maximum = np.max(portfolio['return'])
    minimum = np.min(portfolio['return'])

    final_asset = portfolio['total asset'].iloc[-1]

    #growth_rate denotes the average growth rate of portfolio per period
    #geometric average instead of arithmetic average for percentage growth
    growth_rate = (float(final_asset / capital0)) ** (1 / periods) - 1

    #standard deviation of returns around the average growth rate
    std = float(np.sqrt((((portfolio['return'] - growth_rate) ** 2).sum()) / periods))

    #use S&P500 as benchmark
    benchmark = yf.download('^GSPC', start=stdate, end=eddate)

    #rb denotes the return of benchmark over the whole range
    rb = float(benchmark['Close'].iloc[-1] / benchmark['Open'].iloc[0] - 1)

    #rf denotes the average growth rate of benchmark per period
    rf = (rb + 1) ** (1 / periods) - 1
    del benchmark

    max_drawdown = mdd(portfolio['total asset'])

    #every long is always one unit,
    #a short clears all held positions at once so it is any negative signal
    signals = df1['signals']
    longs = signals.loc[signals == 1].count()
    shorts = signals.loc[signals < 0].count()
    trades = longs + shorts

    #cumsum indicates the holding of positions
    #counting rows with a non-zero holding estimates the total length of trades
    total_length = signals.loc[df1['cumsum'] != 0].count()

    #the table is built in one go; writing single cells through
    #chained indexing is not guaranteed to modify the frame
    summary = pd.DataFrame([{
        #labelled CAGR, computed as the per-period geometric growth rate
        'CAGR': growth_rate,
        'portfolio return': final_asset / capital0 - 1,
        'benchmark return': rb,
        'sharpe ratio': ratio(growth_rate - rf, std),
        'maximum drawdown': max_drawdown,
        #calmar ratio: the standard deviation is replaced by maximum drawdown
        'calmar ratio': ratio(growth_rate, max_drawdown),
        'omega ratio': omega(rf, periods, maximum, minimum),
        'sortino ratio': sortino(rf, periods, growth_rate, minimum),
        'numbers of longs': longs,
        'numbers of shorts': shorts,
        'numbers of trades': trades,
        'total length of trades': total_length,
        'average length of trades': ratio(total_length, trades),
        'profit per trade': ratio(final_asset - capital0, trades),
    }])

    print(summary)
# In[10]:
#stop loss positions, the maximum long positions we can get
#without certain constraints, you will long indefinite times as long as the market condition triggers the signal
#in a whipsaw condition, it is suicidal
#kept at module level because signal_generation looks this name up in
#module scope; as a local variable of main() it would never be seen
stls = 3


def main():
    """Download prices, generate signals, plot and print the backtest."""
    ticker = 'NVDA'
    stdate = '2015-04-01'
    eddate = '2018-02-15'

    #slice is used for plotting
    #a three year dataset with 750 variables would be too much for a figure
    slicer = 700

    #downloading data
    df = yf.download(ticker, start=stdate, end=eddate)

    df1 = signal_generation(df, heikin_ashi)

    #plot() re-indexes its argument in place, so give it an independent
    #copy rather than a view-like slice of df1
    new = df1[slicer:].copy()
    plot(new, ticker)

    portfo = portfolio(new)
    profit(portfo)

    stats(portfo, df1, stdate, eddate)


#note that this is the only py file with complete stats calculation
if __name__ == '__main__':
    main()