import numpy as np
import pandas as pd
import plotly.graph_objects as go
import pandas_datareader as web
import datetime as dt


import scipy.stats


# Download the CAD/USD quote history ('CADUSD=X' on the 'yahoo' source),
# starting 31 December 2016.
CAD = web.DataReader(
    'CADUSD=X',
    'yahoo',
    start='12/31/2016',
)
# Print a summary of the downloaded frame (index range, columns, dtypes).
CAD.info()

<class 'pandas.core.frame.DataFrame'>
DatetimeIndex: 999 entries, 2017-01-02 to 2020-11-03
Data columns (total 6 columns):
 #   Column     Non-Null Count  Dtype  
---  ------     --------------  -----  
 0   High       999 non-null    float64
 1   Low        999 non-null    float64
 2   Open       999 non-null    float64
 3   Close      999 non-null    float64
 4   Volume     999 non-null    float64
 5   Adj Close  999 non-null    float64
dtypes: float64(6)
memory usage: 54.6 KB


# Plot the closing exchange rate with Plotly graph objects,
# using a date x axis and a log-scaled y axis.
fig1 = go.Figure()
fig1.add_trace(
    go.Scatter(x=CAD.index, y=CAD['Close'], name='CAD/USD')
)
fig1.update_layout(
    title="CAD/USD Exchange Rate",
    xaxis_type="date",
    yaxis_type="log",
)
fig1.show()


# Benchmark: the MA strategy backtests are compared with a long-only
# exposure to the Canadian dollar.
price = np.array(CAD['Close'])

# Daily log return of the close; the first entry is NaN because shift(1)
# has no previous value there.
LongOnlyReturn = np.log(CAD['Close'] / CAD['Close'].shift(1))

# Cumulative return of the long-only strategy.
LongOnly = np.exp(LongOnlyReturn.cumsum())


#This is the first definition of the MA function, from textbooks. It applies to the whole time series. I think I shall use it to compare fully in-sample with out-of-sample returns.
#It calculates the exposures over the whole period for given MA parameters i and j. Then it calculates the returns arising from these exposures, and evaluates a maximization criterion: total return divided by a standard deviation (the code below takes it over the negative returns only).
# (In a future version I'll replace standard deviation by asymmetric deviation.)

def MAstrat0(i,j, SD=0.00):
    """Run an i/j moving-average crossover over the whole CAD close series.

    Reads the module-level ``CAD`` frame and ``LongOnlyReturn`` series.

    Parameters
    ----------
    i, j : int
        Rolling-window lengths of the two moving averages.
    SD : float, optional
        Minimum absolute gap between the two averages; a smaller gap
        gives a flat (zero) position.

    Returns
    -------
    tuple
        ``(MAcrit, MAreturn, MAstrategy, MA1, MA2, Long)``: the selection
        criterion (sum of strategy returns divided by the standard
        deviation of the negative strategy returns), the per-period
        strategy returns, their exponentiated cumulative sum, the two
        moving averages (NaN during warm-up) and the position sign.
    """
    close = CAD['Close']
    MA1 = np.array(close.rolling(i).mean())
    MA2 = np.array(close.rolling(j).mean())

    # Position is the sign of the gap between the averages; it is flat
    # while either average is still undefined or the gap is below SD.
    spread = MA1 - MA2
    no_trade = np.isnan(spread) | (np.abs(spread) < SD)
    Long = np.sign(np.where(no_trade, 0, spread))

    # The position held at one observation earns the next observation's return.
    MAreturn = Long[:-1] * np.array(LongOnlyReturn[1:])
    MAstrategy = np.exp(MAreturn.cumsum())

    # Criterion for choosing the MA parameters.
    losing = MAreturn[MAreturn < 0]
    MAcrit = MAreturn.sum() / losing.std()
    return MAcrit, MAreturn, MAstrategy, MA1, MA2, Long

# Criterion of a 7/20 crossover over the whole series.
MAcrit0 = MAstrat0(7, 20, SD=0.00)[0]
print(MAcrit0)

27.239010031230375


# Length of the in-sample test window.
N = 500
# In-sample prices: positions 0 to N-1 of the close series.
ISprice = np.array(CAD['Close'].iloc[:N])


#The second definition, below, calculates exposures, returns, and the maximization criterion on a subsample of prices, from inception to N-1.

def MAstrat1(ISprice, i,j, SD=0.00): 
    """Evaluate an i/j moving-average crossover on the price window ISprice.

    All quantities, including the daily log returns, are derived from the
    prices that are passed in, so the function gives consistent results for
    any window (in-sample prefix, out-of-sample tail or the full series).

    Parameters
    ----------
    ISprice : array-like of float
        Consecutive prices of the window to evaluate.
    i, j : int
        Lengths (in observations) of the two moving averages.
    SD : float, optional
        Minimum absolute gap between the averages; a smaller gap gives a
        flat (zero) position.

    Returns
    -------
    tuple
        ``(MAcrit, MAreturn, MAstrategy, MA1, MA2, Long)``.
        ``MA1`` and ``MA2`` have ``len(ISprice) - window + 1`` elements
        each and both end on the last price. ``Long`` has
        ``len(ISprice) - max(i, j) + 1`` elements. ``MAreturn`` and
        ``MAstrategy`` have one element fewer than ``Long``.
        ``MAcrit`` is the sum of the strategy returns divided by the
        standard deviation of the negative strategy returns; it is NaN
        when there are no negative returns.

    Raises
    ------
    ValueError
        If the longer window exceeds the number of prices.
    """
    prices = np.asarray(ISprice, dtype=float)
    offset = max(i, j)
    if offset > len(prices):
        raise ValueError(
            f"longest window ({offset}) exceeds the number of prices ({len(prices)})"
        )

    # A 'valid' convolution with a box kernel is a trailing simple moving
    # average: element k is the mean of prices[k:k+window].
    MA1 = np.convolve(prices, np.ones(i), 'valid')/i
    MA2 = np.convolve(prices, np.ones(j), 'valid')/j

    # Both averages end on the last price, so align them on their tails.
    realSize = min(MA1.shape[0], MA2.shape[0])
    buy = MA1[-realSize:] - MA2[-realSize:]
    buy[np.abs(buy) < SD] = 0  # optional minimum threshold for trading
    Long = np.sign(buy)

    # Daily log returns of this window; dayReturn[k] is the move from
    # prices[k] to prices[k+1].
    dayReturn = np.log(prices[1:] / prices[:-1])

    # Long[k] is known at observation offset-1+k and earns the return of
    # the following observation, i.e. dayReturn[offset-1+k].
    MAreturn = Long[:-1] * dayReturn[offset-1:]
    MAstrategy = np.exp(np.cumsum(MAreturn))

    # Maximization criterion: total return scaled by downside deviation.
    MAcrit = np.sum(MAreturn)/np.std(MAreturn[MAreturn<0])
    return MAcrit, MAreturn, MAstrategy, MA1, MA2, Long

# Criterion of a 7/20 crossover on the in-sample window only.
MAcrit1 = MAstrat1(ISprice, 7, 20)[0]
print(MAcrit1)

16.919484189909767


#These parameters will be applied to out-of-sample testing
# Exhaustive search over every window pair 1 <= i < j < n on the in-sample
# prices, keeping the pair with the highest criterion.
MAmaxcrit = -np.inf  # np.inf, not np.Inf: the capitalised alias was removed in NumPy 2.0
n=250 #exclusive upper bound for i and j (largest window tested is n-1)
# Cell [i-1, j-1] holds the criterion for (i, j); untested cells stay 0.
MACritij = np.zeros((n-1,n-1))

for i in range(1, n):
    for j in range(i+1, n):
        MAcrit = MAstrat1(ISprice, i,j, 0.00)[0]
        MACritij[i-1,j-1] = MAcrit
        # A NaN criterion compares False here, so it is never selected.
        if MAcrit>MAmaxcrit:
            MAmaxcrit = MAcrit
            imax = i
            jmax = j

print(f'i={imax}, j={jmax}, Maximization criterion = {MAmaxcrit}')

i=18, j=20, Maximization criterion = 69.01765325797


# Surface plot of the criterion grid (one of several ways to plot it).
z = MACritij
fig = go.Figure(data=[go.Surface(z=z)])
fig.update_layout(
    title='MA Parameters Heatmap for Initial In-sample Window',
    scene_camera_eye={'x': 1, 'y': -1.5, 'z': 0.25},
    autosize=False,
    width=600,
    height=600,
    margin={'l': 65, 'r': 50, 'b': 65, 't': 90},
)
fig.show()


#Pure in-sample testing applies the optimization criterion to the whole data series. 
# Same exhaustive search as for the in-sample window, but scored with
# MAstrat0 over the full series.

MAmaxcrit = -np.inf  # np.inf, not np.Inf: the capitalised alias was removed in NumPy 2.0
n=250 #exclusive upper bound for i and j (largest window tested is n-1)
MACritij = np.zeros((n-1,n-1))

for i in range(1, n):
    for j in range(i+1, n):
        MAcrit = MAstrat0(i,j, 0.00)[0]
        MACritij[i-1,j-1] = MAcrit #(because the number of days lookback is matrix index+1)
        # A NaN criterion compares False here, so it is never selected.
        if MAcrit>MAmaxcrit:
            MAmaxcrit = MAcrit
            ISimax = i
            ISjmax = j

print(f'i={ISimax}, j={ISjmax}, Maximization criterion = {MAmaxcrit}')

i=9, j=10, Maximization criterion = 98.45235047862056


# Surface plot of the full-series criterion grid, with both horizontal
# axes rescaled to the unit interval.
z = MACritij
x = np.linspace(0, 1, n-1)
y = np.linspace(0, 1, n-1)
fig = go.Figure(data=[go.Surface(z=z, x=x, y=y)])
fig.update_layout(
    title='MA Parameters Heatmap for the full series',
    scene_camera_eye={'x': 1, 'y': -1.5, 'z': 0.25},
    autosize=False,
    width=500,
    height=500,
    margin={'l': 65, 'r': 50, 'b': 65, 't': 90},
)
fig.show()


# Use the window pair selected on the in-sample grid search.
i, j = imax, jmax

# Out-of-sample only: prices from position N to the end.
OSprice = np.array(CAD['Close'].iloc[N:])
OSMAcrit, OSMAreturn, OSMAstrategy, OSMA1, OSMA2, OSLong = MAstrat1(OSprice, i, j, SD=0.00)

# In-sample only: the first N days.
ISprice = np.array(CAD['Close'].iloc[:N])
ISMAcrit, ISMAreturn, ISMAstrategy, ISMA1, ISMA2, ISLong = MAstrat1(ISprice, i, j, SD=0.00)

# Combined in-sample and out-of-sample: the whole price series.
MAcrit, MAreturn, MAstrategy, MA1, MA2, Long = MAstrat1(price, i, j, SD=0.00)
print(MAcrit)

# Fully in-sample: the pair optimised over the whole period, scored by MAstrat0.
IMAcrit, IMAreturn, IMAstrategy, IMA1, IMA2, ILong = MAstrat0(ISimax, ISjmax, SD=0.00)
print(IMAcrit)

49.130736255897304
98.45235047862056


# Cumulative performance: long-only benchmark against the MA strategy run
# on the whole series and on the in-sample window.
fig = go.Figure(
    data=[
        go.Scatter(
            x=CAD.index[ISjmax:],
            y=LongOnly[ISjmax:],
            name='Long-only',
        ),
        go.Scatter(
            x=CAD.index[jmax:],
            y=MAstrategy,
            name='MA Strategy - Out of Sample',
            line_color='#008000',
        ),
        go.Scatter(
            x=CAD.index[jmax:],
            y=ISMAstrategy,
            name='MA Strategy - In Sample',
            line_color='#FF0000',
        ),
    ]
)
fig.update_layout(title="MA Trading Strategy")
fig.show()


# Price, both moving averages and the resulting position (regime) on one
# chart; the regime uses the left axis, everything else the right axis.
layout = go.Layout(title='MA Combined Trading Exposures', yaxis=dict(), yaxis2=dict(overlaying='y', side='right'))
fig = go.Figure(layout=layout)
fig.add_trace(go.Scatter(x=CAD.index[jmax:], y=CAD['Close'][jmax:], name='CAD/USD', yaxis='y2'))
# MA1, MA2 and Long have different lengths but all end on the last
# observation (assumes they come from MAstrat1 run on the whole series),
# so each is dated from the tail of the index instead of a common start.
fig.add_trace(go.Scatter(x=CAD.index[-len(MA1):], y=MA1, name='MA1',yaxis='y2'))
fig.add_trace(go.Scatter(x=CAD.index[-len(MA2):], y=MA2, name='MA2',yaxis='y2'))
fig.add_trace(go.Scatter(x=CAD.index[-len(Long):], y=Long, name='Regime', yaxis='y1'))
fig.show()


#MAreturn = MAreturn[~np.isnan(MAreturn)] #but there shouldn't be any NaNs.


# Summary statistics of the purely in-sample strategy returns.

x = scipy.stats.describe(IMAreturn)
# Keep every field except the (min, max) pair, which is split into two keys.
y = {field: value for field, value in x._asdict().items() if field != "minmax"}
y["min"], y["max"] = x.minmax
y["return/risk"] = x.mean / np.sqrt(x.variance)
y

{'nobs': 998,
 'mean': 0.0003025095202530839,
 'variance': 1.9130270981182766e-05,
 'skewness': -0.10596661471700308,
 'kurtosis': 2.2336758423097063,
 'min': -0.01942763655277548,
 'max': 0.01710653688278069,
 'return/risk': 0.06916374260973256}


# Summary statistics of the out-of-sample strategy returns.

x = scipy.stats.describe(OSMAreturn)
# Keep every field except the (min, max) pair, which is split into two keys.
y = {field: value for field, value in x._asdict().items() if field != "minmax"}
y["min"], y["max"] = x.minmax
y["return/risk"] = x.mean / np.sqrt(x.variance)
y

{'nobs': 479,
 'mean': -0.0002953344009014845,
 'variance': 1.8443823179364526e-05,
 'skewness': 0.09978313275578958,
 'kurtosis': 0.8422426522732414,
 'min': -0.013882836595837231,
 'max': 0.015133424294694877,
 'return/risk': -0.0687683433290615}


# Histogram of the first N combined-run strategy returns.
# NOTE(review): MAreturn starts max(i, j) observations into the series, so
# position N in MAreturn is not date N - confirm the intended split point.
plotarray = [
    go.Histogram(x=MAreturn[:N], nbinsx=50, marker_color='#FF0000'),
]
figlayout = dict(title='Distribution of MA In-Sample Strategy returns')
fig = go.Figure(data=plotarray, layout=figlayout)
fig.show()


# Histogram of the combined-run strategy returns from position N onwards.
plotarray = [
    go.Histogram(x=MAreturn[N:], nbinsx=50, marker_color='#008000'),
]
figlayout = dict(title='Distribution of MA Out-of-Sample Strategy returns')
fig = go.Figure(data=plotarray, layout=figlayout)
fig.show()


def Rolling(data,n): 
    """Return the rolling mean and standard deviation of data over n points.

    Window ``k`` covers ``data[k:k+n]``. As in the original implementation,
    ``len(data) - n`` windows are produced, so the window ending on the
    last observation is not included.

    Parameters
    ----------
    data : array-like of float
        One-dimensional series (e.g. daily returns).
    n : int
        Window length; must be positive and no longer than ``data``.

    Returns
    -------
    (RollRet, RollStd) : tuple of numpy.ndarray
        Per-window mean and population standard deviation (``ddof=0``),
        each of length ``len(data) - n``.

    Raises
    ------
    ValueError
        If ``n`` is not positive or exceeds ``len(data)``.
    """
    values = np.asarray(data, dtype=float)
    count = len(values) - n
    if n <= 0 or count < 0:
        raise ValueError(
            f"window length n={n} must be between 1 and len(data)={len(values)}"
        )

    RollRet = np.zeros(count)
    RollStd = np.zeros(count)

    for start in range(count):
        window = values[start:start + n]
        # mean()/std() return scalars, and std() is computed from squared
        # deviations, so it cannot turn NaN through a slightly negative
        # variance the way sqrt(E[x^2] - E[x]^2) can.
        RollRet[start] = window.mean()
        RollStd[start] = window.std()

    return RollRet, RollStd


# Rolling statistics over n observations (approximately 1 year) of the
# combined-run returns from position N onwards.
n = 252
data = MAreturn[N:]
RollRet, RollStd = Rolling(data, n)

# Annualise: mean return scales with 252, standard deviation with sqrt(252).
MeanRet = RollRet.mean()*252
StdDev = RollStd.mean()*np.sqrt(252)
print(f"Average 1-year Rolling Return:  {MeanRet:.4%} p.a.")
print(f"Average 1-year Standard Deviation:  {StdDev:.4%} p.a.")
print(f"Return/Risk Ratio: {MeanRet/StdDev:.2}")

Average 1-year Rolling Return:  -3.4422% p.a.
Average 1-year Standard Deviation:  6.5127% p.a.
Return/Risk Ratio: -0.53


# Same rolling statistics for the first N combined-run returns.
data = MAreturn[:N]
ISRollRet, ISRollStd = Rolling(data, n)

# Annualise: mean return scales with 252, standard deviation with sqrt(252).
MeanRet = ISRollRet.mean()*252
StdDev = ISRollStd.mean()*np.sqrt(252)
print(f"Average in-sample 1-year Rolling Return:  {MeanRet:.4%} p.a.")
print(f"Average in-sample 1-year Standard Deviation:  {StdDev:.4%} p.a.")
print(f"Return/Risk Ratio: {MeanRet/StdDev:.2}")

Average in-sample 1-year Rolling Return:  7.3396% p.a.
Average in-sample 1-year Standard Deviation:  7.0361% p.a.
Return/Risk Ratio: 1.0


# Annualised rolling return and standard deviation; the series from
# position N onwards are drawn as lines, the first-N series as markers.
layout = go.Layout(
    title='Annualized Rolling Performance',
    xaxis_type="date",
    yaxis={'tickformat': ".2%"},
    legend={'orientation': "h", 'yanchor': "bottom", 'y': 1, 'xanchor': "right", 'x': 1},
)

fig2 = go.Figure(layout=layout)
fig2.add_trace(go.Scatter(
    x=CAD.index[n+jmax+N:],
    y=RollRet*252,
    name='Out-of-Sample Rolling Return',
    line_color='#008000',
))
fig2.add_trace(go.Scatter(
    x=CAD.index[n+jmax:N],
    y=ISRollRet*252,
    name='In-Sample Rolling Return',
    mode='markers',
    line_color='#008000',
))
fig2.add_trace(go.Scatter(
    x=CAD.index[n+jmax+N:],
    y=RollStd*np.sqrt(252),
    name='Out-of-Sample Rolling Standard Deviation',
    line_color='#FF0000',
))
fig2.add_trace(go.Scatter(
    x=CAD.index[n+jmax:N],
    y=ISRollStd*np.sqrt(252),
    name='In-Sample Rolling Standard Deviation',
    mode='markers',
    line_color='#FF0000',
))
fig2.show()

Backtesting: In-Sample (IS) versus Out-of-Sample (OS)

Example: Moving Average trading strategy on the CADUSD exchange rate