from sklearn.linear_model import Lasso, Ridge, ElasticNet
# --- LASSO coefficient path -------------------------------------------------
# Regress the R1M_Usd column on the feature columns over a grid of penalty
# strengths and chart how the coefficients move with the penalty.
y_penalized = data_ml['R1M_Usd'].values  # dependent variable
X_penalized = data_ml[features].values  # predictors
# scikit-learn calls the penalty strength "alpha" (the "lambda" of the plot).
alphas = np.arange(1e-4, 1.0e-3, 1e-5)
lasso_res = {}  # penalty value -> fitted coefficient vector

for alpha in alphas:
    lasso = Lasso(alpha=alpha).fit(X_penalized, y_penalized)  # fit() returns the estimator
    lasso_res[alpha] = lasso.coef_

# One row per penalty value, one column per feature.
df_lasso_res = pd.DataFrame(lasso_res).T
df_lasso_res.columns = features
# Keep only features whose absolute coefficients, summed over the whole
# grid, exceed 0.05; the ridge plot further down reuses this mask.
predictors = df_lasso_res.abs().sum() > 0.05
df_lasso_res.loc[:, predictors].plot(xlabel='Lambda', ylabel='Beta', figsize=(12, 8));


# --- Ridge coefficient path -------------------------------------------------
# Same exercise as the LASSO path, but with a ridge penalty and a penalty
# grid that is log-spaced between 1e-2 and 1e4.
n_alphas = 50  # number of penalty values on the grid
alphas = np.logspace(-2, 4, n_alphas)
ridge_res = {}  # penalty value -> fitted coefficient vector

for alpha in alphas:
    ridge = Ridge(alpha=alpha)
    ridge.fit(X_penalized, y_penalized)
    ridge_res[alpha] = ridge.coef_

# One row per penalty value, one column per feature.
df_ridge_res = pd.DataFrame.from_dict(ridge_res).T
df_ridge_res.columns = features
# The grid spans six orders of magnitude, so the x-axis is drawn on a log
# scale; on a linear axis nearly every grid point is squeezed against the
# left edge and the path is unreadable. `predictors` is the feature mask
# computed from the LASSO results.
df_ridge_res.loc[:, predictors].plot(
    logx=True, xlabel='Lambda', ylabel='Beta', figsize=(13, 8));


# --- Back-test setup --------------------------------------------------------
# Dates strictly after `separation_date` are the out-of-sample rebalancing dates.
t_oos = returns.index[returns.index > separation_date].values
Tt = t_oos.shape[0]  # number of out-of-sample dates
nb_port = 3  # number of portfolios / strategies
port_weights, port_returns = {}, {}  # filled per date by the back-test loop


def weights_sparsehedge(returns, alpha, Lambda):
    """Compute sparse-hedging portfolio weights from a table of asset returns.

    Each column of ``returns`` is regressed in turn on all the other columns
    with an elastic net. The raw weight of that asset is one minus the sum of
    the fitted coefficients, divided by the variance of the in-sample
    residuals. The raw weights are then rescaled to sum to one.

    Parameters
    ----------
    returns : DataFrame with one column per asset.
    alpha : forwarded to ``ElasticNet`` as ``alpha``.
    Lambda : forwarded to ``ElasticNet`` as ``l1_ratio``.

    Returns
    -------
    numpy array holding one weight per column of ``returns``.
    """
    model = ElasticNet(alpha=alpha, l1_ratio=Lambda)  # one estimator, refitted per asset
    raw = []
    for asset in returns.columns:
        target = returns[asset].values  # the asset being hedged
        others = returns.drop(asset, axis=1).values  # all remaining assets
        model.fit(others, target)
        residuals = target - model.predict(others)  # in-sample hedging errors
        raw.append((1 - model.coef_.sum()) / residuals.var())
    raw = np.asarray(raw)
    return raw / raw.sum()


def weights_multi(returns, j, alpha, Lambda):
    """Return the portfolio weights of strategy ``j`` estimated on ``returns``.

    Parameters
    ----------
    returns : 2-D table of past returns with one column per asset (a
        DataFrame or a 2-D array; only ``.shape`` and ``.T`` are used here).
    j : strategy selector.
        0 -> equally weighted,
        1 -> minimum variance on the sample covariance plus ``1e-2 * I``,
        2 -> sparse hedging via ``weights_sparsehedge``.
    alpha, Lambda : elastic-net parameters, used only when ``j == 2``.

    Returns
    -------
    numpy array of N weights that sum to one.

    Raises
    ------
    ValueError
        If ``j`` is not 0, 1 or 2. Previously the function fell through and
        returned ``None``, which only surfaced later as an obscure error in
        the caller.
    """
    N = returns.shape[1]
    if j == 0:  # equally weighted
        return np.repeat(1 / N, N)
    if j == 1:  # minimum variance
        # The ridge term on the diagonal keeps the covariance matrix well
        # conditioned when there are few dates relative to assets.
        sigma = np.cov(returns.T) + 1e-2 * np.identity(N)
        # Solve sigma @ w = 1 directly rather than forming the explicit
        # inverse: same solution, cheaper and numerically more stable.
        w = np.linalg.solve(sigma, np.ones(N))
        return w / np.sum(w)
    if j == 2:  # penalised / elastic-net sparse hedging
        return weights_sparsehedge(returns, alpha, Lambda)
    raise ValueError(f"unknown strategy index j={j!r}; expected 0, 1 or 2")


# --- Back-test: one pass per out-of-sample rebalancing date ------------------
for m, month in np.ndenumerate(t_oos):
    temp_data = returns.loc[returns.index < month]  # history available before the date
    realised_returns = returns.loc[returns.index == month].values  # returns realised on the date
    weights_temp, returns_temp = {}, {}

    for j in range(nb_port):  # one entry per strategy
        wgts = weights_multi(temp_data, j, 0.1, 0.1)  # elastic-net parameters are hard-coded
        rets = (wgts * realised_returns).sum()  # realised portfolio return
        weights_temp[j], returns_temp[j] = wgts, rets

    port_weights[month] = weights_temp  # stored for reference; not read below
    port_returns[month] = returns_temp

# Stack the nested {date: {strategy: return}} dict into a long table with one
# row per (date, strategy) pair.
port_returns_final = pd.concat(
    {
        date: pd.DataFrame.from_dict(by_strategy, orient='index')
        for date, by_strategy in port_returns.items()
    },
    axis=0,
).reset_index()

colnames = ['date', 'strategy', 'return']
port_returns_final.columns = colnames
strategies_name = {0: 'EW', 1: 'MV', 2: 'Sparse'}  # strategy index -> label
port_returns_final['strategy'] = port_returns_final['strategy'].replace(strategies_name)
# Standard deviation of returns per strategy, shown as a single-row table.
port_returns_final.groupby('strategy')['return'].std().to_frame().T


# --- Predictive elastic-net regression ---------------------------------------
# Fit on the training sample.
y_penalized_train = training_sample['R1M_Usd'].values  # dependent variable
X_penalized_train = training_sample[features].values  # predictors
model = ElasticNet(alpha=0.1, l1_ratio=0.1)
fir_pen_pred = model.fit(X_penalized_train, y_penalized_train)  # fit() returns the estimator


# Score on the testing sample: mean squared prediction error.
y_penalized_test = testing_sample['R1M_Usd'].values  # dependent variable
X_penalized_test = testing_sample[features].values  # predictors
mse = np.mean(np.square(fir_pen_pred.predict(X_penalized_test) - y_penalized_test))
print(f'MSE: {mse}')

# Output: MSE: 0.03699695809185004


# Hit ratio: share of test observations where the prediction and the realised
# value have the same sign (their product is strictly positive).
hitratio = (fir_pen_pred.predict(X_penalized_test) * y_penalized_test > 0).mean()
print(f'Hit Ratio: {hitratio}')

# Output: Hit Ratio: 0.5460346399270738

Chapter 5 Penalized regressions and sparse hedging for minimum variance portfolios

5.1 Penalized regressions

5.1.1 Simple regressions

5.1.2 Forms of penalizations

5.1.3 Illustrations

5.2 Sparse hedging for minimum variance portfolios

5.2.1 Presentation and derivations

5.2.2 Example

5.3 Predictive regressions

5.3.1 Literature review and principle

5.3.2 Code and results

5.4 Coding exercises

References