import pandas as pd
import matplotlib.pyplot as plt
import matplotlib.style as style
import seaborn as sns
import yfinance as yf

# Start from matplotlib's stock look, then layer the notebook-wide overrides on top.
style.use("default")

# Shared figure styling: small 8pt sans-serif text, no top/right spines,
# and a faint dotted grey grid on every axes.
params = {
    # text sizes
    "axes.labelsize": 8,
    "font.size": 8,
    "legend.fontsize": 8,
    "xtick.labelsize": 8,
    "ytick.labelsize": 8,
    # text rendering
    "text.usetex": False,
    "font.family": "sans-serif",
    # axes frame
    "axes.spines.top": False,
    "axes.spines.right": False,
    # grid
    "grid.color": "grey",
    "axes.grid": True,
    "grid.alpha": 0.5,
    "grid.linestyle": ":",
}
plt.rcParams.update(params)

# Use Yahoo Finance to download daily historical data for QQQ
# from 2006-01-01 through the end of 2023 (yfinance documents `end` as exclusive).
# auto_adjust=False is passed explicitly because the code below reads the
# "Adj Close" column; newer yfinance releases reportedly default to
# auto_adjust=True, which omits that column -- verify against the installed version.
qqq_daily = yf.download(
    "QQQ",
    start="2006-01-01",
    end="2023-12-31",
    auto_adjust=False,
)

# Quick visual sanity check of the downloaded price series.
qqq_daily["Adj Close"].plot(title="QQQ Daily Adjusted Close", figsize=(5, 3))
plt.show()

[*********************100%%**********************]  1 of 1 completed

# Monthly returns of QQQ.
# Resample the daily adjusted close to calendar-month frequency, forward-filling
# onto each month-end label, and keep the result as a one-column frame.
month_end_close = qqq_daily["Adj Close"].resample("M").ffill()
qqq_monthly = month_end_close.to_frame()

# Label rows by month (e.g. 2006-02) rather than by month-end timestamp.
qqq_monthly.index = qqq_monthly.index.to_period("M")

# Month-over-month change expressed in percent; rows containing missing
# values (such as the first month, which has no predecessor) are dropped.
qqq_monthly["Return"] = 100 * qqq_monthly["Adj Close"].pct_change()
qqq_monthly = qqq_monthly.dropna()
qqq_monthly

# Step 2: Load the monthly three factors into a dataframe
# Expected CSV layout: a header row with the column names, then one row per
# month with columns <date>, Mkt-RF, SMB, HML, RF.
# The first (unnamed) column holds the date as YYYYMM and becomes the index.
ff_factors_monthly = pd.read_csv(
    "./data/F-F_Research_Data_Factors-monthly.CSV",
    index_col=0,
)
ff_factors_monthly.index.name = "Date"

# Parse YYYYMM into timestamps, then convert to monthly periods so the index
# can be compared with other month-indexed data.
ff_factors_monthly.index = pd.to_datetime(
    ff_factors_monthly.index, format="%Y%m"
).to_period("M")
ff_factors_monthly

# Keep only the factor rows whose month also appears in the asset's index.
# .copy() gives an independent frame so the new column below does not write
# into a view of ff_factors_monthly.
shared_months = ff_factors_monthly.index.isin(qqq_monthly.index)
ff_factors_subset = ff_factors_monthly.loc[shared_months].copy()

# Step 3: Excess return of the asset = asset return minus the risk-free rate,
# matched row-by-row on the shared monthly index.
ff_factors_subset["Excess_Return"] = qqq_monthly["Return"].sub(ff_factors_subset["RF"])
ff_factors_subset

import statsmodels.api as sm

# Regressors: the three factor columns, with a constant column prepended so
# the fitted model includes an intercept.
X = sm.add_constant(ff_factors_subset[["Mkt-RF", "SMB", "HML"]])

# Regressand: the asset's excess return.
y = ff_factors_subset["Excess_Return"]

# Fit by ordinary least squares and print the full regression report.
model = sm.OLS(endog=y, exog=X).fit()
print(model.summary())

                            OLS Regression Results
==============================================================================
Dep. Variable:          Excess_Return   R-squared:                       0.906
Model:                            OLS   Adj. R-squared:                  0.905
Method:                 Least Squares   F-statistic:                     680.7
Date:                Mon, 26 Feb 2024   Prob (F-statistic):          3.43e-108
Time:                        09:15:36   Log-Likelihood:                -413.33
No. Observations:                 215   AIC:                             834.7
Df Residuals:                     211   BIC:                             848.1
Df Model:                           3
Covariance Type:            nonrobust
==============================================================================
                 coef    std err          t      P>|t|      [0.025      0.975]
------------------------------------------------------------------------------
const          0.2397      0.116      2.067      0.040       0.011       0.468
Mkt-RF         1.1338      0.026     42.788      0.000       1.082       1.186
SMB           -0.0565      0.049     -1.155      0.249      -0.153       0.040
HML           -0.4177      0.035    -11.949      0.000      -0.487      -0.349
==============================================================================
Omnibus:                        0.661   Durbin-Watson:                   2.269
Prob(Omnibus):                  0.719   Jarque-Bera (JB):                0.764
Skew:                          -0.123   Prob(JB):                        0.682
Kurtosis:                       2.842   Cond. No.                         4.93
==============================================================================

Notes:
[1] Standard Errors assume that the covariance matrix of the errors is correctly specified.

# Step 5.2: Plot the coefficients and their confidence intervals
# Position 0 of the fitted parameters is the intercept ("const"); skip it so
# only the factor loadings are shown.
factors = model.params.index[1:]  # ['Mkt-RF', 'SMB', 'HML']
coefficients = model.params.values[1:]

# conf_int() yields one row per parameter with the lower bound in the first
# column and the upper bound in the second. Keep the per-factor rows (the
# previous version collapsed this to a single row of interval widths, which
# made the lower bound NaN and repeated one width for every factor).
confidence_intervals = model.conf_int().iloc[1:]

# Create a DataFrame. Bounds are passed as plain arrays so pandas does not try
# to align them on the factor-name index.
ols_data = pd.DataFrame(
    {
        "Factor": factors,
        "Coefficient": coefficients,
        "Confidence_Lower": confidence_intervals.iloc[:, 0].to_numpy(),
        "Confidence_Upper": confidence_intervals.iloc[:, 1].to_numpy(),
    }
)

# Plotting
plt.figure(figsize=(3, 3))
sns.barplot(x="Factor", y="Coefficient", data=ols_data, capsize=0.2, palette="coolwarm")

# Draw the confidence interval of each coefficient as an error bar. errorbar
# expects distances from the point estimate (below, above), not absolute bounds.
plt.errorbar(
    x=range(len(ols_data)),
    y=ols_data["Coefficient"].to_numpy(),
    yerr=[
        (ols_data["Coefficient"] - ols_data["Confidence_Lower"]).to_numpy(),
        (ols_data["Confidence_Upper"] - ols_data["Coefficient"]).to_numpy(),
    ],
    fmt="none",
    ecolor="black",
    elinewidth=0.8,
    capsize=3,
)

# Add the p-value for each factor to the plot; bar i sits at x position i.
for position, factor in enumerate(ols_data["Factor"]):
    plt.text(
        position,
        0.2,
        f"p-value:{model.pvalues[factor]:.4f}",
        ha="center",
        va="bottom",
        fontsize=6,
    )

# The title is split over two lines so it fits the narrow 3x3 inch figure.
plt.title("Impact of Fama-French Factors on\nQQQ Monthly Returns (2006-2023)")
plt.xlabel("Factor")
plt.ylabel("Coefficient Value")
plt.axhline(0, color="black", linewidth=0.8, linestyle="--")
plt.show()

# Load the monthly five-factor file; the first CSV column becomes the index
# and is labelled "Date". The index is left unparsed here.
ff_factors_monthly = pd.read_csv(
    "./data/F-F_Research_Data_5_Factors_2x3-monthly.csv",
    index_col=0,
).rename_axis("Date")
ff_factors_monthly

# Parse the YYYYMM index into timestamps so the frame can be resampled.
ff_factors_monthly.index = pd.to_datetime(ff_factors_monthly.index, format="%Y%m")

# Group the monthly rows by calendar quarter.
quarterly_groups = ff_factors_monthly.resample("Q")

# Quarterly factors are the plain sum of the monthly values in each quarter.
# NOTE(review): a sum does not compound the monthly figures -- confirm that
# this approximation is intended.
ff_factors_quarterly = quarterly_groups.sum()

# RF is not summed: it is overwritten with the RF value of the last month
# present in each quarter.
ff_factors_quarterly["RF"] = quarterly_groups["RF"].last()
ff_factors_quarterly

	Adj Close	Return
Date
2006-02	35.565815	-2.142885
2006-03	36.309525	2.091080
2006-04	36.240250	-0.190790
2006-05	33.616402	-7.240149
2006-06	33.595703	-0.061573
...	...	...
2023-08	376.493195	-1.483010
2023-09	357.367859	-5.079862
2023-10	349.986481	-2.065485
2023-11	387.850891	10.818821
2023-12	409.519989	5.586966

	Mkt-RF	SMB	HML	RF
Date
1926-07	2.96	-2.56	-2.43	0.22
1926-08	2.64	-1.17	3.82	0.25
1926-09	0.36	-1.40	0.13	0.23
1926-10	-3.24	-0.09	0.70	0.32
1926-11	2.53	-0.10	-0.51	0.31
...	...	...	...	...
2023-08	-2.39	-3.16	-1.06	0.45
2023-09	-5.24	-2.51	1.52	0.43
2023-10	-3.19	-3.87	0.19	0.47
2023-11	8.84	-0.02	1.64	0.44
2023-12	4.85	6.35	4.94	0.43

	Mkt-RF	SMB	HML	RF	Excess_Return
Date
2006-02	-0.30	-0.38	-0.34	0.34	-2.482885
2006-03	1.46	3.44	0.60	0.37	1.721080
2006-04	0.73	-1.42	2.34	0.36	-0.550790
2006-05	-3.57	-2.96	2.41	0.43	-7.670149
2006-06	-0.35	-0.39	0.85	0.40	-0.461573
...	...	...	...	...	...
2023-08	-2.39	-3.16	-1.06	0.45	-1.933010
2023-09	-5.24	-2.51	1.52	0.43	-5.509862
2023-10	-3.19	-3.87	0.19	0.47	-2.535485
2023-11	8.84	-0.02	1.64	0.44	10.378821
2023-12	4.85	6.35	4.94	0.43	5.156966

	Mkt-RF	SMB	HML	RMW	CMA	RF
Date
196307	-0.39	-0.41	-0.97	0.68	-1.18	0.27
196308	5.07	-0.80	1.80	0.36	-0.35	0.25
196309	-1.57	-0.52	0.13	-0.71	0.29	0.27
196310	2.53	-1.39	-0.10	2.80	-2.01	0.29
196311	-0.85	-0.88	1.75	-0.51	2.24	0.27
...	...	...	...	...	...	...
202308	-2.39	-3.65	-1.06	3.43	-2.37	0.45
202309	-5.24	-1.80	1.52	1.86	-0.83	0.43
202310	-3.19	-4.04	0.19	2.46	-0.66	0.47
202311	8.84	-0.12	1.64	-3.91	-1.00	0.44
202312	4.85	7.32	4.94	-3.07	1.32	0.43

	Mkt-RF	SMB	HML	RMW	CMA	RF
Date
1963-09-30	3.11	-1.73	0.96	0.33	-1.24	0.27
1963-12-31	3.51	-4.37	1.63	2.32	0.16	0.29
1964-03-31	5.19	1.64	7.69	-2.09	5.60	0.31
1964-06-30	2.79	-1.86	1.81	-1.71	-1.08	0.30
1964-09-30	2.99	0.57	2.53	-0.36	2.88	0.28
...	...	...	...	...	...	...
2022-12-31	6.02	-1.00	10.76	9.97	14.02	0.33
2023-03-31	6.58	-1.87	-13.67	0.81	-8.17	0.36
2023-06-30	7.42	-1.60	-8.02	2.79	-5.98	0.40
2023-09-30	-4.42	-2.59	4.57	4.72	-2.63	0.43
2023-12-31	10.50	3.16	6.77	-4.52	-0.34	0.43

Fama-French Factor Model in Python

How Fama-French's Factor Model Works

Example

Steps to Replicate Fama-French Three-Factor Model on QQQ in Python

Step 1: Collect Monthly Returns of Portfolio or Asset

Step 2: Calculate the Fama-French Factors

Step 3: Calculate Excess Returns of Portfolio or Asset

Step 4: Run the Regression Model

Step 5: Interpret the Results

Factor Interpretation

Model Diagnostics

Converting Monthly to Quarterly Factors