quantopian · twiecki · Aug 21, 2017 · Jul 31, 2017 · Jul 31, 2017 · Jul 31, 2017
diff --git a/.travis.yml b/.travis.yml
@@ -25,7 +25,7 @@ before_install:
   - cp pyfolio/tests/matplotlibrc .
 
 install:
-  - conda create -q -n testenv --yes python=$TRAVIS_PYTHON_VERSION ipython pyzmq numpy scipy nose matplotlib pandas Cython patsy flake8 seaborn runipy pytables networkx pandas-datareader matplotlib-tests joblib
+  - conda create -q -n testenv --yes python=$TRAVIS_PYTHON_VERSION ipython pyzmq numpy scipy nose matplotlib pandas Cython patsy flake8 seaborn scikit-learn runipy pytables networkx pandas-datareader matplotlib-tests joblib
   - source activate testenv
   - pip install nose_parameterized
   #- pip install --no-deps git+https://github.com/quantopian/zipline

diff --git a/pyfolio/timeseries.py b/pyfolio/timeseries.py
@@ -21,6 +21,7 @@
 import numpy as np
 import scipy as sp
 import scipy.stats as stats
+from sklearn import linear_model
 
 from . import utils
 from .utils import APPROX_BDAYS_PER_MONTH, APPROX_BDAYS_PER_YEAR
@@ -551,27 +552,27 @@ def rolling_beta(returns, factor_returns,
 def rolling_fama_french(returns, factor_returns=None,
                         rolling_window=APPROX_BDAYS_PER_MONTH * 6):
     """
-    Computes rolling Fama-French single factor betas.
+    Computes rolling Fama-French betas using a single multiple linear
+    regression on all factors (separate per-factor regressions are
+    problematic because the Fama-French factors are confounded).
 
-    Specifically, returns SMB, HML, and UMD.
+    Specifically, returns rolling betas to SMB, HML, and UMD.
 
     Parameters
     ----------
     returns : pd.Series
         Daily returns of the strategy, noncumulative.
          - See full explanation in tears.create_full_tear_sheet.
     factor_returns : pd.DataFrame, optional
-        data set containing the Fama-French risk factors. See
+        Data set containing the Fama-French risk factors. See
         utils.load_portfolio_risk_factors.
     rolling_window : int, optional
-        The days window over which to compute the beta.
-        Default is 6 months.
+        The days window over which to compute the beta. Defaults to 6 months.
 
     Returns
     -------
     pandas.DataFrame
-        DataFrame containing rolling beta coefficients for SMB, HML
-        and UMD
+        DataFrame containing rolling beta coefficients to SMB, HML and UMD
     """
 
     if factor_returns is None:
@@ -580,8 +581,31 @@ def rolling_fama_french(returns, factor_returns=None,
         factor_returns = factor_returns.drop(['Mkt-RF', 'RF'],
                                              axis='columns')
 
-    return rolling_beta(returns, factor_returns,
-                        rolling_window=rolling_window)
+    # Add the regression constant on a copy (assign returns a new frame)
+    # so that a caller-supplied factor_returns is never mutated.
+    factor_returns = factor_returns.assign(const=1)
+
+    # Pre-allocate one row per observation; rows without a full window
+    # of history stay NaN.
+    regression_coeffs = np.full((len(factor_returns.index),
+                                 len(factor_returns.columns)), np.nan)
+
+    window_bounds = zip(factor_returns.index[:-rolling_window],
+                        factor_returns.index[rolling_window:])
+    for offset, (beg, end) in enumerate(window_bounds):
+        model = linear_model.LinearRegression()
+        model.fit(factor_returns[beg:end], returns[beg:end])
+        # Store the fit for the window [beg, end] on the row of `end`.
+        regression_coeffs[rolling_window + offset] = model.coef_
+
+    # Only the first three columns are reported; the frame is assumed to
+    # hold SMB, HML and UMD first -- TODO confirm for caller-supplied data.
+    rolling_betas = pd.DataFrame(data=regression_coeffs[:, :3],
+                                 columns=['SMB', 'HML', 'UMD'],
+                                 index=factor_returns.index)
+    rolling_betas.index.name = None
+
+    return rolling_betas
 
 
 def gross_lev(positions):

diff --git a/setup.py b/setup.py
@@ -51,6 +51,7 @@
     'pandas>=0.19.0',
     'pytz>=2014.10',
     'scipy>=0.14.0',
+    'scikit-learn>=0.18.2',
     'seaborn>=0.7.1',
     'pandas-datareader>=0.2',
     'empyrical>=0.3.0'