diff --git a/README.md b/README.md index 7db3459..1f221f5 100644 --- a/README.md +++ b/README.md @@ -32,11 +32,15 @@ Probabilistic regression example on the Boston housing dataset: ```python from ngboost import NGBRegressor -from sklearn.datasets import load_boston from sklearn.model_selection import train_test_split from sklearn.metrics import mean_squared_error -X, Y = load_boston(True) +#Load Boston housing dataset +data_url = "http://lib.stat.cmu.edu/datasets/boston" +raw_df = pd.read_csv(data_url, sep="\s+", skiprows=22, header=None) +X = np.hstack([raw_df.values[::2, :], raw_df.values[1::2, :2]]) +Y = raw_df.values[1::2, 2] + X_train, X_test, Y_train, Y_test = train_test_split(X, Y, test_size=0.2) ngb = NGBRegressor().fit(X_train, Y_train)