RAMP on predicting cyclist traffic in Paris¶

Authors: Roman Yurchak (Symerio), Sylvain Combettes (Probabl), François Caud (DATAIA); also partially inspired by the air_passengers starting kit.

Introduction¶

The dataset was collected with cyclist counters installed by Paris city council in multiple locations. It contains hourly information about cyclist traffic, as well as the following features,

  • counter name
  • counter site name
  • date
  • counter installation date
  • latitude and longitude

Available features are quite scarce. However, we can also use any external data that can help us predict the target variable.
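
For instance, weather is known to influence cycling. As a minimal sketch (not part of the starting kit), hourly weather readings could be joined onto the data once it is loaded below, assuming a hypothetical weather.csv file with date and temperature columns (the file and column names are illustrative):

import pandas as pd

# Hypothetical hourly weather file (illustrative name and columns)
weather = pd.read_csv("weather.csv", parse_dates=["date"])

# merge_asof pairs each row with the most recent weather reading;
# both frames must be sorted by the join key
data = pd.merge_asof(data.sort_values("date"), weather.sort_values("date"), on="date")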

Loading and exploring the data¶

Loading the data with pandas¶

First, if not done already, download the data files with the download_data.py script (make sure the notebook kernel runs in the ramp-bike-skore environment; a !conda activate line would have no effect here, as each ! command runs in its own subshell):

!python download_data.py

It will untar the archive and put the train and test files in the data folder.

Data is stored in Parquet, an efficient columnar format. We can load the train set with pandas,

In [1]:
import pandas as pd
from pathlib import Path

data = pd.read_parquet(Path("data") / "train.parquet").sort_values(by="date")
In [2]:
data.head()
Out[2]:
counter_id counter_name site_id site_name bike_count date counter_installation_date counter_technical_id latitude longitude log_bike_count
705677 100056332-104056332 Pont de Bercy SO-NE 100056332 Pont de Bercy 0.0 2020-09-01 01:00:00 2019-12-11 Y2H19070378 48.83848 2.37587 0.000000
333389 100047547-104047547 6 rue Julia Bartet NE-SO 100047547 6 rue Julia Bartet 4.0 2020-09-01 01:00:00 2018-11-28 Y2H18086323 48.82636 2.30303 1.609438
343292 100047547-103047547 6 rue Julia Bartet SO-NE 100047547 6 rue Julia Bartet 2.0 2020-09-01 01:00:00 2018-11-28 Y2H18086323 48.82636 2.30303 1.098612
805911 100057380-103057380 Totem Cours la Reine O-E 100057380 Totem Cours la Reine 0.0 2020-09-01 01:00:00 2020-02-11 YTH19111509 48.86462 2.31444 0.000000
353162 100047548-103047548 Face au 25 quai de l'Oise NE-SO 100047548 Face au 25 quai de l'Oise 2.0 2020-09-01 01:00:00 2018-11-28 Y2H18086324 48.89141 2.38482 1.098612

Now, let us perform some exploratory data analysis on this dataframe:

In [3]:
from skrub import TableReport

TableReport(data)
Out[3]:

[interactive skrub TableReport of the dataframe]

Note that skrub's TableReport is interactive and that there are several tabs. For example, in the Stats tab, you can focus on the number of unique entries for each feature.
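
If the interactive report is not available, similar per-column statistics can be obtained directly with pandas, for instance:

# Number of unique entries per column, as in the Stats tab of the report
data.nunique()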

We have 30 counting sites, and some locations have multiple counters installed. Let's look at the most frequented stations,

In [4]:
data.groupby(["site_name", "counter_name"], observed=True)[
    "bike_count"
].sum().sort_values(ascending=False).head(10).to_frame()
Out[4]:
bike_count
site_name counter_name
Totem 73 boulevard de Sébastopol Totem 73 boulevard de Sébastopol S-N 1809231.0
Totem 64 Rue de Rivoli Totem 64 Rue de Rivoli O-E 1406900.0
Totem 73 boulevard de Sébastopol Totem 73 boulevard de Sébastopol N-S 1357868.0
67 boulevard Voltaire SE-NO 67 boulevard Voltaire SE-NO 1036575.0
Totem 64 Rue de Rivoli Totem 64 Rue de Rivoli E-O 914089.0
27 quai de la Tournelle 27 quai de la Tournelle SE-NO 888717.0
Quai d'Orsay Quai d'Orsay E-O 849724.0
Totem Cours la Reine Totem Cours la Reine O-E 806149.0
Face au 48 quai de la marne Face au 48 quai de la marne SO-NE 806071.0
Face au 48 quai de la marne NE-SO 759194.0

Visualizing the data¶

Let's visualize the data, starting with the spatial distribution of counters on a map,

In [5]:
import folium

m = folium.Map(location=data[["latitude", "longitude"]].mean(axis=0), zoom_start=13)

for _, row in (
    data[["counter_name", "latitude", "longitude"]]
    .drop_duplicates("counter_name")
    .iterrows()
):
    folium.Marker(
        row[["latitude", "longitude"]].values.tolist(), popup=row["counter_name"]
    ).add_to(m)

m
Out[5]:
[interactive folium map of the counter locations]

Note that in this RAMP problem we consider only the 30 most frequented counting sites, to limit data size.
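
For reference, such a ranking of sites by total traffic could be computed as follows (a sketch; not necessarily the exact selection rule used to build the dataset):

# Total bike counts per site; the dataset keeps the busiest sites
data.groupby("site_name", observed=True)["bike_count"].sum().nlargest(30)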

Next, we will look into the temporal distribution of the most frequented bike counter. If we plot it directly we will not see much: a full year of hourly data points is too dense,

In [6]:
import matplotlib.pyplot as plt

mask = data["counter_name"] == "Totem 73 boulevard de Sébastopol S-N"

data[mask].plot(x="date", y="bike_count")
plt.show()

Instead, we aggregate the data, for instance by week, to get a clearer overall picture,

In [7]:
mask = data["counter_name"] == "Totem 73 boulevard de Sébastopol S-N"

data[mask].groupby(pd.Grouper(freq="1W", key="date"))[["bike_count"]].sum().plot()
plt.show()
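
Equivalently, this weekly aggregation can be written with pandas' resample:

# Same weekly aggregation, written with resample on the "date" column
data[mask].resample("1W", on="date")["bike_count"].sum().plot()
plt.show()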

At the same time, we can zoom in on a particular week for a more short-term visualization,

In [8]:
fig, ax = plt.subplots(figsize=(10, 4))

mask = (
    (data["counter_name"] == "Totem 73 boulevard de Sébastopol S-N")
    & (data["date"] > pd.to_datetime("2021/03/01"))
    & (data["date"] < pd.to_datetime("2021/03/08"))
)

data[mask].plot(x="date", y="bike_count", ax=ax)
plt.show()

The hourly pattern shows a clear difference between workdays and weekends (6 and 7 March 2021 fell on a weekend).

If we look at the distribution of the target variable, it is skewed and not normal,

In [9]:
import seaborn as sns

ax = sns.histplot(data, x="bike_count", kde=True, bins=50)

Least squares loss would not be appropriate to model it since it is designed for normally distributed errors. One way to proceed is to transform the variable with a logarithmic transformation,

import numpy as np

data['log_bike_count'] = np.log(1 + data['bike_count'])
In [10]:
ax = sns.histplot(data, x="log_bike_count", kde=True, bins=50)

which has a more pronounced central mode, but is still asymmetric. In the following, we use log_bike_count as the target variable, since otherwise bike_count ranges over 3 orders of magnitude and the least squares loss would be dominated by the few large values.
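
Note that numpy also provides np.log1p and its exact inverse np.expm1, which are handy for mapping predictions back to the original count scale; a quick sketch:

# log1p(x) == log(1 + x); expm1 is its exact inverse
log_counts = np.log1p(data["bike_count"])
counts = np.expm1(log_counts)  # recovers bike_count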

Building a few baselines using scikit-learn and skrub¶

Getting the train and test data¶

We use a few helper functions defined in problem.py of the starting kit to load the public train and test data:

In [11]:
import problem

X_train, y_train = problem.get_train_data()
X_test, y_test = problem.get_test_data()
In [12]:
X_train.head(2)
Out[12]:
counter_id counter_name site_id site_name date counter_installation_date counter_technical_id latitude longitude
400125 100049407-353255860 152 boulevard du Montparnasse E-O 100049407 152 boulevard du Montparnasse 2020-09-01 01:00:00 2018-12-07 Y2H19070373 48.840801 2.333233
408305 100049407-353255859 152 boulevard du Montparnasse O-E 100049407 152 boulevard du Montparnasse 2020-09-01 01:00:00 2018-12-07 Y2H19070373 48.840801 2.333233

and

In [13]:
y_train
Out[13]:
array([1.60943791, 1.38629436, 0.        , ..., 2.48490665, 1.60943791,
       1.38629436], shape=(455163,))

Here, y_train contains the log_bike_count variable.

The test set is in the future as compared to the train set,

In [14]:
print(
    f'Train: n_samples={X_train.shape[0]},  {X_train["date"].min()} to {X_train["date"].max()}'
)
print(
    f'Test: n_samples={X_test.shape[0]},  {X_test["date"].min()} to {X_test["date"].max()}'
)
Train: n_samples=455163,  2020-09-01 01:00:00 to 2021-08-09 23:00:00
Test: n_samples=41608,  2021-08-10 01:00:00 to 2021-09-09 23:00:00
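
We can check this programmatically:

# The latest train timestamp must precede the earliest test timestamp
assert X_train["date"].max() < X_test["date"].min()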

Dummy model¶

Let us first try a dummy model predicting the mean:

In [15]:
from sklearn.dummy import DummyRegressor

dummy_regr = DummyRegressor(strategy="mean")
dummy_regr
Out[15]:
DummyRegressor()

Let us use the estimator report from skore to evaluate our scikit-learn model:

In [16]:
from skore import EstimatorReport

dummy_report = EstimatorReport(
    dummy_regr,
    X_train=X_train,
    X_test=X_test,
    y_train=y_train,
    y_test=y_test,
)

We display the helper to see what is available to us:

In [17]:
dummy_report.help()
╭───────────────────── Tools to diagnose estimator DummyRegressor ─────────────────────╮
│ EstimatorReport                                                                      │
│ ├── .metrics                                                                         │
│ │   ├── .prediction_error(...)         - Plot the prediction error of a regression   │
│ │   │   model.                                                                       │
│ │   ├── .r2(...)               (↗︎)     - Compute the R² score.                       │
│ │   ├── .rmse(...)             (↘︎)     - Compute the root mean squared error.        │
│ │   ├── .timings(...)                  - Get all measured processing times related   │
│ │   │   to the estimator.                                                            │
│ │   ├── .custom_metric(...)            - Compute a custom metric.                    │
│ │   └── .report_metrics(...)           - Report a set of metrics for our estimator.  │
│ ├── .feature_importance                                                              │
│ │   └── .permutation(...)              - Report the permutation feature importance.  │
│ ├── .cache_predictions(...)            - Cache estimator's predictions.              │
│ ├── .clear_cache(...)                  - Clear the cache.                            │
│ ├── .get_predictions(...)              - Get estimator's predictions.                │
│ └── Attributes                                                                       │
│     ├── .X_test                        - Testing data                                │
│     ├── .X_train                       - Training data                               │
│     ├── .y_test                        - Testing target                              │
│     ├── .y_train                       - Training target                             │
│     ├── .estimator_                    - The cloned or copied estimator              │
│     ├── .estimator_name_               - The name of the estimator                   │
│     └── .fit_time_                     - The time taken to fit the estimator, in     │
│         seconds                                                                      │
│                                                                                      │
│                                                                                      │
│ Legend:                                                                              │
│ (↗︎) higher is better (↘︎) lower is better                                             │
╰──────────────────────────────────────────────────────────────────────────────────────╯

We evaluate our model on both the $R^2$ and the RMSE, using the metrics accessor:

In [18]:
dummy_report.metrics.report_metrics(data_source="train")
Out[18]:
DummyRegressor
Metric
R² 0.000000
RMSE 1.675057
Fit time 0.000398
Predict time 0.000444
In [19]:
dummy_report.metrics.report_metrics(data_source="test")
Out[19]:
DummyRegressor
Metric
R² -0.068402
RMSE 1.487492
Fit time 0.000398
Predict time 0.000214

Linear model from skrub¶

Now, let us try a baseline for a linear model using skrub:

In [20]:
from skrub import tabular_learner
from sklearn.linear_model import Ridge

ridge_tab_learner = tabular_learner(Ridge())

ridge_tab_report = EstimatorReport(
    ridge_tab_learner,
    X_train=X_train,
    X_test=X_test,
    y_train=y_train,
    y_test=y_test,
)
ridge_tab_report.estimator_
Out[20]:
Pipeline(steps=[('tablevectorizer',
                 TableVectorizer(datetime=DatetimeEncoder(periodic_encoding='spline'))),
                ('simpleimputer', SimpleImputer(add_indicator=True)),
                ('standardscaler', StandardScaler()), ('ridge', Ridge())])

The TableVectorizer dispatches the columns as follows:

  • ['site_id', 'latitude', 'longitude'] → PassThrough()
  • ['date', 'counter_installation_date'] → DatetimeEncoder(periodic_encoding='spline')
  • ['site_name', 'counter_technical_id'] → OneHotEncoder(drop='if_binary', dtype='float32', handle_unknown='ignore', sparse_output=False)
  • ['counter_id', 'counter_name'] → GapEncoder(n_components=30)

followed by SimpleImputer(add_indicator=True), StandardScaler() and Ridge().

We can compare it to our dummy model using the ComparisonReport of skore:

In [21]:
from skore import ComparisonReport

reports_to_compare = {
    "Dummy (mean)": dummy_report,
    "Ridge (skrub baseline)": ridge_tab_report
}
comparator = ComparisonReport(reports=reports_to_compare)
comparator.metrics.report_metrics()
Out[21]:
Estimator Dummy (mean) Ridge (skrub baseline)
Metric
R² -0.068402 0.567088
RMSE 1.487492 0.946864
Fit time 0.000398 45.979211
Predict time 0.000214 0.272696

Tree-based model¶

Let us try a tree-based model using skrub:

In [22]:
hgbt_skrub = tabular_learner("regressor")

hgbt_report = EstimatorReport(
    hgbt_skrub,
    X_train=X_train,
    X_test=X_test,
    y_train=y_train,
    y_test=y_test,
)
hgbt_report.estimator_
Out[22]:
Pipeline(steps=[('tablevectorizer',
                 TableVectorizer(high_cardinality=MinHashEncoder(),
                                 low_cardinality=ToCategorical())),
                ('histgradientboostingregressor',
                 HistGradientBoostingRegressor())])

The TableVectorizer dispatches the columns as follows:

  • ['site_id', 'latitude', 'longitude'] → PassThrough()
  • ['date', 'counter_installation_date'] → DatetimeEncoder()
  • ['site_name', 'counter_technical_id'] → ToCategorical()
  • ['counter_id', 'counter_name'] → MinHashEncoder()

followed by HistGradientBoostingRegressor().

In [23]:
reports_to_compare["HGBT (skrub baseline)"] = hgbt_report
comparator = ComparisonReport(reports=reports_to_compare)
comparator.metrics.report_metrics()
Out[23]:
Estimator Dummy (mean) Ridge (skrub baseline) HGBT (skrub baseline)
Metric
R² -0.068402 0.567088 0.762979
RMSE 1.487492 0.946864 0.700618
Fit time 0.000398 45.979211 5.277651
Predict time 0.000214 0.272696 0.174945

A custom complex pipeline for a linear model¶

Now, let us try to make a Ridge model perform better by applying some more advanced feature engineering.

Feature extraction¶

To account for the temporal aspects of the data, we cannot feed the date field directly into the model. Instead, we extract features at different time scales from the date field,

In [24]:
def _encode_dates(X):
    X = X.copy()  # modify a copy of X
    # Extract the date components from the "date" column
    X.loc[:, "year"] = X["date"].dt.year
    X.loc[:, "month"] = X["date"].dt.month
    X.loc[:, "day"] = X["date"].dt.day
    X.loc[:, "weekday"] = X["date"].dt.weekday
    X.loc[:, "hour"] = X["date"].dt.hour

    # Finally we can drop the original columns from the dataframe
    return X.drop(columns=["date"])
In [25]:
data["date"].head()
Out[25]:
705677   2020-09-01 01:00:00
333389   2020-09-01 01:00:00
343292   2020-09-01 01:00:00
805911   2020-09-01 01:00:00
353162   2020-09-01 01:00:00
Name: date, dtype: datetime64[us]
In [26]:
_encode_dates(data[["date"]].head())
Out[26]:
year month day weekday hour
705677 2020 9 1 1 1
333389 2020 9 1 1 1
343292 2020 9 1 1 1
805911 2020 9 1 1 1
353162 2020 9 1 1 1

To use this function with scikit-learn estimators we wrap it with FunctionTransformer,

In [27]:
from sklearn.preprocessing import FunctionTransformer

date_encoder = FunctionTransformer(_encode_dates, validate=False)
date_encoder.fit_transform(data[["date"]]).head()
Out[27]:
year month day weekday hour
705677 2020 9 1 1 1
333389 2020 9 1 1 1
343292 2020 9 1 1 1
805911 2020 9 1 1 1
353162 2020 9 1 1 1

Since it is unlikely that, for instance, hour is linearly related to the target variable, we additionally need to encode such features as categorical for linear models. This is classically done with OneHotEncoder, though other encoding strategies exist (see the sketch after the next cell).

In [28]:
from sklearn.preprocessing import OneHotEncoder

enc = OneHotEncoder(sparse_output=False)

enc.fit_transform(_encode_dates(data[["date"]])[["hour"]].head())
Out[28]:
array([[1.],
       [1.],
       [1.],
       [1.],
       [1.]])
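
As an alternative to one-hot encoding, cyclical features such as the hour can be encoded with sine/cosine transforms, so that hour 23 stays close to hour 0. A minimal sketch (the helper name is ours, not part of the starting kit):

import numpy as np
from sklearn.preprocessing import FunctionTransformer

def _encode_hour_cyclic(X):
    # Map the hour onto the unit circle so 23h and 0h end up close together
    X = X.copy()
    X["hour_sin"] = np.sin(2 * np.pi * X["hour"] / 24)
    X["hour_cos"] = np.cos(2 * np.pi * X["hour"] / 24)
    return X.drop(columns=["hour"])

cyclic_encoder = FunctionTransformer(_encode_hour_cyclic, validate=False)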

Ridge model¶

Let's now construct our linear model with Ridge.

In [29]:
_encode_dates(X_train[["date"]]).columns.tolist()
Out[29]:
['year', 'month', 'day', 'weekday', 'hour']
In [30]:
from sklearn.compose import ColumnTransformer
from sklearn.pipeline import make_pipeline

date_encoder = FunctionTransformer(_encode_dates)
date_cols = _encode_dates(X_train[["date"]]).columns.tolist()

categorical_encoder = OneHotEncoder(handle_unknown="ignore")
categorical_cols = ["counter_name", "site_name"]

preprocessor = ColumnTransformer(
    [
        ("date", OneHotEncoder(handle_unknown="ignore"), date_cols),
        ("cat", categorical_encoder, categorical_cols),
    ]
)

regressor = Ridge()

pipe = make_pipeline(date_encoder, preprocessor, regressor)
pipe
Out[30]:
Pipeline(steps=[('functiontransformer',
                 FunctionTransformer(func=<function _encode_dates at 0x11bf6c400>)),
                ('columntransformer',
                 ColumnTransformer(transformers=[('date',
                                                  OneHotEncoder(handle_unknown='ignore'),
                                                  ['year', 'month', 'day',
                                                   'weekday', 'hour']),
                                                 ('cat',
                                                  OneHotEncoder(handle_unknown='ignore'),
                                                  ['counter_name',
                                                   'site_name'])])),
                ('ridge', Ridge())])

The pipeline first applies FunctionTransformer(func=_encode_dates), then a ColumnTransformer that dispatches the columns as follows:

  • ['year', 'month', 'day', 'weekday', 'hour'] → OneHotEncoder(handle_unknown='ignore')
  • ['counter_name', 'site_name'] → OneHotEncoder(handle_unknown='ignore')

followed by Ridge().

Evaluation¶

We get its estimator report:

In [31]:
pipe_report = EstimatorReport(
    pipe,
    X_train=X_train,
    X_test=X_test,
    y_train=y_train,
    y_test=y_test,
)
In [32]:
df_pipe = pd.concat([
    pipe_report.metrics.report_metrics(data_source="train"),
    pipe_report.metrics.report_metrics(data_source="test"),
], axis=1)
df_pipe.columns = ["Manual Ridge (train)", "Manual Ridge (test)"]
df_pipe
Out[32]:
Manual Ridge (train) Manual Ridge (test)
Metric
R² 0.771475 0.745980
RMSE 0.800750 0.725306
Fit time 0.246295 0.246295
Predict time 0.159231 0.018873

The model doesn't have enough capacity to fit the train set closely, since we have lots of data and relatively few parameters. However, it happens to perform somewhat better on the test set.

We can compare these results with our baselines:

In [33]:
reports_to_compare["Ridge (manual)"] = pipe_report
comparator = ComparisonReport(reports=reports_to_compare)
comparator.metrics.report_metrics()
Out[33]:
Estimator Dummy (mean) Ridge (skrub baseline) HGBT (skrub baseline) Ridge (manual)
Metric
R² -0.068402 0.567088 0.762979 0.745980
RMSE 1.487492 0.946864 0.700618 0.725306
Fit time 0.000398 45.979211 5.277651 0.246295
Predict time 0.000214 0.272696 0.174945 0.018873

which illustrates that we are performing better than the Ridge baseline from skrub.

Inspection¶

Let's visualize the predictions for one of the stations,

In [34]:
import numpy as np

pipe = pipe_report.estimator_

mask = (
    (X_test["counter_name"] == "Totem 73 boulevard de Sébastopol S-N")
    & (X_test["date"] > pd.to_datetime("2021/09/01"))
    & (X_test["date"] < pd.to_datetime("2021/09/08"))
)

df_viz = X_test.loc[mask].copy()
df_viz["bike_count"] = np.exp(y_test[mask.values]) - 1
df_viz["bike_count (predicted)"] = np.exp(pipe.predict(X_test[mask])) - 1
In [35]:
fig, ax = plt.subplots(figsize=(12, 4))

df_viz.plot(x="date", y="bike_count", ax=ax)
df_viz.plot(x="date", y="bike_count (predicted)", ax=ax, ls="--")
ax.set_title("Predictions with Ridge")
ax.set_ylabel("bike_count")
Out[35]:
Text(0, 0.5, 'bike_count')

So we start to see the daily trend, and some of the weekday differences are accounted for. However, we still miss the finer details, and the evening spikes are underestimated.

A useful way to visualize model errors is the prediction error plot,

In [36]:
pipe_report.metrics.prediction_error().plot(kind="actual_vs_predicted")

You can also get the permutation feature importance:

In [37]:
pipe_report.feature_importance.permutation(seed=0).T.boxplot(vert=False)
plt.tight_layout()

A note on cross-validation¶

It is recommended to use cross-validation, with GridSearchCV for hyper-parameter tuning or cross_val_score for more reliable model evaluation. In this case, because we want the test data to always be in the future as compared to the train data, we can use TimeSeriesSplit,

The disadvantage is that we either let the training set size differ across folds, which is not ideal for hyper-parameter tuning, or use a constant but small training set size, which is also not ideal given the periodicity of the data. This explains why we will generally get worse cross-validation scores than test scores,

In [38]:
from sklearn.model_selection import TimeSeriesSplit
from skore import CrossValidationReport

cv = TimeSeriesSplit(n_splits=6)

cv_report = CrossValidationReport(
    pipe, X_train, y_train, cv_splitter=cv
)
In [39]:
cv_report.help()
╭───────────────────────── Tools to diagnose estimator Ridge ──────────────────────────╮
│ CrossValidationReport                                                                │
│ ├── .metrics                                                                         │
│ │   ├── .prediction_error(...)         - Plot the prediction error of a regression   │
│ │   │   model.                                                                       │
│ │   ├── .r2(...)               (↗︎)     - Compute the R² score.                       │
│ │   ├── .rmse(...)             (↘︎)     - Compute the root mean squared error.        │
│ │   ├── .timings(...)                  - Get all measured processing times related   │
│ │   │   to the estimator.                                                            │
│ │   ├── .custom_metric(...)            - Compute a custom metric.                    │
│ │   └── .report_metrics(...)           - Report a set of metrics for our estimator.  │
│ ├── .cache_predictions(...)            - Cache the predictions for sub-estimators    │
│ │   reports.                                                                         │
│ ├── .clear_cache(...)                  - Clear the cache.                            │
│ ├── .get_predictions(...)              - Get estimator's predictions.                │
│ └── Attributes                                                                       │
│     ├── .X                             - The data to fit                             │
│     ├── .y                             - The target variable to try to predict in    │
│     │   the case of supervised learning                                              │
│     ├── .estimator_                    - The cloned or copied estimator              │
│     ├── .estimator_name_               - The name of the estimator                   │
│     ├── .estimator_reports_            - The estimator reports for each split        │
│     └── .n_jobs                        - Number of jobs to run in parallel           │
│                                                                                      │
│                                                                                      │
│ Legend:                                                                              │
│ (↗︎) higher is better (↘︎) lower is better                                             │
╰──────────────────────────────────────────────────────────────────────────────────────╯
In [40]:
cv_report.metrics.report_metrics(data_source="train")
Out[40]:
Ridge
mean std
Metric
R² 0.819263 0.020461
RMSE 0.710780 0.053518
Fit time 0.139352 0.065364
Predict time 0.084718 0.049095
In [41]:
cv_report.metrics.report_metrics(data_source="test")
Out[41]:
Ridge
mean std
Metric
R² 0.676437 0.077509
RMSE 0.931700 0.081377
Fit time 0.139352 0.065364
Predict time 0.026663 0.003670
In [42]:
cv_report.metrics.report_metrics(data_source="test", aggregate=None)
Out[42]:
Ridge
Split #0 Split #1 Split #2 Split #3 Split #4 Split #5
Metric
R² 0.660951 0.721467 0.757911 0.742509 0.611206 0.564578
RMSE 0.963112 0.869636 0.853591 0.870083 1.060825 0.972954
Fit time 0.046973 0.101718 0.113555 0.165793 0.175068 0.233009
Predict time 0.033113 0.022903 0.024964 0.026339 0.024282 0.028379
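
As mentioned above, the same splitter can also drive hyper-parameter tuning with GridSearchCV; a minimal sketch tuning the regularization strength of our Ridge pipeline (the grid values are illustrative):

from sklearn.model_selection import GridSearchCV

# Tune the alpha of the "ridge" step of our pipeline with time-aware CV
param_grid = {"ridge__alpha": [0.1, 1.0, 10.0]}
search = GridSearchCV(pipe, param_grid, cv=cv, scoring="neg_root_mean_squared_error")
search.fit(X_train, y_train)
print(search.best_params_)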