From a59b6b1490c0a272610444bc03c0b08b907655a8 Mon Sep 17 00:00:00 2001 From: Manu NALEPA Date: Mon, 24 Aug 2020 20:58:34 +0200 Subject: [PATCH] examples.ipynb: Add DataFrame.groupby.expanding.apply --- docs/examples.ipynb | 48 +++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 48 insertions(+) diff --git a/docs/examples.ipynb b/docs/examples.ipynb index f6b446a..cb1849c 100644 --- a/docs/examples.ipynb +++ b/docs/examples.ipynb @@ -285,6 +285,54 @@ "res.equals(res_parallel)" ] }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# DataFrame.groupby.expanding.apply" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "df_size = int(1e6)\n", + "df = pd.DataFrame(dict(a=np.random.randint(1, 300, df_size),\n", + " b=np.random.rand(df_size)))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def func(x):\n", + " return x.iloc[0] + x.iloc[1] ** 2 + x.iloc[2] ** 3 + x.iloc[3] ** 4" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "%%time\n", + "res = df.groupby('a').b.expanding(4).apply(func, raw=False)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "%%time\n", + "res_parallel = df.groupby('a').b.expanding(4).parallel_apply(func, raw=False)" + ] + }, { "cell_type": "markdown", "metadata": {},