From 0d3e0760a174a06c742ae57f2d7019530c7d723a Mon Sep 17 00:00:00 2001 From: Sergio Jimenez Jimenez Date: Mon, 8 Dec 2025 11:34:23 +0100 Subject: [PATCH] Improve data description. --- src/paddle_ocr_fine_tune_unir_raytune.ipynb | 43 ++++----------------- 1 file changed, 8 insertions(+), 35 deletions(-) diff --git a/src/paddle_ocr_fine_tune_unir_raytune.ipynb b/src/paddle_ocr_fine_tune_unir_raytune.ipynb index c54f356..d2763ed 100644 --- a/src/paddle_ocr_fine_tune_unir_raytune.ipynb +++ b/src/paddle_ocr_fine_tune_unir_raytune.ipynb @@ -2322,7 +2322,7 @@ "max 0.699247 " ] }, - "execution_count": 20, + "execution_count": 32, "metadata": {}, "output_type": "execute_result" } @@ -2334,7 +2334,7 @@ }, { "cell_type": "code", - "execution_count": 28, + "execution_count": 33, "id": "50fa5b59", "metadata": {}, "outputs": [ @@ -2383,44 +2383,17 @@ }, { "cell_type": "code", - "execution_count": 29, + "execution_count": 34, "id": "9462b7a2", "metadata": {}, "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "textline_orientation=True:\n", - " CER WER\n", - "count 53.000000 53.000000\n", - "mean 0.037637 0.127337\n", - "std 0.098417 0.095844\n", - "min 0.011535 0.098902\n", - "25% 0.011875 0.100441\n", - "50% 0.012199 0.101228\n", - "75% 0.012583 0.103280\n", - "max 0.516069 0.594530\n", - "\n", - "textline_orientation=False:\n", - " CER WER\n", - "count 11.000000 11.000000\n", - "mean 0.124009 0.217126\n", - "std 0.139431 0.133092\n", - "min 0.039052 0.132047\n", - "25% 0.044246 0.132462\n", - "50% 0.064799 0.164937\n", - "75% 0.093873 0.198020\n", - "max 0.418109 0.503710\n" - ] - }, { "data": { "text/plain": [ "" ] }, - "execution_count": 29, + "execution_count": 34, "metadata": {}, "output_type": "execute_result" }, @@ -2437,11 +2410,11 @@ ], "source": [ "# Direct comparison for binary parameter\n", - "print(\"textline_orientation=True:\")\n", - "print(df[df[\"config/textline_orientation\"] == True][[\"CER\", \"WER\"]].describe())\n", +
"#print(\"textline_orientation=True:\")\n", + "#print(df[df[\"config/textline_orientation\"] == True][[\"CER\", \"WER\"]].describe())\n", "\n", - "print(\"\\ntextline_orientation=False:\")\n", - "print(df[df[\"config/textline_orientation\"] == False][[\"CER\", \"WER\"]].describe())\n", + "#print(\"\\ntextline_orientation=False:\")\n", + "#print(df[df[\"config/textline_orientation\"] == False][[\"CER\", \"WER\"]].describe())\n", "\n", "# Or a simple mean comparison\n", "df.groupby(\"config/textline_orientation\")[[\"CER\", \"WER\"]].mean()\n",