From ec53a9c4134291fe64fc44aaf7786cbe16dbcee7 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=C5=81ukasz=20Augustyniak?= Date: Tue, 14 Nov 2023 11:01:22 +0000 Subject: [PATCH] fix cell outputs --- nbs/03_training_example.ipynb | 158 ++++++++++++++++++++++++++++++---- 1 file changed, 140 insertions(+), 18 deletions(-) diff --git a/nbs/03_training_example.ipynb b/nbs/03_training_example.ipynb index 6e38aca..feea3c5 100644 --- a/nbs/03_training_example.ipynb +++ b/nbs/03_training_example.ipynb @@ -48,7 +48,7 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": null, "metadata": {}, "outputs": [ { @@ -99,6 +99,27 @@ }, "metadata": {}, "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Dataset mms downloaded and prepared to /root/.cache/huggingface/datasets/Brand24___mms/default/0.2.0/70532fdd01f149ff84a280b7d9cfb661643abf4837b4f0f3aa1128064e870d65. Subsequent calls will reuse this data.\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "5663e74add1d415c853bcb257a15963a", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + " 0%| | 0/1 [00:001\u001b[0m \u001b[39m#| eval: false\u001b[39;00m\n\u001b[0;32m----> 2\u001b[0m mms_dataset\u001b[39m.\u001b[39mcolumn_names\n", - "\u001b[0;31mNameError\u001b[0m: name 'mms_dataset' is not defined" - ] + "data": { + "text/plain": [ + "{'train': ['_id',\n", + " 'text',\n", + " 'label',\n", + " 'original_dataset',\n", + " 'domain',\n", + " 'language',\n", + " 'Family',\n", + " 'Genus',\n", + " 'Definite articles',\n", + " 'Indefinite articles',\n", + " 'Number of cases',\n", + " 'Order of subject, object, verb',\n", + " 'Negative morphemes',\n", + " 'Polar questions',\n", + " 'Position of negative word wrt SOV',\n", + " 'Prefixing vs suffixing',\n", + " 'Coding of nominal plurality',\n", + " 'Grammatical genders',\n", + " 'cleanlab_self_confidence']}" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" } ], "source": [ @@ -146,7 +184,22 @@ "cell_type": "code", "execution_count": null, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "31c9a75e3c5e4e349120702866a1ca1f", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "Filter: 0%| | 0/6165262 [00:00 0.6)" @@ -173,7 +241,18 @@ "cell_type": "code", "execution_count": null, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "73227" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "#| eval: false\n", "len(pl_sm_high_confidence)" @@ -203,7 +282,22 @@ "cell_type": "code", "execution_count": null, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "28e61f6f723044e2bc8824d7f808f63e", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "Map: 0%| | 0/73227 [00:00