diff --git a/chapter10/Chapter 10 - Creating Text Embedding Models.ipynb b/chapter10/Chapter 10 - Creating Text Embedding Models.ipynb index b4abfb6..53f46e6 100644 --- a/chapter10/Chapter 10 - Creating Text Embedding Models.ipynb +++ b/chapter10/Chapter 10 - Creating Text Embedding Models.ipynb @@ -269,21 +269,7 @@ "id": "8uAAhNs0ocoV" }, "outputs": [], - "source": [ - "from sentence_transformers.training_args import SentenceTransformerTrainingArguments\n", - "\n", - "# Define the training arguments\n", - "args = SentenceTransformerTrainingArguments(\n", - " output_dir=\"base_embedding_model\",\n", - " num_train_epochs=1,\n", - " per_device_train_batch_size=32,\n", - " per_device_eval_batch_size=32,\n", - " warmup_steps=100,\n", - " fp16=True,\n", - " eval_steps=100,\n", - " logging_steps=100,\n", - ")" - ] + "source": "from sentence_transformers.training_args import SentenceTransformerTrainingArguments\n\n# Define the training arguments\nargs = SentenceTransformerTrainingArguments(\n output_dir=\"base_embedding_model\",\n num_train_epochs=1,\n per_device_train_batch_size=32,\n per_device_eval_batch_size=32,\n warmup_steps=100,\n fp16=True,\n eval_steps=100,\n logging_steps=100,\n report_to=\"none\",\n)" }, { "cell_type": "code", @@ -837,189 +823,8 @@ "id": "Ikky866vdseY", "outputId": "803f2abe-002a-481c-9403-8ce39dfa5b47" }, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "WARNING:sentence_transformers.SentenceTransformer:No sentence-transformers model found with name bert-base-uncased. Creating a new one with mean pooling.\n", - "/usr/local/lib/python3.10/dist-packages/huggingface_hub/file_download.py:1132: FutureWarning: `resume_download` is deprecated and will be removed in version 1.0.0. Downloads always resume when possible. If you want to force a new download, use `force_download=True`.\n", - " warnings.warn(\n" - ] - }, - { - "data": { - "text/html": [ - "\n", - "
\n", - " \n", - " \n", - " [1563/1563 06:04, Epoch 1/1]\n", - "
\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
StepTraining Loss
1000.231900
2000.168900
3000.170900
4000.157800
5000.152900
6000.156100
7000.149300
8000.154500
9000.150900
10000.145600
11000.147800
12000.145600
13000.145100
14000.142000
15000.141600

" - ], - "text/plain": [ - "" - ] - }, - "metadata": {}, - "output_type": "display_data" - }, - { - "data": { - "application/vnd.jupyter.widget-view+json": { - "model_id": "c16cc9c062f547ee938537a719d4f668", - "version_major": 2, - "version_minor": 0 - }, - "text/plain": [ - "Computing widget examples: 0%| | 0/5 [00:00\n", - " \n", - " \n", - " [528/528 03:00, Epoch 1/1]\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
StepTraining Loss
1000.345200
2000.105500
3000.079000
4000.062200
5000.069000

" - ], - "text/plain": [ - "" - ] - }, - "metadata": {}, - "output_type": "display_data" - }, - { - "data": { - "application/vnd.jupyter.widget-view+json": { - "model_id": "5913c2edc4de4e48990626d19af0ff2b", - "version_major": 2, - "version_minor": 0 - }, - "text/plain": [ - "Computing widget examples: 0%| | 0/5 [00:00\n", - " \n", - " \n", - " [1563/1563 01:57, Epoch 1/1]\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
StepTraining Loss
1000.155500
2000.110000
3000.118600
4000.115300
5000.110700
6000.101000
7000.113100
8000.099800
9000.109600
10000.105800
11000.094900
12000.106400
13000.105300
14000.105200
15000.106600

" - ], - "text/plain": [ - "" - ] - }, - "metadata": {}, - "output_type": "display_data" - }, - { - "data": { - "application/vnd.jupyter.widget-view+json": { - "model_id": "511480884e6145cda98eac03e3eaa214", - "version_major": 2, - "version_minor": 0 - }, - "text/plain": [ - "Computing widget examples: 0%| | 0/5 [00:00