{ "cells": [ { "cell_type": "code", "execution_count": 6, "id": "c11e397b", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "📂 Searching for documents in: /Users/przemo/Coding/document data retrieval/content\n", "✅ Created 8134 multilingual instruction pairs.\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Map: 100%|██████████| 7320/7320 [00:01<00:00, 5442.12 examples/s]\n", "Map: 100%|██████████| 814/814 [00:00<00:00, 5879.32 examples/s]\n", "/var/folders/t6/7gm1y_yj5831dq3xh1b21y8w0000gp/T/ipykernel_31309/193414689.py:109: FutureWarning: `tokenizer` is deprecated and will be removed in version 5.0.0 for `Seq2SeqTrainer.__init__`. Use `processing_class` instead.\n", " trainer = Seq2SeqTrainer(\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "🚀 Training Multilingual Model...\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "/Users/przemo/Coding/.venv/lib/python3.13/site-packages/torch/utils/data/dataloader.py:692: UserWarning: 'pin_memory' argument is set as true but not supported on MPS now, device pinned memory won't be used.\n", " warnings.warn(warn_msg)\n" ] }, { "data": { "text/html": [ "\n", "
| Epoch | \n", "Training Loss | \n", "Validation Loss | \n", "
|---|---|---|
| 1 | \n", "0.838600 | \n", "0.698937 | \n", "
| 2 | \n", "0.628400 | \n", "0.617202 | \n", "
| 3 | \n", "0.598600 | \n", "0.577280 | \n", "
| 4 | \n", "0.575200 | \n", "0.545364 | \n", "
| 5 | \n", "0.488400 | \n", "0.526966 | \n", "
| 6 | \n", "0.489900 | \n", "0.512095 | \n", "
| 7 | \n", "0.447100 | \n", "0.500422 | \n", "
| 8 | \n", "0.450300 | \n", "0.499637 | \n", "
| 9 | \n", "0.396700 | \n", "0.494340 | \n", "
| 10 | \n", "0.402300 | \n", "0.497277 | \n", "
"
],
"text/plain": [
"