diff --git a/training/fine-tune-embedding-model-for-rag.ipynb b/training/fine-tune-embedding-model-for-rag.ipynb index 9d9fbaf..7155f27 100644 --- a/training/fine-tune-embedding-model-for-rag.ipynb +++ b/training/fine-tune-embedding-model-for-rag.ipynb @@ -169,7 +169,7 @@ " model_id, device=\"cuda\" if torch.cuda.is_available() else \"cpu\"\n", ")\n", "\n", - "# load test dataset\n", + "# Load the datasets (both are treated as 'train' splits when loaded from JSON)\n", "test_dataset = load_dataset(\"json\", data_files=\"test_dataset.json\", split=\"train\")\n", "train_dataset = load_dataset(\"json\", data_files=\"train_dataset.json\", split=\"train\")\n", "corpus_dataset = concatenate_datasets([train_dataset, test_dataset])\n",