{ "cells": [ { "cell_type": "code", "execution_count": 1, "id": "98de82f6-2dc9-4d27-a5d8-d07ae04b496c", "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "/Users/peportier/miniforge3/envs/RAG_ENV/lib/python3.9/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n", " from .autonotebook import tqdm as notebook_tqdm\n", "/Users/peportier/miniforge3/envs/RAG_ENV/lib/python3.9/site-packages/transformers/utils/generic.py:441: UserWarning: torch.utils._pytree._register_pytree_node is deprecated. Please use torch.utils._pytree.register_pytree_node instead.\n", " _torch_pytree._register_pytree_node(\n" ] } ], "source": [ "from embedding import EmbeddingModel" ] }, { "cell_type": "code", "execution_count": 2, "id": "37408a48-ce90-4176-bc9f-b71ebc22a178", "metadata": { "collapsed": true, "jupyter": { "outputs_hidden": true } }, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "2024-01-07 08:16:20,663 - INFO - Load pretrained SentenceTransformer: intfloat/multilingual-e5-large\n", "/Users/peportier/miniforge3/envs/RAG_ENV/lib/python3.9/site-packages/transformers/utils/generic.py:309: UserWarning: torch.utils._pytree._register_pytree_node is deprecated. Please use torch.utils._pytree.register_pytree_node instead.\n", " _torch_pytree._register_pytree_node(\n", "2024-01-07 08:16:24,944 - INFO - Use pytorch device: cpu\n", "2024-01-07 08:16:24,951 - INFO - Anonymized telemetry enabled. See https://docs.trychroma.com/telemetry for more information.\n", "2024-01-07 08:16:25,075 - INFO - 255a0eb096.txt : Start\n", "Token indices sequence length is longer than the specified maximum sequence length for this model (529 > 512). Running this sequence through the model will result in indexing errors\n", "Batches: 0%| | 0/1 [00:00