From c25ea0ecca7b793438aad026ffac82fbe10e60ec Mon Sep 17 00:00:00 2001
From: rcarrata <rcarratalasanchez@gmail.com>
Date: Wed, 6 Nov 2024 19:33:47 +0100
Subject: [PATCH] added rag

---
 lab-materials/04-rag/5.1-ingest-rag.ipynb | 1578 +++++++++++++++++++++
 lab-materials/04-rag/5.2-query-rag.ipynb  |  280 ++++
 lab-materials/04-rag/5.3-simple-rag.ipynb |  371 +++++
 3 files changed, 2229 insertions(+)
 create mode 100644 lab-materials/04-rag/5.1-ingest-rag.ipynb
 create mode 100644 lab-materials/04-rag/5.2-query-rag.ipynb
 create mode 100644 lab-materials/04-rag/5.3-simple-rag.ipynb

diff --git a/lab-materials/04-rag/5.1-ingest-rag.ipynb b/lab-materials/04-rag/5.1-ingest-rag.ipynb
new file mode 100644
index 0000000..5936710
--- /dev/null
+++ b/lab-materials/04-rag/5.1-ingest-rag.ipynb
@@ -0,0 +1,1578 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "3420575b-4d00-458b-aa0e-7030008ccd53",
+   "metadata": {},
+   "source": [
+    "## Creating an index and populating it with documents using Milvus and Nomic AI Embeddings\n",
+    "\n",
+    "Ingest PDF documents, then web page content, into a Milvus vector store."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "8308b229-b520-4e82-a783-eb921bb955e7",
+   "metadata": {},
+   "source": [
+    "### Needed packages and imports"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "91e41b41-f60a-4b0f-91a1-cd273b60f21b",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [],
+   "source": [
+    "#!pip install einops==0.7.0 langchain==0.1.9 pypdf==4.0.2 pymilvus==2.3.6 sentence-transformers==2.4.0\n",
+    "#!pip install -q einops==0.7.0 langchain==0.1.9 pymilvus==2.3.6"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "600cd763-6ecc-4c77-89c0-47108c31c44e",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [],
+   "source": [
+    "import os\n",
+    "import requests\n",
+    "from langchain_community.document_loaders import PyPDFDirectoryLoader, WebBaseLoader\n",
+    "from langchain.text_splitter import RecursiveCharacterTextSplitter\n",
+    "from langchain_community.embeddings import HuggingFaceEmbeddings\n",
+    "from langchain_community.vectorstores import Milvus"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "1a82063d-6153-4812-8977-042241736b53",
+   "metadata": {},
+   "source": [
+    "### Base parameters: the Milvus connection info"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "id": "417ed4a4-9418-4f48-bebd-ef0ea11ae434",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [],
+   "source": [
+    "MILVUS_HOST = \"vectordb-milvus.milvus.svc.cluster.local\"\n",
+    "MILVUS_PORT = 19530\n",
+    "MILVUS_USERNAME = os.getenv('MILVUS_USERNAME')  # None if the variable is not set\n",
+    "MILVUS_PASSWORD = os.getenv('MILVUS_PASSWORD')  # read from the environment so no secret is stored in the notebook\n",
+    "MILVUS_COLLECTION = \"collection_nomicai_embeddings\"  # collection name passed to Milvus(...) below"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "f68f6785-480e-4519-be4f-8e1738dba4ca",
+   "metadata": {},
+   "source": [
+    "## Initial index creation and document ingestion"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "f8cff5f7-c509-48db-90b5-e15815b8b530",
+   "metadata": {},
+   "source": [
+    "#### Download and load PDFs"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "id": "bc4fe0db-f494-4cbd-9e97-8b6359a78cb7",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [],
+   "source": [
+    "product_version=\"2.13\"  # interpolated into every download URL and into the local folder name\n",
+    "documents = [\n",
+    "    \"release_notes\",\n",
+    "    \"introduction_to_red_hat_openshift_ai\",\n",
+    "    \"getting_started_with_red_hat_openshift_ai_self-managed\",\n",
+    "    \"openshift_ai_tutorial_-_fraud_detection_example\",\n",
+    "    \"developing_a_model\",\n",
+    "    \"integrating_data_from_amazon_s3\",\n",
+    "    \"working_on_data_science_projects\",\n",
+    "    \"serving_models\",\n",
+    "    \"monitoring_data_science_models\",\n",
+    "    \"managing_users\",\n",
+    "    \"managing_resources\",\n",
+    "    \"installing_and_uninstalling_openshift_ai_self-managed\",\n",
+    "    \"installing_and_uninstalling_openshift_ai_self-managed_in_a_disconnected_environment\",\n",
+    "    \"upgrading_openshift_ai_self-managed\",\n",
+    "    \"upgrading_openshift_ai_self-managed_in_a_disconnected_environment\",   \n",
+    "]\n",
+    "# pdfs: direct PDF links; pdfs_to_urls: PDF file stem -> html-single page of the same document\n",
+    "pdfs = [f\"https://access.redhat.com/documentation/en-us/red_hat_openshift_ai_self-managed/{product_version}/pdf/{doc}/red_hat_openshift_ai_self-managed-{product_version}-{doc}-en-us.pdf\" for doc in documents]\n",
+    "pdfs_to_urls = {f\"red_hat_openshift_ai_self-managed-{product_version}-{doc}-en-us\": f\"https://access.redhat.com/documentation/en-us/red_hat_openshift_ai_self-managed/{product_version}/html-single/{doc}/index\" for doc in documents}"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "id": "3eea5acc-49df-41c9-a01a-0cdbca96e8e2",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Skipped https://access.redhat.com/documentation/en-us/red_hat_openshift_ai_self-managed/2.13/pdf/developing_a_model/red_hat_openshift_ai_self-managed-2.13-developing_a_model-en-us.pdf\n",
+      "Skipped https://access.redhat.com/documentation/en-us/red_hat_openshift_ai_self-managed/2.13/pdf/integrating_data_from_amazon_s3/red_hat_openshift_ai_self-managed-2.13-integrating_data_from_amazon_s3-en-us.pdf\n",
+      "Skipped https://access.redhat.com/documentation/en-us/red_hat_openshift_ai_self-managed/2.13/pdf/monitoring_data_science_models/red_hat_openshift_ai_self-managed-2.13-monitoring_data_science_models-en-us.pdf\n"
+     ]
+    }
+   ],
+   "source": [
+    "docs_dir = f\"rhoai-doc-{product_version}\"\n",
+    "# Download each PDF into docs_dir; documents that cannot be fetched are reported and skipped\n",
+    "# exist_ok=True makes the cell safe to re-run and avoids a check-then-create race\n",
+    "os.makedirs(docs_dir, exist_ok=True)\n",
+    "\n",
+    "for pdf in pdfs:\n",
+    "    try:\n",
+    "        response = requests.get(pdf, timeout=60)  # a stalled server must not hang the notebook\n",
+    "    except requests.RequestException:  # network-level failures only; Ctrl-C and code bugs still surface\n",
+    "        print(f\"Skipped {pdf}\")\n",
+    "        continue\n",
+    "    if response.status_code!=200:\n",
+    "        print(f\"Skipped {pdf}\")\n",
+    "        continue\n",
+    "    with open(f\"{docs_dir}/{pdf.split('/')[-1]}\", 'wb') as f:\n",
+    "        f.write(response.content)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "af4074d4-eff4-45b2-902d-ec8c075a83ef",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [],
+   "source": [
+    "pdf_folder_path = f\"./rhoai-doc-{product_version}\"\n",
+    "# Same folder the download cell wrote to (docs_dir is built from the same f-string)\n",
+    "pdf_loader = PyPDFDirectoryLoader(pdf_folder_path)\n",
+    "pdf_docs = pdf_loader.load()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "cde7ed3a-0530-47a1-95c2-22db6c782a95",
+   "metadata": {},
+   "source": [
+    "#### Inject metadata"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "id": "702230f6-e6d3-44c7-a643-4996387606ff",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [],
+   "source": [
+    "from pathlib import Path\n",
+    "# Replace each document's source with the html-single URL keyed by its PDF file stem (KeyError if the stem is not in pdfs_to_urls)\n",
+    "for doc in pdf_docs:\n",
+    "    doc.metadata[\"source\"] = pdfs_to_urls[Path(doc.metadata[\"source\"]).stem]"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "dd511d44-2d92-47a0-9163-b25576c9557b",
+   "metadata": {},
+   "source": [
+    "#### Load websites"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "id": "8aebf003-d7ec-43ba-8e04-1931bcff2866",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [],
+   "source": [
+    "websites = [  # pages ingested in addition to the PDFs\n",
+    "    \"https://ai-on-openshift.io/getting-started/openshift/\",\n",
+    "    \"https://ai-on-openshift.io/getting-started/opendatahub/\",\n",
+    "    \"https://ai-on-openshift.io/getting-started/openshift-ai/\",\n",
+    "    \"https://ai-on-openshift.io/odh-rhoai/configuration/\",\n",
+    "    \"https://ai-on-openshift.io/odh-rhoai/custom-notebooks/\",\n",
+    "    \"https://ai-on-openshift.io/odh-rhoai/nvidia-gpus/\",\n",
+    "    \"https://ai-on-openshift.io/odh-rhoai/custom-runtime-triton/\",\n",
+    "    \"https://ai-on-openshift.io/odh-rhoai/openshift-group-management/\",\n",
+    "    \"https://ai-on-openshift.io/tools-and-applications/minio/minio/\",\n",
+    "    \"https://access.redhat.com/articles/7047935\",\n",
+    "    \"https://access.redhat.com/articles/rhoai-supported-configs\",\n",
+    "]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "id": "99f41110-8ca7-4d90-93b2-3b5021c894b8",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [],
+   "source": [
+    "website_loader = WebBaseLoader(websites)  # one loader for the whole URL list\n",
+    "website_docs = website_loader.load()  # presumably fetches each URL over the network; needs outbound access"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "157ddd29-54b3-474a-9b10-2d274bc3254f",
+   "metadata": {},
+   "source": [
+    "#### Merge both types of docs"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "id": "8d361094-8b43-4351-8495-37628c35c42d",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [],
+   "source": [
+    "docs = pdf_docs + website_docs  # PDF documents first, then the web pages"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "4198fe0a-38bf-4cd4-af7d-35b41c645edd",
+   "metadata": {},
+   "source": [
+    "#### Split documents into chunks with some overlap"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "id": "edba4a08-2194-4df1-9091-6f2b596757a1",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "Document(page_content='Red Hat OpenShift AI Self-Managed\\n2.13\\nOpenShift AI tutorial - Fraud detection\\nexample\\nUse OpenShift AI to train an example model in JupyterLab, deploy the model, and\\nrefine the model by using automated pipelines\\nLast Updated: 2024-09-20', metadata={'source': 'https://access.redhat.com/documentation/en-us/red_hat_openshift_ai_self-managed/2.13/html-single/openshift_ai_tutorial_-_fraud_detection_example/index', 'page': 0})"
+      ]
+     },
+     "execution_count": 11,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "text_splitter = RecursiveCharacterTextSplitter(chunk_size=1024,\n",
+    "                                               chunk_overlap=40)  # neighbouring chunks share up to 40 units of text\n",
+    "all_splits = text_splitter.split_documents(docs)\n",
+    "all_splits[0]  # display the first chunk as the cell output"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
+   "id": "79c2659f-4716-4c0a-a037-45af3560ab89",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [],
+   "source": [
+    "#!pip install sentence-transformers\n",
+    "#!pip show sentence-transformers\n",
+    "#!pip uninstall -y sentence-transformers\n",
+    "#!pip install sentence-transformers"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "7ae7eae2-c670-4eb5-803b-b4d591fa83db",
+   "metadata": {},
+   "source": [
+    "#### Create the index and ingest the documents"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 13,
+   "id": "bbb6a3e3-5ccd-441e-b80d-427555d9e9f6",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "You try to use a model that was created with version 2.4.0.dev0, however, your version is 2.4.0. This might cause unexpected behavior or errors. In that case, try to update to the latest version.\n",
+      "\n",
+      "\n",
+      "\n",
+      "<All keys matched successfully>\n"
+     ]
+    }
+   ],
+   "source": [
+    "# No 'device' entry: sentence-transformers then selects CUDA when it is available and falls back to CPU\n",
+    "model_kwargs = {'trust_remote_code': True}  # trust_remote_code runs code shipped in the model repository\n",
+    "embeddings = HuggingFaceEmbeddings(\n",
+    "    model_name=\"nomic-ai/nomic-embed-text-v1\",\n",
+    "    model_kwargs=model_kwargs,\n",
+    "    show_progress=True\n",
+    ")\n",
+    "\n",
+    "# drop_old=True asks the wrapper to drop any existing collection of this name, so each run re-ingests from scratch\n",
+    "db = Milvus(\n",
+    "    embedding_function=embeddings,\n",
+    "    connection_args={\"host\": MILVUS_HOST, \"port\": MILVUS_PORT, \"user\": MILVUS_USERNAME, \"password\": MILVUS_PASSWORD},\n",
+    "    collection_name=MILVUS_COLLECTION,\n",
+    "    metadata_field=\"metadata\",\n",
+    "    text_field=\"page_content\",\n",
+    "    auto_id=True,\n",
+    "    drop_old=True\n",
+    "    )"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 14,
+   "id": "b6bf425b-dffd-4f42-9537-49d41383182d",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "de0956f111864f95a1c17a1b0e7d6b9e",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Batches:   0%|          | 0/35 [00:00<?, ?it/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "text/plain": [
+       "[453133124104520064,\n",
+       " 453133124104520065,\n",
+       " 453133124104520066,\n",
+       " 453133124104520067,\n",
+       " 453133124104520068,\n",
+       " 453133124104520069,\n",
+       " 453133124104520070,\n",
+       " 453133124104520071,\n",
+       " 453133124104520072,\n",
+       " 453133124104520073,\n",
+       " 453133124104520074,\n",
+       " 453133124104520075,\n",
+       " 453133124104520076,\n",
+       " 453133124104520077,\n",
+       " 453133124104520078,\n",
+       " 453133124104520079,\n",
+       " 453133124104520080,\n",
+       " 453133124104520081,\n",
+       " 453133124104520082,\n",
+       " 453133124104520083,\n",
+       " 453133124104520084,\n",
+       " 453133124104520085,\n",
+       " 453133124104520086,\n",
+       " 453133124104520087,\n",
+       " 453133124104520088,\n",
+       " 453133124104520089,\n",
+       " 453133124104520090,\n",
+       " 453133124104520091,\n",
+       " 453133124104520092,\n",
+       " 453133124104520093,\n",
+       " 453133124104520094,\n",
+       " 453133124104520095,\n",
+       " 453133124104520096,\n",
+       " 453133124104520097,\n",
+       " 453133124104520098,\n",
+       " 453133124104520099,\n",
+       " 453133124104520100,\n",
+       " 453133124104520101,\n",
+       " 453133124104520102,\n",
+       " 453133124104520103,\n",
+       " 453133124104520104,\n",
+       " 453133124104520105,\n",
+       " 453133124104520106,\n",
+       " 453133124104520107,\n",
+       " 453133124104520108,\n",
+       " 453133124104520109,\n",
+       " 453133124104520110,\n",
+       " 453133124104520111,\n",
+       " 453133124104520112,\n",
+       " 453133124104520113,\n",
+       " 453133124104520114,\n",
+       " 453133124104520115,\n",
+       " 453133124104520116,\n",
+       " 453133124104520117,\n",
+       " 453133124104520118,\n",
+       " 453133124104520119,\n",
+       " 453133124104520120,\n",
+       " 453133124104520121,\n",
+       " 453133124104520122,\n",
+       " 453133124104520123,\n",
+       " 453133124104520124,\n",
+       " 453133124104520125,\n",
+       " 453133124104520126,\n",
+       " 453133124104520127,\n",
+       " 453133124104520128,\n",
+       " 453133124104520129,\n",
+       " 453133124104520130,\n",
+       " 453133124104520131,\n",
+       " 453133124104520132,\n",
+       " 453133124104520133,\n",
+       " 453133124104520134,\n",
+       " 453133124104520135,\n",
+       " 453133124104520136,\n",
+       " 453133124104520137,\n",
+       " 453133124104520138,\n",
+       " 453133124104520139,\n",
+       " 453133124104520140,\n",
+       " 453133124104520141,\n",
+       " 453133124104520142,\n",
+       " 453133124104520143,\n",
+       " 453133124104520144,\n",
+       " 453133124104520145,\n",
+       " 453133124104520146,\n",
+       " 453133124104520147,\n",
+       " 453133124104520148,\n",
+       " 453133124104520149,\n",
+       " 453133124104520150,\n",
+       " 453133124104520151,\n",
+       " 453133124104520152,\n",
+       " 453133124104520153,\n",
+       " 453133124104520154,\n",
+       " 453133124104520155,\n",
+       " 453133124104520156,\n",
+       " 453133124104520157,\n",
+       " 453133124104520158,\n",
+       " 453133124104520159,\n",
+       " 453133124104520160,\n",
+       " 453133124104520161,\n",
+       " 453133124104520162,\n",
+       " 453133124104520163,\n",
+       " 453133124104520164,\n",
+       " 453133124104520165,\n",
+       " 453133124104520166,\n",
+       " 453133124104520167,\n",
+       " 453133124104520168,\n",
+       " 453133124104520169,\n",
+       " 453133124104520170,\n",
+       " 453133124104520171,\n",
+       " 453133124104520172,\n",
+       " 453133124104520173,\n",
+       " 453133124104520174,\n",
+       " 453133124104520175,\n",
+       " 453133124104520176,\n",
+       " 453133124104520177,\n",
+       " 453133124104520178,\n",
+       " 453133124104520179,\n",
+       " 453133124104520180,\n",
+       " 453133124104520181,\n",
+       " 453133124104520182,\n",
+       " 453133124104520183,\n",
+       " 453133124104520184,\n",
+       " 453133124104520185,\n",
+       " 453133124104520186,\n",
+       " 453133124104520187,\n",
+       " 453133124104520188,\n",
+       " 453133124104520189,\n",
+       " 453133124104520190,\n",
+       " 453133124104520191,\n",
+       " 453133124104520192,\n",
+       " 453133124104520193,\n",
+       " 453133124104520194,\n",
+       " 453133124104520195,\n",
+       " 453133124104520196,\n",
+       " 453133124104520197,\n",
+       " 453133124104520198,\n",
+       " 453133124104520199,\n",
+       " 453133124104520200,\n",
+       " 453133124104520201,\n",
+       " 453133124104520202,\n",
+       " 453133124104520203,\n",
+       " 453133124104520204,\n",
+       " 453133124104520205,\n",
+       " 453133124104520206,\n",
+       " 453133124104520207,\n",
+       " 453133124104520208,\n",
+       " 453133124104520209,\n",
+       " 453133124104520210,\n",
+       " 453133124104520211,\n",
+       " 453133124104520212,\n",
+       " 453133124104520213,\n",
+       " 453133124104520214,\n",
+       " 453133124104520215,\n",
+       " 453133124104520216,\n",
+       " 453133124104520217,\n",
+       " 453133124104520218,\n",
+       " 453133124104520219,\n",
+       " 453133124104520220,\n",
+       " 453133124104520221,\n",
+       " 453133124104520222,\n",
+       " 453133124104520223,\n",
+       " 453133124104520224,\n",
+       " 453133124104520225,\n",
+       " 453133124104520226,\n",
+       " 453133124104520227,\n",
+       " 453133124104520228,\n",
+       " 453133124104520229,\n",
+       " 453133124104520230,\n",
+       " 453133124104520231,\n",
+       " 453133124104520232,\n",
+       " 453133124104520233,\n",
+       " 453133124104520234,\n",
+       " 453133124104520235,\n",
+       " 453133124104520236,\n",
+       " 453133124104520237,\n",
+       " 453133124104520238,\n",
+       " 453133124104520239,\n",
+       " 453133124104520240,\n",
+       " 453133124104520241,\n",
+       " 453133124104520242,\n",
+       " 453133124104520243,\n",
+       " 453133124104520244,\n",
+       " 453133124104520245,\n",
+       " 453133124104520246,\n",
+       " 453133124104520247,\n",
+       " 453133124104520248,\n",
+       " 453133124104520249,\n",
+       " 453133124104520250,\n",
+       " 453133124104520251,\n",
+       " 453133124104520252,\n",
+       " 453133124104520253,\n",
+       " 453133124104520254,\n",
+       " 453133124104520255,\n",
+       " 453133124104520256,\n",
+       " 453133124104520257,\n",
+       " 453133124104520258,\n",
+       " 453133124104520259,\n",
+       " 453133124104520260,\n",
+       " 453133124104520261,\n",
+       " 453133124104520262,\n",
+       " 453133124104520263,\n",
+       " 453133124104520264,\n",
+       " 453133124104520265,\n",
+       " 453133124104520266,\n",
+       " 453133124104520267,\n",
+       " 453133124104520268,\n",
+       " 453133124104520269,\n",
+       " 453133124104520270,\n",
+       " 453133124104520271,\n",
+       " 453133124104520272,\n",
+       " 453133124104520273,\n",
+       " 453133124104520274,\n",
+       " 453133124104520275,\n",
+       " 453133124104520276,\n",
+       " 453133124104520277,\n",
+       " 453133124104520278,\n",
+       " 453133124104520279,\n",
+       " 453133124104520280,\n",
+       " 453133124104520281,\n",
+       " 453133124104520282,\n",
+       " 453133124104520283,\n",
+       " 453133124104520284,\n",
+       " 453133124104520285,\n",
+       " 453133124104520286,\n",
+       " 453133124104520287,\n",
+       " 453133124104520288,\n",
+       " 453133124104520289,\n",
+       " 453133124104520290,\n",
+       " 453133124104520291,\n",
+       " 453133124104520292,\n",
+       " 453133124104520293,\n",
+       " 453133124104520294,\n",
+       " 453133124104520295,\n",
+       " 453133124104520296,\n",
+       " 453133124104520297,\n",
+       " 453133124104520298,\n",
+       " 453133124104520299,\n",
+       " 453133124104520300,\n",
+       " 453133124104520301,\n",
+       " 453133124104520302,\n",
+       " 453133124104520303,\n",
+       " 453133124104520304,\n",
+       " 453133124104520305,\n",
+       " 453133124104520306,\n",
+       " 453133124104520307,\n",
+       " 453133124104520308,\n",
+       " 453133124104520309,\n",
+       " 453133124104520310,\n",
+       " 453133124104520311,\n",
+       " 453133124104520312,\n",
+       " 453133124104520313,\n",
+       " 453133124104520314,\n",
+       " 453133124104520315,\n",
+       " 453133124104520316,\n",
+       " 453133124104520317,\n",
+       " 453133124104520318,\n",
+       " 453133124104520319,\n",
+       " 453133124104520320,\n",
+       " 453133124104520321,\n",
+       " 453133124104520322,\n",
+       " 453133124104520323,\n",
+       " 453133124104520324,\n",
+       " 453133124104520325,\n",
+       " 453133124104520326,\n",
+       " 453133124104520327,\n",
+       " 453133124104520328,\n",
+       " 453133124104520329,\n",
+       " 453133124104520330,\n",
+       " 453133124104520331,\n",
+       " 453133124104520332,\n",
+       " 453133124104520333,\n",
+       " 453133124104520334,\n",
+       " 453133124104520335,\n",
+       " 453133124104520336,\n",
+       " 453133124104520337,\n",
+       " 453133124104520338,\n",
+       " 453133124104520339,\n",
+       " 453133124104520340,\n",
+       " 453133124104520341,\n",
+       " 453133124104520342,\n",
+       " 453133124104520343,\n",
+       " 453133124104520344,\n",
+       " 453133124104520345,\n",
+       " 453133124104520346,\n",
+       " 453133124104520347,\n",
+       " 453133124104520348,\n",
+       " 453133124104520349,\n",
+       " 453133124104520350,\n",
+       " 453133124104520351,\n",
+       " 453133124104520352,\n",
+       " 453133124104520353,\n",
+       " 453133124104520354,\n",
+       " 453133124104520355,\n",
+       " 453133124104520356,\n",
+       " 453133124104520357,\n",
+       " 453133124104520358,\n",
+       " 453133124104520359,\n",
+       " 453133124104520360,\n",
+       " 453133124104520361,\n",
+       " 453133124104520362,\n",
+       " 453133124104520363,\n",
+       " 453133124104520364,\n",
+       " 453133124104520365,\n",
+       " 453133124104520366,\n",
+       " 453133124104520367,\n",
+       " 453133124104520368,\n",
+       " 453133124104520369,\n",
+       " 453133124104520370,\n",
+       " 453133124104520371,\n",
+       " 453133124104520372,\n",
+       " 453133124104520373,\n",
+       " 453133124104520374,\n",
+       " 453133124104520375,\n",
+       " 453133124104520376,\n",
+       " 453133124104520377,\n",
+       " 453133124104520378,\n",
+       " 453133124104520379,\n",
+       " 453133124104520380,\n",
+       " 453133124104520381,\n",
+       " 453133124104520382,\n",
+       " 453133124104520383,\n",
+       " 453133124104520384,\n",
+       " 453133124104520385,\n",
+       " 453133124104520386,\n",
+       " 453133124104520387,\n",
+       " 453133124104520388,\n",
+       " 453133124104520389,\n",
+       " 453133124104520390,\n",
+       " 453133124104520391,\n",
+       " 453133124104520392,\n",
+       " 453133124104520393,\n",
+       " 453133124104520394,\n",
+       " 453133124104520395,\n",
+       " 453133124104520396,\n",
+       " 453133124104520397,\n",
+       " 453133124104520398,\n",
+       " 453133124104520399,\n",
+       " 453133124104520400,\n",
+       " 453133124104520401,\n",
+       " 453133124104520402,\n",
+       " 453133124104520403,\n",
+       " 453133124104520404,\n",
+       " 453133124104520405,\n",
+       " 453133124104520406,\n",
+       " 453133124104520407,\n",
+       " 453133124104520408,\n",
+       " 453133124104520409,\n",
+       " 453133124104520410,\n",
+       " 453133124104520411,\n",
+       " 453133124104520412,\n",
+       " 453133124104520413,\n",
+       " 453133124104520414,\n",
+       " 453133124104520415,\n",
+       " 453133124104520416,\n",
+       " 453133124104520417,\n",
+       " 453133124104520418,\n",
+       " 453133124104520419,\n",
+       " 453133124104520420,\n",
+       " 453133124104520421,\n",
+       " 453133124104520422,\n",
+       " 453133124104520423,\n",
+       " 453133124104520424,\n",
+       " 453133124104520425,\n",
+       " 453133124104520426,\n",
+       " 453133124104520427,\n",
+       " 453133124104520428,\n",
+       " 453133124104520429,\n",
+       " 453133124104520430,\n",
+       " 453133124104520431,\n",
+       " 453133124104520432,\n",
+       " 453133124104520433,\n",
+       " 453133124104520434,\n",
+       " 453133124104520435,\n",
+       " 453133124104520436,\n",
+       " 453133124104520437,\n",
+       " 453133124104520438,\n",
+       " 453133124104520439,\n",
+       " 453133124104520440,\n",
+       " 453133124104520441,\n",
+       " 453133124104520442,\n",
+       " 453133124104520443,\n",
+       " 453133124104520444,\n",
+       " 453133124104520445,\n",
+       " 453133124104520446,\n",
+       " 453133124104520447,\n",
+       " 453133124104520448,\n",
+       " 453133124104520449,\n",
+       " 453133124104520450,\n",
+       " 453133124104520451,\n",
+       " 453133124104520452,\n",
+       " 453133124104520453,\n",
+       " 453133124104520454,\n",
+       " 453133124104520455,\n",
+       " 453133124104520456,\n",
+       " 453133124104520457,\n",
+       " 453133124104520458,\n",
+       " 453133124104520459,\n",
+       " 453133124104520460,\n",
+       " 453133124104520461,\n",
+       " 453133124104520462,\n",
+       " 453133124104520463,\n",
+       " 453133124104520464,\n",
+       " 453133124104520465,\n",
+       " 453133124104520466,\n",
+       " 453133124104520467,\n",
+       " 453133124104520468,\n",
+       " 453133124104520469,\n",
+       " 453133124104520470,\n",
+       " 453133124104520471,\n",
+       " 453133124104520472,\n",
+       " 453133124104520473,\n",
+       " 453133124104520474,\n",
+       " 453133124104520475,\n",
+       " 453133124104520476,\n",
+       " 453133124104520477,\n",
+       " 453133124104520478,\n",
+       " 453133124104520479,\n",
+       " 453133124104520480,\n",
+       " 453133124104520481,\n",
+       " 453133124104520482,\n",
+       " 453133124104520483,\n",
+       " 453133124104520484,\n",
+       " 453133124104520485,\n",
+       " 453133124104520486,\n",
+       " 453133124104520487,\n",
+       " 453133124104520488,\n",
+       " 453133124104520489,\n",
+       " 453133124104520490,\n",
+       " 453133124104520491,\n",
+       " 453133124104520492,\n",
+       " 453133124104520493,\n",
+       " 453133124104520494,\n",
+       " 453133124104520495,\n",
+       " 453133124104520496,\n",
+       " 453133124104520497,\n",
+       " 453133124104520498,\n",
+       " 453133124104520499,\n",
+       " 453133124104520500,\n",
+       " 453133124104520501,\n",
+       " 453133124104520502,\n",
+       " 453133124104520503,\n",
+       " 453133124104520504,\n",
+       " 453133124104520505,\n",
+       " 453133124104520506,\n",
+       " 453133124104520507,\n",
+       " 453133124104520508,\n",
+       " 453133124104520509,\n",
+       " 453133124104520510,\n",
+       " 453133124104520511,\n",
+       " 453133124104520512,\n",
+       " 453133124104520513,\n",
+       " 453133124104520514,\n",
+       " 453133124104520515,\n",
+       " 453133124104520516,\n",
+       " 453133124104520517,\n",
+       " 453133124104520518,\n",
+       " 453133124104520519,\n",
+       " 453133124104520520,\n",
+       " 453133124104520521,\n",
+       " 453133124104520522,\n",
+       " 453133124104520523,\n",
+       " 453133124104520524,\n",
+       " 453133124104520525,\n",
+       " 453133124104520526,\n",
+       " 453133124104520527,\n",
+       " 453133124104520528,\n",
+       " 453133124104520529,\n",
+       " 453133124104520530,\n",
+       " 453133124104520531,\n",
+       " 453133124104520532,\n",
+       " 453133124104520533,\n",
+       " 453133124104520534,\n",
+       " 453133124104520535,\n",
+       " 453133124104520536,\n",
+       " 453133124104520537,\n",
+       " 453133124104520538,\n",
+       " 453133124104520539,\n",
+       " 453133124104520540,\n",
+       " 453133124104520541,\n",
+       " 453133124104520542,\n",
+       " 453133124104520543,\n",
+       " 453133124104520544,\n",
+       " 453133124104520545,\n",
+       " 453133124104520546,\n",
+       " 453133124104520547,\n",
+       " 453133124104520548,\n",
+       " 453133124104520549,\n",
+       " 453133124104520550,\n",
+       " 453133124104520551,\n",
+       " 453133124104520552,\n",
+       " 453133124104520553,\n",
+       " 453133124104520554,\n",
+       " 453133124104520555,\n",
+       " 453133124104520556,\n",
+       " 453133124104520557,\n",
+       " 453133124104520558,\n",
+       " 453133124104520559,\n",
+       " 453133124104520560,\n",
+       " 453133124104520561,\n",
+       " 453133124104520562,\n",
+       " 453133124104520563,\n",
+       " 453133124104520564,\n",
+       " 453133124104520565,\n",
+       " 453133124104520566,\n",
+       " 453133124104520567,\n",
+       " 453133124104520568,\n",
+       " 453133124104520569,\n",
+       " 453133124104520570,\n",
+       " 453133124104520571,\n",
+       " 453133124104520572,\n",
+       " 453133124104520573,\n",
+       " 453133124104520574,\n",
+       " 453133124104520575,\n",
+       " 453133124104520576,\n",
+       " 453133124104520577,\n",
+       " 453133124104520578,\n",
+       " 453133124104520579,\n",
+       " 453133124104520580,\n",
+       " 453133124104520581,\n",
+       " 453133124104520582,\n",
+       " 453133124104520583,\n",
+       " 453133124104520584,\n",
+       " 453133124104520585,\n",
+       " 453133124104520586,\n",
+       " 453133124104520587,\n",
+       " 453133124104520588,\n",
+       " 453133124104520589,\n",
+       " 453133124104520590,\n",
+       " 453133124104520591,\n",
+       " 453133124104520592,\n",
+       " 453133124104520593,\n",
+       " 453133124104520594,\n",
+       " 453133124104520595,\n",
+       " 453133124104520596,\n",
+       " 453133124104520597,\n",
+       " 453133124104520598,\n",
+       " 453133124104520599,\n",
+       " 453133124104520600,\n",
+       " 453133124104520601,\n",
+       " 453133124104520602,\n",
+       " 453133124104520603,\n",
+       " 453133124104520604,\n",
+       " 453133124104520605,\n",
+       " 453133124104520606,\n",
+       " 453133124104520607,\n",
+       " 453133124104520608,\n",
+       " 453133124104520609,\n",
+       " 453133124104520610,\n",
+       " 453133124104520611,\n",
+       " 453133124104520612,\n",
+       " 453133124104520613,\n",
+       " 453133124104520614,\n",
+       " 453133124104520615,\n",
+       " 453133124104520616,\n",
+       " 453133124104520617,\n",
+       " 453133124104520618,\n",
+       " 453133124104520619,\n",
+       " 453133124104520620,\n",
+       " 453133124104520621,\n",
+       " 453133124104520622,\n",
+       " 453133124104520623,\n",
+       " 453133124104520624,\n",
+       " 453133124104520625,\n",
+       " 453133124104520626,\n",
+       " 453133124104520627,\n",
+       " 453133124104520628,\n",
+       " 453133124104520629,\n",
+       " 453133124104520630,\n",
+       " 453133124104520631,\n",
+       " 453133124104520632,\n",
+       " 453133124104520633,\n",
+       " 453133124104520634,\n",
+       " 453133124104520635,\n",
+       " 453133124104520636,\n",
+       " 453133124104520637,\n",
+       " 453133124104520638,\n",
+       " 453133124104520639,\n",
+       " 453133124104520640,\n",
+       " 453133124104520641,\n",
+       " 453133124104520642,\n",
+       " 453133124104520643,\n",
+       " 453133124104520644,\n",
+       " 453133124104520645,\n",
+       " 453133124104520646,\n",
+       " 453133124104520647,\n",
+       " 453133124104520648,\n",
+       " 453133124104520649,\n",
+       " 453133124104520650,\n",
+       " 453133124104520651,\n",
+       " 453133124104520652,\n",
+       " 453133124104520653,\n",
+       " 453133124104520654,\n",
+       " 453133124104520655,\n",
+       " 453133124104520656,\n",
+       " 453133124104520657,\n",
+       " 453133124104520658,\n",
+       " 453133124104520659,\n",
+       " 453133124104520660,\n",
+       " 453133124104520661,\n",
+       " 453133124104520662,\n",
+       " 453133124104520663,\n",
+       " 453133124104520664,\n",
+       " 453133124104520665,\n",
+       " 453133124104520666,\n",
+       " 453133124104520667,\n",
+       " 453133124104520668,\n",
+       " 453133124104520669,\n",
+       " 453133124104520670,\n",
+       " 453133124104520671,\n",
+       " 453133124104520672,\n",
+       " 453133124104520673,\n",
+       " 453133124104520674,\n",
+       " 453133124104520675,\n",
+       " 453133124104520676,\n",
+       " 453133124104520677,\n",
+       " 453133124104520678,\n",
+       " 453133124104520679,\n",
+       " 453133124104520680,\n",
+       " 453133124104520681,\n",
+       " 453133124104520682,\n",
+       " 453133124104520683,\n",
+       " 453133124104520684,\n",
+       " 453133124104520685,\n",
+       " 453133124104520686,\n",
+       " 453133124104520687,\n",
+       " 453133124104520688,\n",
+       " 453133124104520689,\n",
+       " 453133124104520690,\n",
+       " 453133124104520691,\n",
+       " 453133124104520692,\n",
+       " 453133124104520693,\n",
+       " 453133124104520694,\n",
+       " 453133124104520695,\n",
+       " 453133124104520696,\n",
+       " 453133124104520697,\n",
+       " 453133124104520698,\n",
+       " 453133124104520699,\n",
+       " 453133124104520700,\n",
+       " 453133124104520701,\n",
+       " 453133124104520702,\n",
+       " 453133124104520703,\n",
+       " 453133124104520704,\n",
+       " 453133124104520705,\n",
+       " 453133124104520706,\n",
+       " 453133124104520707,\n",
+       " 453133124104520708,\n",
+       " 453133124104520709,\n",
+       " 453133124104520710,\n",
+       " 453133124104520711,\n",
+       " 453133124104520712,\n",
+       " 453133124104520713,\n",
+       " 453133124104520714,\n",
+       " 453133124104520715,\n",
+       " 453133124104520716,\n",
+       " 453133124104520717,\n",
+       " 453133124104520718,\n",
+       " 453133124104520719,\n",
+       " 453133124104520720,\n",
+       " 453133124104520721,\n",
+       " 453133124104520722,\n",
+       " 453133124104520723,\n",
+       " 453133124104520724,\n",
+       " 453133124104520725,\n",
+       " 453133124104520726,\n",
+       " 453133124104520727,\n",
+       " 453133124104520728,\n",
+       " 453133124104520729,\n",
+       " 453133124104520730,\n",
+       " 453133124104520731,\n",
+       " 453133124104520732,\n",
+       " 453133124104520733,\n",
+       " 453133124104520734,\n",
+       " 453133124104520735,\n",
+       " 453133124104520736,\n",
+       " 453133124104520737,\n",
+       " 453133124104520738,\n",
+       " 453133124104520739,\n",
+       " 453133124104520740,\n",
+       " 453133124104520741,\n",
+       " 453133124104520742,\n",
+       " 453133124104520743,\n",
+       " 453133124104520744,\n",
+       " 453133124104520745,\n",
+       " 453133124104520746,\n",
+       " 453133124104520747,\n",
+       " 453133124104520748,\n",
+       " 453133124104520749,\n",
+       " 453133124104520750,\n",
+       " 453133124104520751,\n",
+       " 453133124104520752,\n",
+       " 453133124104520753,\n",
+       " 453133124104520754,\n",
+       " 453133124104520755,\n",
+       " 453133124104520756,\n",
+       " 453133124104520757,\n",
+       " 453133124104520758,\n",
+       " 453133124104520759,\n",
+       " 453133124104520760,\n",
+       " 453133124104520761,\n",
+       " 453133124104520762,\n",
+       " 453133124104520763,\n",
+       " 453133124104520764,\n",
+       " 453133124104520765,\n",
+       " 453133124104520766,\n",
+       " 453133124104520767,\n",
+       " 453133124104520768,\n",
+       " 453133124104520769,\n",
+       " 453133124104520770,\n",
+       " 453133124104520771,\n",
+       " 453133124104520772,\n",
+       " 453133124104520773,\n",
+       " 453133124104520774,\n",
+       " 453133124104520775,\n",
+       " 453133124104520776,\n",
+       " 453133124104520777,\n",
+       " 453133124104520778,\n",
+       " 453133124104520779,\n",
+       " 453133124104520780,\n",
+       " 453133124104520781,\n",
+       " 453133124104520782,\n",
+       " 453133124104520783,\n",
+       " 453133124104520784,\n",
+       " 453133124104520785,\n",
+       " 453133124104520786,\n",
+       " 453133124104520787,\n",
+       " 453133124104520788,\n",
+       " 453133124104520789,\n",
+       " 453133124104520790,\n",
+       " 453133124104520791,\n",
+       " 453133124104520792,\n",
+       " 453133124104520793,\n",
+       " 453133124104520794,\n",
+       " 453133124104520795,\n",
+       " 453133124104520796,\n",
+       " 453133124104520797,\n",
+       " 453133124104520798,\n",
+       " 453133124104520799,\n",
+       " 453133124104520800,\n",
+       " 453133124104520801,\n",
+       " 453133124104520802,\n",
+       " 453133124104520803,\n",
+       " 453133124104520804,\n",
+       " 453133124104520805,\n",
+       " 453133124104520806,\n",
+       " 453133124104520807,\n",
+       " 453133124104520808,\n",
+       " 453133124104520809,\n",
+       " 453133124104520810,\n",
+       " 453133124104520811,\n",
+       " 453133124104520812,\n",
+       " 453133124104520813,\n",
+       " 453133124104520814,\n",
+       " 453133124104520815,\n",
+       " 453133124104520816,\n",
+       " 453133124104520817,\n",
+       " 453133124104520818,\n",
+       " 453133124104520819,\n",
+       " 453133124104520820,\n",
+       " 453133124104520821,\n",
+       " 453133124104520822,\n",
+       " 453133124104520823,\n",
+       " 453133124104520824,\n",
+       " 453133124104520825,\n",
+       " 453133124104520826,\n",
+       " 453133124104520827,\n",
+       " 453133124104520828,\n",
+       " 453133124104520829,\n",
+       " 453133124104520830,\n",
+       " 453133124104520831,\n",
+       " 453133124104520832,\n",
+       " 453133124104520833,\n",
+       " 453133124104520834,\n",
+       " 453133124104520835,\n",
+       " 453133124104520836,\n",
+       " 453133124104520837,\n",
+       " 453133124104520838,\n",
+       " 453133124104520839,\n",
+       " 453133124104520840,\n",
+       " 453133124104520841,\n",
+       " 453133124104520842,\n",
+       " 453133124104520843,\n",
+       " 453133124104520844,\n",
+       " 453133124104520845,\n",
+       " 453133124104520846,\n",
+       " 453133124104520847,\n",
+       " 453133124104520848,\n",
+       " 453133124104520849,\n",
+       " 453133124104520850,\n",
+       " 453133124104520851,\n",
+       " 453133124104520852,\n",
+       " 453133124104520853,\n",
+       " 453133124104520854,\n",
+       " 453133124104520855,\n",
+       " 453133124104520856,\n",
+       " 453133124104520857,\n",
+       " 453133124104520858,\n",
+       " 453133124104520859,\n",
+       " 453133124104520860,\n",
+       " 453133124104520861,\n",
+       " 453133124104520862,\n",
+       " 453133124104520863,\n",
+       " 453133124104520864,\n",
+       " 453133124104520865,\n",
+       " 453133124104520866,\n",
+       " 453133124104520867,\n",
+       " 453133124104520868,\n",
+       " 453133124104520869,\n",
+       " 453133124104520870,\n",
+       " 453133124104520871,\n",
+       " 453133124104520872,\n",
+       " 453133124104520873,\n",
+       " 453133124104520874,\n",
+       " 453133124104520875,\n",
+       " 453133124104520876,\n",
+       " 453133124104520877,\n",
+       " 453133124104520878,\n",
+       " 453133124104520879,\n",
+       " 453133124104520880,\n",
+       " 453133124104520881,\n",
+       " 453133124104520882,\n",
+       " 453133124104520883,\n",
+       " 453133124104520884,\n",
+       " 453133124104520885,\n",
+       " 453133124104520886,\n",
+       " 453133124104520887,\n",
+       " 453133124104520888,\n",
+       " 453133124104520889,\n",
+       " 453133124104520890,\n",
+       " 453133124104520891,\n",
+       " 453133124104520892,\n",
+       " 453133124104520893,\n",
+       " 453133124104520894,\n",
+       " 453133124104520895,\n",
+       " 453133124104520896,\n",
+       " 453133124104520897,\n",
+       " 453133124104520898,\n",
+       " 453133124104520899,\n",
+       " 453133124104520900,\n",
+       " 453133124104520901,\n",
+       " 453133124104520902,\n",
+       " 453133124104520903,\n",
+       " 453133124104520904,\n",
+       " 453133124104520905,\n",
+       " 453133124104520906,\n",
+       " 453133124104520907,\n",
+       " 453133124104520908,\n",
+       " 453133124104520909,\n",
+       " 453133124104520910,\n",
+       " 453133124104520911,\n",
+       " 453133124104520912,\n",
+       " 453133124104520913,\n",
+       " 453133124104520914,\n",
+       " 453133124104520915,\n",
+       " 453133124104520916,\n",
+       " 453133124104520917,\n",
+       " 453133124104520918,\n",
+       " 453133124104520919,\n",
+       " 453133124104520920,\n",
+       " 453133124104520921,\n",
+       " 453133124104520922,\n",
+       " 453133124104520923,\n",
+       " 453133124104520924,\n",
+       " 453133124104520925,\n",
+       " 453133124104520926,\n",
+       " 453133124104520927,\n",
+       " 453133124104520928,\n",
+       " 453133124104520929,\n",
+       " 453133124104520930,\n",
+       " 453133124104520931,\n",
+       " 453133124104520932,\n",
+       " 453133124104520933,\n",
+       " 453133124104520934,\n",
+       " 453133124104520935,\n",
+       " 453133124104520936,\n",
+       " 453133124104520937,\n",
+       " 453133124104520938,\n",
+       " 453133124104520939,\n",
+       " 453133124104520940,\n",
+       " 453133124104520941,\n",
+       " 453133124104520942,\n",
+       " 453133124104520943,\n",
+       " 453133124104520944,\n",
+       " 453133124104520945,\n",
+       " 453133124104520946,\n",
+       " 453133124104520947,\n",
+       " 453133124104520948,\n",
+       " 453133124104520949,\n",
+       " 453133124104520950,\n",
+       " 453133124104520951,\n",
+       " 453133124104520952,\n",
+       " 453133124104520953,\n",
+       " 453133124104520954,\n",
+       " 453133124104520955,\n",
+       " 453133124104520956,\n",
+       " 453133124104520957,\n",
+       " 453133124104520958,\n",
+       " 453133124104520959,\n",
+       " 453133124104520960,\n",
+       " 453133124104520961,\n",
+       " 453133124104520962,\n",
+       " 453133124104520963,\n",
+       " 453133124104520964,\n",
+       " 453133124104520965,\n",
+       " 453133124104520966,\n",
+       " 453133124104520967,\n",
+       " 453133124104520968,\n",
+       " 453133124104520969,\n",
+       " 453133124104520970,\n",
+       " 453133124104520971,\n",
+       " 453133124104520972,\n",
+       " 453133124104520973,\n",
+       " 453133124104520974,\n",
+       " 453133124104520975,\n",
+       " 453133124104520976,\n",
+       " 453133124104520977,\n",
+       " 453133124104520978,\n",
+       " 453133124104520979,\n",
+       " 453133124104520980,\n",
+       " 453133124104520981,\n",
+       " 453133124104520982,\n",
+       " 453133124104520983,\n",
+       " 453133124104520984,\n",
+       " 453133124104520985,\n",
+       " 453133124104520986,\n",
+       " 453133124104520987,\n",
+       " 453133124104520988,\n",
+       " 453133124104520989,\n",
+       " 453133124104520990,\n",
+       " 453133124104520991,\n",
+       " 453133124104520992,\n",
+       " 453133124104520993,\n",
+       " 453133124104520994,\n",
+       " 453133124104520995,\n",
+       " 453133124104520996,\n",
+       " 453133124104520997,\n",
+       " 453133124104520998,\n",
+       " 453133124104520999,\n",
+       " 453133124104521000,\n",
+       " 453133124104521001,\n",
+       " 453133124104521002,\n",
+       " 453133124104521003,\n",
+       " 453133124104521004,\n",
+       " 453133124104521005,\n",
+       " 453133124104521006,\n",
+       " 453133124104521007,\n",
+       " 453133124104521008,\n",
+       " 453133124104521009,\n",
+       " 453133124104521010,\n",
+       " 453133124104521011,\n",
+       " 453133124104521012,\n",
+       " 453133124104521013,\n",
+       " 453133124104521014,\n",
+       " 453133124104521015,\n",
+       " 453133124104521016,\n",
+       " 453133124104521017,\n",
+       " 453133124104521018,\n",
+       " 453133124104521019,\n",
+       " 453133124104521020,\n",
+       " 453133124104521021,\n",
+       " 453133124104521022,\n",
+       " 453133124104521023,\n",
+       " 453133124104521024,\n",
+       " 453133124104521025,\n",
+       " 453133124104521026,\n",
+       " 453133124104521027,\n",
+       " 453133124104521028,\n",
+       " 453133124104521029,\n",
+       " 453133124104521030,\n",
+       " 453133124104521031,\n",
+       " 453133124104521032,\n",
+       " 453133124104521033,\n",
+       " 453133124104521034,\n",
+       " 453133124104521035,\n",
+       " 453133124104521036,\n",
+       " 453133124104521037,\n",
+       " 453133124104521038,\n",
+       " 453133124104521039,\n",
+       " 453133124104521040,\n",
+       " 453133124104521041,\n",
+       " 453133124104521042,\n",
+       " 453133124104521043,\n",
+       " 453133124104521044,\n",
+       " 453133124104521045,\n",
+       " 453133124104521046,\n",
+       " 453133124104521047,\n",
+       " 453133124104521048,\n",
+       " 453133124104521049,\n",
+       " 453133124104521050,\n",
+       " 453133124104521051,\n",
+       " 453133124104521052,\n",
+       " 453133124104521053,\n",
+       " 453133124104521054,\n",
+       " 453133124104521055,\n",
+       " 453133124104521056,\n",
+       " 453133124104521057,\n",
+       " 453133124104521058,\n",
+       " 453133124104521059,\n",
+       " 453133124104521060,\n",
+       " 453133124104521061,\n",
+       " 453133124104521062,\n",
+       " 453133124104521063,\n",
+       " ...]"
+      ]
+     },
+     "execution_count": 14,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "len(db.add_documents(all_splits))  # show how many chunks were stored instead of echoing every returned ID"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "7a3d987b-8ebc-46ce-a206-48c1339b7a5b",
+   "metadata": {},
+   "source": [
+    "#### Alternatively, add new documents to an existing collection (uncomment the cell below)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 15,
+   "id": "c37f227d-a13d-456c-b91b-3c203e62fc0f",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# If you don't want to use a GPU, you can remove the 'device': 'cuda' argument\n",
+    "# model_kwargs = {'trust_remote_code': True, 'device': 'cuda'}\n",
+    "# embeddings = HuggingFaceEmbeddings(\n",
+    "#     model_name=\"nomic-ai/nomic-embed-text-v1\",\n",
+    "#     model_kwargs=model_kwargs,\n",
+    "#     show_progress=True\n",
+    "# )\n",
+    "\n",
+    "# db = Milvus(\n",
+    "#     embedding_function=embeddings,\n",
+    "#     connection_args={\"host\": MILVUS_HOST, \"port\": MILVUS_PORT, \"user\": MILVUS_USERNAME, \"password\": MILVUS_PASSWORD},\n",
+    "#     collection_name=MILVUS_COLLECTION,\n",
+    "#     metadata_field=\"metadata\",\n",
+    "#     text_field=\"page_content\",\n",
+    "#     auto_id=True,\n",
+    "#     drop_old=False\n",
+    "#     )\n",
+    "\n",
+    "# db.add_documents(all_splits)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "dae3b458-4979-46df-8493-7496764a2568",
+   "metadata": {},
+   "source": [
+    "#### Test query"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 16,
+   "id": "489c6e6d-c42c-4de4-87cf-8edfd0e63da3",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "2778136258c74138af5abb11ad8d812c",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Batches:   0%|          | 0/1 [00:00<?, ?it/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "query = \"How can I install OpenShift AI?\"\n",
+    "docs_with_score = db.similarity_search_with_score(query, k=4)  # four best hits (the default), made explicit"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 17,
+   "id": "90feeb37-7888-4c5f-a5cb-5f82637cec16",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "--------------------------------------------------------------------------------\n",
+      "Score:  0.4710683524608612\n",
+      "Pak for Data version 5.0.3 or greater. These versions of Cloud Pak for Data include\n",
+      "watsonx.ai. If this use case does not apply to your organization, see \n",
+      "Installing and\n",
+      "deploying OpenShift AI in a disconnected environment\n",
+      " for more generally applicable\n",
+      "instructions.\n",
+      "This procedure shows how to use the OpenShift command-line interface (CLI) to install the Red Hat\n",
+      "OpenShift AI Operator on your OpenShift cluster. You must install the Operator before you can manage\n",
+      "the installation of OpenShift AI components.\n",
+      "Prerequisites\n",
+      "You have a running OpenShift cluster, version 4.12 or greater, configured with a default storage\n",
+      "class that can be dynamically provisioned.\n",
+      "You have cluster administrator privileges for your OpenShift cluster.\n",
+      "You have downloaded and installed the OpenShift command-line interface (CLI). See \n",
+      "Installing\n",
+      "the OpenShift CLI\n",
+      ".\n",
+      "You have mirrored the required container images to a private registry. See \n",
+      "Mirroring images to\n",
+      "a private registry for a disconnected installation\n",
+      ".\n",
+      "Procedure\n",
+      "1\n",
+      ".\n",
+      "--------------------------------------------------------------------------------\n",
+      "--------------------------------------------------------------------------------\n",
+      "Score:  0.4710858166217804\n",
+      "OpenShift is a Limited Availability feature. Limited Availability means that you can install\n",
+      "and receive support for the feature only with specific approval from the Red Hat AI\n",
+      "Business Unit. Without such approval, the feature is unsupported.\n",
+      "Prerequisites\n",
+      "You have logged in to Red Hat OpenShift AI.\n",
+      "You have cluster administrator privileges for your OpenShift cluster.\n",
+      "You have created an OpenShift cluster that has a node with at least 4 CPUs and 16 GB memory.\n",
+      "You have installed the Red Hat OpenShift AI (RHOAI) Operator.\n",
+      "You have installed the OpenShift command-line interface (CLI). For more information about\n",
+      "installing the OpenShift command-line interface (CLI), see \n",
+      "Getting started with the OpenShift\n",
+      "CLI\n",
+      ".\n",
+      "You have installed KServe.\n",
+      "You have access to S3-compatible object storage.\n",
+      "For the model that you want to deploy, you know the associated folder path in your S3-\n",
+      "compatible object storage bucket.\n",
+      "To use the Caikit-TGIS runtime, you have converted your model to Caikit format. For an\n",
+      "--------------------------------------------------------------------------------\n",
+      "--------------------------------------------------------------------------------\n",
+      "Score:  0.47165608406066895\n",
+      "Red Hat OpenShift AI Self-Managed 2.13 Installing and uninstalling OpenShift AI Self-Managed\n",
+      "20\n",
+      "--------------------------------------------------------------------------------\n",
+      "--------------------------------------------------------------------------------\n",
+      "Score:  0.4717487096786499\n",
+      "Red Hat OpenShift AI Self-Managed\n",
+      " \n",
+      "2.13\n",
+      " \n",
+      "Installing and uninstalling\n",
+      "OpenShift AI Self-Managed\n",
+      "Install and uninstall OpenShift AI Self-Managed\n",
+      "--------------------------------------------------------------------------------\n"
+     ]
+    }
+   ],
+   "source": [
+    "rule = \"-\" * 80  # separator drawn above and below every hit\n",
+    "for doc, score in docs_with_score:\n",
+    "    print(rule)\n",
+    "    print(\"Score: \", score)\n",
+    "    print(doc.page_content, rule, sep=\"\\n\")"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3.9",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.9.18"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git a/lab-materials/04-rag/5.2-query-rag.ipynb b/lab-materials/04-rag/5.2-query-rag.ipynb
new file mode 100644
index 0000000..cb6eafd
--- /dev/null
+++ b/lab-materials/04-rag/5.2-query-rag.ipynb
@@ -0,0 +1,280 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "165a3407",
+   "metadata": {},
+   "source": [
+    "## Querying a Milvus index - Nomic AI Embeddings\n",
+    "\n",
+    "How to query content from a Milvus VectorStore."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "48ac3132-6929-4477-9585-31761d7d9848",
+   "metadata": {},
+   "source": [
+    "### Needed packages and imports"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "1ed97389-9c5b-46a8-bedf-f28bf7038a07",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\u001b[31mERROR: pip's dependency resolver does not currently take into account all the packages that are installed. This behaviour is the source of the following dependency conflicts.\n",
+      "kfp 1.8.22 requires requests-toolbelt<1,>=0.8.0, but you have requests-toolbelt 1.0.0 which is incompatible.\u001b[0m\u001b[31m\n",
+      "\u001b[0m\n",
+      "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m A new release of pip is available: \u001b[0m\u001b[31;49m23.2.1\u001b[0m\u001b[39;49m -> \u001b[0m\u001b[32;49m24.2\u001b[0m\n",
+      "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m To update, run: \u001b[0m\u001b[32;49mpip install --upgrade pip\u001b[0m\n",
+      "\n",
+      "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m A new release of pip is available: \u001b[0m\u001b[31;49m23.2.1\u001b[0m\u001b[39;49m -> \u001b[0m\u001b[32;49m24.2\u001b[0m\n",
+      "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m To update, run: \u001b[0m\u001b[32;49mpip install --upgrade pip\u001b[0m\n"
+     ]
+    }
+   ],
+   "source": [
+    "# %pip (rather than !pip) installs into the environment of the running kernel\n",
+    "%pip install -q einops==0.7.0 langchain==0.1.9 pymilvus==2.3.6 sentence-transformers==2.4.0\n",
+    "%pip install -q --upgrade transformers\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "1c53e798",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import os\n",
+    "from langchain.embeddings.huggingface import HuggingFaceEmbeddings\n",
+    "from langchain_community.vectorstores import Milvus"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "f0b8ecae",
+   "metadata": {
+    "tags": []
+   },
+   "source": [
+    "### Base parameters, the Milvus connection info"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "id": "9376e567",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [],
+   "source": [
+    "MILVUS_HOST = \"vectordb-milvus.milvus.svc.cluster.local\"\n",
+    "MILVUS_PORT = 19530\n",
+    "MILVUS_USERNAME = os.environ.get(\"MILVUS_USERNAME\")  # None when the variable is not set\n",
+    "MILVUS_PASSWORD = os.environ.get(\"MILVUS_PASSWORD\")  # None when the variable is not set\n",
+    "MILVUS_COLLECTION = \"collection_nomicai_embeddings\""
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "56d51868",
+   "metadata": {},
+   "source": [
+    "### Initialize the connection"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "id": "bbb6a3e3-5ccd-441e-b80d-427555d9e9f6",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "You try to use a model that was created with version 2.4.0.dev0, however, your version is 2.4.0. This might cause unexpected behavior or errors. In that case, try to update to the latest version.\n",
+      "\n",
+      "\n",
+      "\n",
+      "<All keys matched successfully>\n"
+     ]
+    }
+   ],
+   "source": [
+    "# 'device' is left unset so sentence-transformers uses the GPU when one is available and the CPU otherwise\n",
+    "model_kwargs = {'trust_remote_code': True}\n",
+    "embeddings = HuggingFaceEmbeddings(\n",
+    "    model_name=\"nomic-ai/nomic-embed-text-v1\",\n",
+    "    model_kwargs=model_kwargs,\n",
+    "    show_progress=True\n",
+    ")\n",
+    "\n",
+    "store = Milvus(\n",
+    "    embedding_function=embeddings,\n",
+    "    connection_args={\"host\": MILVUS_HOST, \"port\": MILVUS_PORT, \"user\": MILVUS_USERNAME, \"password\": MILVUS_PASSWORD},\n",
+    "    collection_name=MILVUS_COLLECTION,\n",
+    "    metadata_field=\"metadata\",\n",
+    "    text_field=\"page_content\",\n",
+    "    drop_old=False  # reuse the existing collection rather than recreating it\n",
+    "    )"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "9856851c",
+   "metadata": {},
+   "source": [
+    "### Make a query to the index to verify sources"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "id": "9621e231-3541-40bc-85ef-8aa3b2ba2331",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "da82af613881491fa0b11c75381d6c14",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Batches:   0%|          | 0/1 [00:00<?, ?it/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "https://access.redhat.com/documentation/en-us/red_hat_openshift_ai_self-managed/2.13/html-single/working_on_data_science_projects/index\n",
+      "https://access.redhat.com/documentation/en-us/red_hat_openshift_ai_self-managed/2.13/html-single/openshift_ai_tutorial_-_fraud_detection_example/index\n",
+      "https://access.redhat.com/documentation/en-us/red_hat_openshift_ai_self-managed/2.13/html-single/getting_started_with_red_hat_openshift_ai_self-managed/index\n",
+      "https://access.redhat.com/documentation/en-us/red_hat_openshift_ai_self-managed/2.13/html-single/working_on_data_science_projects/index\n"
+     ]
+    }
+   ],
+   "source": [
+    "query = \"How can I create a Data Science Project?\"\n",
+    "results = store.similarity_search_with_score(query, k=4, return_metadata=True)\n",
+    "for doc, _score in results:  # each hit is a (document, score) pair; only the source is shown\n",
+    "    print(doc.metadata['source'])"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "f1005e2c",
+   "metadata": {},
+   "source": [
+    "### Work with a retriever"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "566f9347-a40a-4eeb-a690-e199b91947a3",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [],
+   "source": [
+    "retriever = store.as_retriever(search_type=\"similarity\", search_kwargs=dict(k=4))  # top-4 similarity retriever"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "id": "1c378fbd-395d-43af-8cca-268bc05d0f51",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/opt/app-root/lib64/python3.11/site-packages/langchain_core/_api/deprecation.py:119: LangChainDeprecationWarning: The method `BaseRetriever.get_relevant_documents` was deprecated in langchain-core 0.1.46 and will be removed in 0.3.0. Use invoke instead.\n",
+      "  warn_deprecated(\n"
+     ]
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "26c8cb75f7574c18a59185e533ffedc6",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Batches:   0%|          | 0/1 [00:00<?, ?it/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "text/plain": [
+       "[Document(page_content='CHAPTER 1. USING DATA SCIENCE PROJECTS\\n1.1. CREATING A DATA SCIENCE PROJECT\\nTo implement a data science workflow, you must create a project. In OpenShift, a project is a Kubernetes\\nnamespace with additional annotations, and is the main way that you can manage user access to\\nresources. A project organizes your data science work in one place and also allows you to collaborate\\nwith other developers and data scientists in your organization.\\nWithin a project, you can add the following functionality:\\nData connections so that you can access data without having to hardcode information like\\nendpoints or credentials.\\nWorkbenches for working with and processing data, and for developing models.\\nDeployed models so that you can test them and then integrate them into intelligent\\napplications. Deploying a model makes it available as a service that you can access by using an\\nAPI.\\nPipelines for automating your ML workflow.\\nPrerequisites\\nYou have logged in to Red Hat OpenShift AI.', metadata={'source': 'https://access.redhat.com/documentation/en-us/red_hat_openshift_ai_self-managed/2.13/html-single/working_on_data_science_projects/index', 'page': 7}),\n",
+       " Document(page_content='However, it would be a one-off Jupyter notebook run in isolation. To implement a data science\\nworkflow, you must create a data science project (as described in the following procedure).\\nProjects allow you and your team to organize and collaborate on resources within separated\\nnamespaces. From a project you can create multiple workbenches, each with their own IDE\\nenvironment (for example, JupyterLab), and each with their own data connections and cluster\\nstorage. In addition, the workbenches can share models and data with pipelines and model\\nservers.\\n2\\n. \\nIf you are using the Red Hat Developer Sandbox, you are provided with a default data science\\nproject (for example, \\nmyname-dev\\n). Select it and skip over the next step to the \\nVerification\\nsection.\\nIf you are using your own OpenShift cluster, click \\nCreate data science project\\n.\\n3\\n. \\nEnter a display name and description. Based on the display name, a resource name is\\nautomatically generated, but you can change it if you prefer.\\nVerification', metadata={'source': 'https://access.redhat.com/documentation/en-us/red_hat_openshift_ai_self-managed/2.13/html-single/openshift_ai_tutorial_-_fraud_detection_example/index', 'page': 9}),\n",
+       " Document(page_content='CHAPTER 3. CREATING A DATA SCIENCE PROJECT\\nTo implement a data science workflow, you must create a project. In OpenShift, a project is a Kubernetes\\nnamespace with additional annotations, and is the main way that you can manage user access to\\nresources. A project organizes your data science work in one place and also allows you to collaborate\\nwith other developers and data scientists in your organization.\\nWithin a project, you can add the following functionality:\\nData connections so that you can access data without having to hardcode information like\\nendpoints or credentials.\\nWorkbenches for working with and processing data, and for developing models.\\nDeployed models so that you can test them and then integrate them into intelligent\\napplications. Deploying a model makes it available as a service that you can access by using an\\nAPI.\\nPipelines for automating your ML workflow.\\nPrerequisites\\nYou have logged in to Red Hat OpenShift AI.', metadata={'source': 'https://access.redhat.com/documentation/en-us/red_hat_openshift_ai_self-managed/2.13/html-single/getting_started_with_red_hat_openshift_ai_self-managed/index', 'page': 9}),\n",
+       " Document(page_content='PREFACE\\nAs a data scientist, you can organize your data science work into a single project. A data science project\\nin OpenShift AI can consist of the following components:\\nWorkbenches\\nCreating a workbench allows you to add a Jupyter notebook to your project.\\nCluster storage\\nFor data science projects that require data retention, you can add cluster storage to the project.\\nData connections\\nAdding a data connection to your project allows you to connect data inputs to your workbenches.\\nPipelines\\nStandardize and automate machine learning workflows to enable you to further enhance and deploy\\nyour data science models.\\nModels and model servers\\nDeploy a trained data science model to serve intelligent applications. Your model is deployed with an\\nendpoint that allows applications to send requests to the model.\\nPREFACE\\n3', metadata={'source': 'https://access.redhat.com/documentation/en-us/red_hat_openshift_ai_self-managed/2.13/html-single/working_on_data_science_projects/index', 'page': 6})]"
+      ]
+     },
+     "execution_count": 7,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "docs = retriever.invoke(query)  # invoke() replaces the deprecated get_relevant_documents()\n",
+    "docs"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "00308570-179b-4112-a1df-81c276d1b513",
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3.9",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.9.18"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git a/lab-materials/04-rag/5.3-simple-rag.ipynb b/lab-materials/04-rag/5.3-simple-rag.ipynb
new file mode 100644
index 0000000..dab2247
--- /dev/null
+++ b/lab-materials/04-rag/5.3-simple-rag.ipynb
@@ -0,0 +1,371 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "2a331fd6",
+   "metadata": {},
+   "source": [
+    "## RAG example with LangChain, Milvus, and vLLM\n",
+    "\n",
+    "Requirements:\n",
+    "- A Milvus instance, either standalone or cluster.\n",
+    "- Connection credentials to Milvus must be available as environment variables: MILVUS_USERNAME and MILVUS_PASSWORD.\n",
+    "- A vLLM inference endpoint. In this example we use the OpenAI Compatible API; its API key must be available as the environment variable API_KEY."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "e712b3e8-f406-4387-9188-3e2f20a6841f",
+   "metadata": {},
+   "source": [
+    "### Needed packages and imports"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "d4a359bd-4f69-4e88-82c0-5763c26aa0af",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m A new release of pip is available: \u001b[0m\u001b[31;49m23.2.1\u001b[0m\u001b[39;49m -> \u001b[0m\u001b[32;49m24.2\u001b[0m\n",
+      "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m To update, run: \u001b[0m\u001b[32;49mpip install --upgrade pip\u001b[0m\n"
+     ]
+    }
+   ],
+   "source": [
+    "%pip install -q einops==0.7.0 langchain==0.1.9 pymilvus==2.3.6\n",
+    "#!pip install -q einops==0.7.0 langchain==0.1.9 pymilvus==2.3.6 openai==1.13.3\n",
+    "#!pip install einops==0.7.0 langchain==0.1.9 pymilvus==2.3.6 sentence-transformers==2.4.0 openai==1.13.3\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "83e11d23-c0ad-4875-b67f-149fc8b14725",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [],
+   "source": [
+    "import os\n",
+    "from langchain.callbacks.base import BaseCallbackHandler\n",
+    "from langchain.chains import RetrievalQA\n",
+    "from langchain.embeddings.huggingface import HuggingFaceEmbeddings\n",
+    "from langchain.callbacks.streaming_stdout import StreamingStdOutCallbackHandler\n",
+    "from langchain_community.llms import VLLMOpenAI\n",
+    "from langchain.prompts import PromptTemplate\n",
+    "from langchain_community.vectorstores import Milvus"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "9cd4537b",
+   "metadata": {},
+   "source": [
+    "#### Base parameters, Inference server and Milvus info"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "id": "51baf1a6-4111-4b40-b43a-833438bdc222",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [],
+   "source": [
+    "# Replace values according to your inference server and Milvus deployment\n",
+    "INFERENCE_SERVER_URL = \"https://mistral-7b-instruct-v0-3-maas-apicast-production.apps.prod.rhoai.rh-aiservices-bu.com:443/v1\"\n",
+    "MODEL_NAME = \"mistral-7b-instruct\"\n",
+    "API_KEY= os.getenv('API_KEY')\n",
+    "#API_KEY= \"Empty\"\n",
+    "MAX_TOKENS=1024\n",
+    "TOP_P=0.95\n",
+    "TEMPERATURE=0.01\n",
+    "PRESENCE_PENALTY=1.03\n",
+    "MILVUS_HOST = \"vectordb-milvus.milvus.svc.cluster.local\"\n",
+    "MILVUS_PORT = 19530\n",
+    "MILVUS_USERNAME = os.getenv('MILVUS_USERNAME')\n",
+    "MILVUS_PASSWORD = os.getenv('MILVUS_PASSWORD')\n",
+    "MILVUS_COLLECTION = \"collection_nomicai_embeddings\""
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "fe4c1b1a",
+   "metadata": {},
+   "source": [
+    "#### Initialize the connection"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "id": "bbb6a3e3-5ccd-441e-b80d-427555d9e9f6",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "You try to use a model that was created with version 2.4.0.dev0, however, your version is 2.4.0. This might cause unexpected behavior or errors. In that case, try to update to the latest version.\n",
+      "\n",
+      "\n",
+      "\n",
+      "<All keys matched successfully>\n"
+     ]
+    }
+   ],
+   "source": [
+    "model_kwargs = {'trust_remote_code': True}\n",
+    "embeddings = HuggingFaceEmbeddings(\n",
+    "    model_name=\"nomic-ai/nomic-embed-text-v1\",\n",
+    "    model_kwargs=model_kwargs,\n",
+    "    show_progress=False\n",
+    ")\n",
+    "\n",
+    "store = Milvus(\n",
+    "    embedding_function=embeddings,\n",
+    "    connection_args={\"host\": MILVUS_HOST, \"port\": MILVUS_PORT, \"user\": MILVUS_USERNAME, \"password\": MILVUS_PASSWORD},\n",
+    "    collection_name=MILVUS_COLLECTION,\n",
+    "    metadata_field=\"metadata\",\n",
+    "    text_field=\"page_content\",\n",
+    "    drop_old=False\n",
+    "    )"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "b72a3a2b",
+   "metadata": {},
+   "source": [
+    "#### Initialize query chain"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "id": "ed8fd396-0798-45c5-8969-6b6ede134c77",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [],
+   "source": [
+    "template=\"\"\"<s>[INST] <<SYS>>\n",
+    "You are a helpful, respectful and honest assistant named HatBot answering questions.\n",
+    "You will be given a question you need to answer, and a context to provide you with information. You must answer the question based as much as possible on this context.\n",
+    "Always answer as helpfully as possible, while being safe. Your answers should not include any harmful, unethical, racist, sexist, toxic, dangerous, or illegal content. Please ensure that your responses are socially unbiased and positive in nature.\n",
+    "\n",
+    "If a question does not make any sense, or is not factually coherent, explain why instead of answering something not correct. If you don't know the answer to a question, please don't share false information.\n",
+    "<</SYS>>\n",
+    "\n",
+    "Context: \n",
+    "{context}\n",
+    "\n",
+    "Question: {question} [/INST]\n",
+    "\"\"\"\n",
+    "\n",
+    "QA_CHAIN_PROMPT = PromptTemplate.from_template(template)\n",
+    "\n",
+    "llm = VLLMOpenAI(  # class imported in the imports cell (langchain_community.llms)\n",
+    "    openai_api_key=API_KEY,\n",
+    "    openai_api_base=INFERENCE_SERVER_URL,\n",
+    "    model_name=MODEL_NAME,\n",
+    "    max_tokens=MAX_TOKENS,\n",
+    "    top_p=TOP_P,\n",
+    "    temperature=TEMPERATURE,\n",
+    "    presence_penalty=PRESENCE_PENALTY,\n",
+    "    streaming=True,\n",
+    "    verbose=False,\n",
+    "    callbacks=[StreamingStdOutCallbackHandler()]  # print tokens to stdout as they stream in\n",
+    ")\n",
+    "\n",
+    "qa_chain = RetrievalQA.from_chain_type(\n",
+    "        llm,\n",
+    "        retriever=store.as_retriever(\n",
+    "            search_type=\"similarity\",\n",
+    "            search_kwargs={\"k\": 4}\n",
+    "            ),\n",
+    "        chain_type_kwargs={\"prompt\": QA_CHAIN_PROMPT},\n",
+    "        return_source_documents=True\n",
+    "        )\n",
+    "\n",
+    "os.environ[\"TOKENIZERS_PARALLELISM\"] = \"false\""
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "7db84a77-ead5-43d8-9372-1e58e64830d2",
+   "metadata": {},
+   "source": [
+    "### Query the LLM without RAG"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "16a30bbb-47c5-45ee-a1fc-84c5f65fc516",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "An accelerator profile is a setting in some software applications or devices that can enhance the performance of the system. The specific steps to use an accelerator profile may vary depending on the software or device you're using. Here's a general idea of how you might use one:\n",
+      "\n",
+      "1. Locate the settings or preferences menu within your software or device. This is usually found in the main menu or under the gear icon.\n",
+      "\n",
+      "2. Look for a section labeled \"Performance,\" \"Performance Settings,\" or something similar.\n",
+      "\n",
+      "3. In this section, you should find options for different performance profiles. These might be labeled as \"Balanced,\" \"High Performance,\" \"Ultra,\" etc.\n",
+      "\n",
+      "4. Select the \"High Performance\" or \"Ultra\" option to enable the accelerator profile. This will typically increase the speed and responsiveness of your software or device, but may also consume more resources and potentially drain battery life faster.\n",
+      "\n",
+      "5. Save your changes and test the performance of your software or device to see if it meets your needs. If not, you can always switch back to a different profile or adjust other settings as needed."
+     ]
+    }
+   ],
+   "source": [
+    "from langchain.chains import ConversationChain\n",
+    "from langchain.memory import ConversationBufferMemory\n",
+    "from langchain_community.llms import VLLMOpenAI\n",
+    "from langchain.callbacks.streaming_stdout import StreamingStdOutCallbackHandler\n",
+    "from langchain.prompts import PromptTemplate\n",
+    "\n",
+    "template=\"\"\"<s>[INST] <<SYS>>\n",
+    "You are a helpful, respectful and honest assistant. Always be as helpful as possible, while being safe. Your answers should not include any harmful, unethical, racist, sexist, toxic, dangerous, or illegal content. Please ensure that your responses are socially unbiased and positive in nature.\n",
+    "\n",
+    "If a question does not make any sense, or is not factually coherent, explain why instead of answering something not correct. If you don't know the answer to a question, please don't share false information.\n",
+    "<</SYS>>\n",
+    "\n",
+    "Current conversation:\n",
+    "{history}\n",
+    "Human: {input}\n",
+    "AI:\n",
+    "[/INST]\n",
+    "\"\"\"\n",
+    "PROMPT = PromptTemplate(input_variables=[\"history\", \"input\"], template=template)\n",
+    "\n",
+    "memory=ConversationBufferMemory()\n",
+    "\n",
+    "conversation = ConversationChain(llm=llm,\n",
+    "                                 prompt=PROMPT,\n",
+    "                                 verbose=False,\n",
+    "                                 memory=memory\n",
+    "                                )\n",
+    "\n",
+    "question = \"How can I use an accelerator profile?\"\n",
+    "conversation.predict(input=question);"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "3a45ad23",
+   "metadata": {},
+   "source": [
+    "### Query example with RAG"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "id": "105d2fd1-f36c-409d-8e52-ec6d23a56ad1",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "To use an accelerator profile in OpenShift AI, you need to follow these steps:\n",
+      "\n",
+      "1. First, ensure that your OpenShift instance contains an associated accelerator. If it's a new accelerator, you'll need to configure an accelerator profile for the accelerator in context. You can create an accelerator profile from the \"Settings\" page on the OpenShift AI dashboard, under the \"Accelerator profiles\" section.\n",
+      "\n",
+      "2. If you have upgraded your OpenShift AI to version 2.13 or later and your instance already has an accelerator, its accelerator profile will be preserved after the upgrade. No additional action is required for existing accelerators.\n",
+      "\n",
+      "3. For Intel Gaudi AI accelerators, you'll need to install the necessary dependencies and the version of the HabanaAI Operator that matches the Habana version of the HabanaAI workbench image in your deployment. You can find more information about this process in the resources provided: \"HabanaAI Operator v1.10 for OpenShift\" and \"HabanaAI Operator v1.13 for OpenShift\".\n",
+      "\n",
+      "4. Once you have the necessary prerequisites in place, you can enable and use the Intel Gaudi AI accelerators in your OpenShift AI environment. The specific steps for this may vary depending on whether you are using the accelerators on-premises or with AWS DL1 compute nodes on an AWS instance."
+     ]
+    }
+   ],
+   "source": [
+    "question = \"How can I use an accelerator profile?\"\n",
+    "result = qa_chain.invoke({\"query\": question})\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "97d75d0c",
+   "metadata": {},
+   "source": [
+    "#### Retrieve sources"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "id": "acda357e-558a-4879-8ad8-21f0567f2f2e",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "https://access.redhat.com/documentation/en-us/red_hat_openshift_ai_self-managed/2.13/html-single/managing_resources/index\n",
+      "https://access.redhat.com/documentation/en-us/red_hat_openshift_ai_self-managed/2.13/html-single/upgrading_openshift_ai_self-managed_in_a_disconnected_environment/index\n",
+      "https://access.redhat.com/documentation/en-us/red_hat_openshift_ai_self-managed/2.13/html-single/installing_and_uninstalling_openshift_ai_self-managed_in_a_disconnected_environment/index\n"
+     ]
+    }
+   ],
+   "source": [
+    "def remove_duplicates(input_list):\n",
+    "    \"\"\"Return each document's metadata['source'] once, in first-seen order.\"\"\"\n",
+    "    # dict.fromkeys drops repeats while preserving insertion order, with O(1)\n",
+    "    # lookups instead of rescanning a list for every document.\n",
+    "    sources = (item.metadata['source'] for item in input_list)\n",
+    "    return list(dict.fromkeys(sources))\n",
+    "\n",
+    "results = remove_duplicates(result['source_documents'])\n",
+    "\n",
+    "for s in results:\n",
+    "    print(s)"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3.9",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.9.18"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}