diff --git a/.env b/.env new file mode 100644 index 0000000..e570b8b --- /dev/null +++ b/.env @@ -0,0 +1 @@ +OPENAI_API_KEY= diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..5e49e1a Binary files /dev/null and b/.gitignore differ diff --git a/your-code/chroma_db_LAB/chroma.sqlite3 b/your-code/chroma_db_LAB/chroma.sqlite3 new file mode 100644 index 0000000..57f25c9 Binary files /dev/null and b/your-code/chroma_db_LAB/chroma.sqlite3 differ diff --git a/your-code/chroma_db_lesson/chroma.sqlite3 b/your-code/chroma_db_lesson/chroma.sqlite3 new file mode 100644 index 0000000..1626eb2 Binary files /dev/null and b/your-code/chroma_db_lesson/chroma.sqlite3 differ diff --git a/your-code/chroma_db_lesson/f161f97d-9874-4aad-a7a9-8cd3f2994fa3/data_level0.bin b/your-code/chroma_db_lesson/f161f97d-9874-4aad-a7a9-8cd3f2994fa3/data_level0.bin new file mode 100644 index 0000000..eb69439 Binary files /dev/null and b/your-code/chroma_db_lesson/f161f97d-9874-4aad-a7a9-8cd3f2994fa3/data_level0.bin differ diff --git a/your-code/chroma_db_lesson/f161f97d-9874-4aad-a7a9-8cd3f2994fa3/header.bin b/your-code/chroma_db_lesson/f161f97d-9874-4aad-a7a9-8cd3f2994fa3/header.bin new file mode 100644 index 0000000..b04cf10 Binary files /dev/null and b/your-code/chroma_db_lesson/f161f97d-9874-4aad-a7a9-8cd3f2994fa3/header.bin differ diff --git a/your-code/chroma_db_lesson/f161f97d-9874-4aad-a7a9-8cd3f2994fa3/index_metadata.pickle b/your-code/chroma_db_lesson/f161f97d-9874-4aad-a7a9-8cd3f2994fa3/index_metadata.pickle new file mode 100644 index 0000000..0ce2275 Binary files /dev/null and b/your-code/chroma_db_lesson/f161f97d-9874-4aad-a7a9-8cd3f2994fa3/index_metadata.pickle differ diff --git a/your-code/chroma_db_lesson/f161f97d-9874-4aad-a7a9-8cd3f2994fa3/length.bin b/your-code/chroma_db_lesson/f161f97d-9874-4aad-a7a9-8cd3f2994fa3/length.bin new file mode 100644 index 0000000..243ad1f Binary files /dev/null and b/your-code/chroma_db_lesson/f161f97d-9874-4aad-a7a9-8cd3f2994fa3/length.bin differ diff --git a/your-code/chroma_db_lesson/f161f97d-9874-4aad-a7a9-8cd3f2994fa3/link_lists.bin b/your-code/chroma_db_lesson/f161f97d-9874-4aad-a7a9-8cd3f2994fa3/link_lists.bin new file mode 100644 index 0000000..dd64b1f Binary files /dev/null and b/your-code/chroma_db_lesson/f161f97d-9874-4aad-a7a9-8cd3f2994fa3/link_lists.bin differ diff --git a/your-code/main.ipynb b/your-code/main.ipynb index e3a225a..33c5207 100644 --- a/your-code/main.ipynb +++ b/your-code/main.ipynb @@ -59,9 +59,178 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 1, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Requirement already satisfied: langchain in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (1.2.6)\n", + "Requirement already satisfied: langchain_community in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (0.4.1)\n", + "Requirement already satisfied: pypdf in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (6.6.0)\n", + "Requirement already satisfied: langchain-core<2.0.0,>=1.2.7 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain) (1.2.7)\n", + "Requirement already satisfied: langgraph<1.1.0,>=1.0.2 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain) (1.0.7)\n", + "Requirement already satisfied: pydantic<3.0.0,>=2.7.4 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain) (2.10.3)\n", + "Requirement already satisfied: jsonpatch<2.0.0,>=1.33.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain-core<2.0.0,>=1.2.7->langchain) (1.33)\n", + "Requirement already satisfied: langsmith<1.0.0,>=0.3.45 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain-core<2.0.0,>=1.2.7->langchain) (0.6.4)\n", + "Requirement already satisfied: packaging<26.0.0,>=23.2.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain-core<2.0.0,>=1.2.7->langchain) (24.2)\n", + "Requirement already satisfied: pyyaml<7.0.0,>=5.3.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain-core<2.0.0,>=1.2.7->langchain) (6.0.2)\n", + "Requirement already satisfied: tenacity!=8.4.0,<10.0.0,>=8.1.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain-core<2.0.0,>=1.2.7->langchain) (9.0.0)\n", + "Requirement already satisfied: typing-extensions<5.0.0,>=4.7.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain-core<2.0.0,>=1.2.7->langchain) (4.12.2)\n", + "Requirement already satisfied: uuid-utils<1.0,>=0.12.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain-core<2.0.0,>=1.2.7->langchain) (0.14.0)\n", + "Requirement already satisfied: jsonpointer>=1.9 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from jsonpatch<2.0.0,>=1.33.0->langchain-core<2.0.0,>=1.2.7->langchain) (2.1)\n", + "Requirement already satisfied: langgraph-checkpoint<5.0.0,>=2.1.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langgraph<1.1.0,>=1.0.2->langchain) (4.0.0)\n", + "Requirement already satisfied: langgraph-prebuilt<1.1.0,>=1.0.7 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langgraph<1.1.0,>=1.0.2->langchain) (1.0.7)\n", + "Requirement already satisfied: langgraph-sdk<0.4.0,>=0.3.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langgraph<1.1.0,>=1.0.2->langchain) (0.3.3)\n", + "Requirement already satisfied: xxhash>=3.5.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langgraph<1.1.0,>=1.0.2->langchain) (3.6.0)\n", + "Requirement already satisfied: ormsgpack>=1.12.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langgraph-checkpoint<5.0.0,>=2.1.0->langgraph<1.1.0,>=1.0.2->langchain) (1.12.2)\n", + "Requirement already satisfied: httpx>=0.25.2 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langgraph-sdk<0.4.0,>=0.3.0->langgraph<1.1.0,>=1.0.2->langchain) (0.28.1)\n", + "Requirement already satisfied: orjson>=3.10.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langgraph-sdk<0.4.0,>=0.3.0->langgraph<1.1.0,>=1.0.2->langchain) (3.11.5)\n", + "Requirement already satisfied: requests-toolbelt>=1.0.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langsmith<1.0.0,>=0.3.45->langchain-core<2.0.0,>=1.2.7->langchain) (1.0.0)\n", + "Requirement already satisfied: requests>=2.0.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langsmith<1.0.0,>=0.3.45->langchain-core<2.0.0,>=1.2.7->langchain) (2.32.5)\n", + "Requirement already satisfied: zstandard>=0.23.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langsmith<1.0.0,>=0.3.45->langchain-core<2.0.0,>=1.2.7->langchain) (0.23.0)\n", + "Requirement already satisfied: anyio in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from httpx>=0.25.2->langgraph-sdk<0.4.0,>=0.3.0->langgraph<1.1.0,>=1.0.2->langchain) (4.7.0)\n", + "Requirement already satisfied: certifi in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from httpx>=0.25.2->langgraph-sdk<0.4.0,>=0.3.0->langgraph<1.1.0,>=1.0.2->langchain) (2025.7.14)\n", + "Requirement already satisfied: httpcore==1.* in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from httpx>=0.25.2->langgraph-sdk<0.4.0,>=0.3.0->langgraph<1.1.0,>=1.0.2->langchain) (1.0.9)\n", + "Requirement already satisfied: idna in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from httpx>=0.25.2->langgraph-sdk<0.4.0,>=0.3.0->langgraph<1.1.0,>=1.0.2->langchain) (3.7)\n", + "Requirement already satisfied: h11>=0.16 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from httpcore==1.*->httpx>=0.25.2->langgraph-sdk<0.4.0,>=0.3.0->langgraph<1.1.0,>=1.0.2->langchain) (0.16.0)\n", + "Requirement already satisfied: annotated-types>=0.6.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from pydantic<3.0.0,>=2.7.4->langchain) (0.6.0)\n", + "Requirement already satisfied: pydantic-core==2.27.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from pydantic<3.0.0,>=2.7.4->langchain) (2.27.1)\n", + "Requirement already satisfied: langchain-classic<2.0.0,>=1.0.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain_community) (1.0.1)\n", + "Requirement already satisfied: SQLAlchemy<3.0.0,>=1.4.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain_community) (2.0.39)\n", + "Requirement already satisfied: aiohttp<4.0.0,>=3.8.3 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain_community) (3.11.10)\n", + "Requirement already satisfied: dataclasses-json<0.7.0,>=0.6.7 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain_community) (0.6.7)\n", + "Requirement already satisfied: pydantic-settings<3.0.0,>=2.10.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain_community) (2.12.0)\n", + "Requirement already satisfied: httpx-sse<1.0.0,>=0.4.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain_community) (0.4.3)\n", + "Requirement already satisfied: numpy>=2.1.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain_community) (2.1.3)\n", + "Requirement already satisfied: aiohappyeyeballs>=2.3.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from aiohttp<4.0.0,>=3.8.3->langchain_community) (2.4.4)\n", + "Requirement already satisfied: aiosignal>=1.1.2 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from aiohttp<4.0.0,>=3.8.3->langchain_community) (1.2.0)\n", + "Requirement already satisfied: attrs>=17.3.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from aiohttp<4.0.0,>=3.8.3->langchain_community) (24.3.0)\n", + "Requirement already satisfied: frozenlist>=1.1.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from aiohttp<4.0.0,>=3.8.3->langchain_community) (1.5.0)\n", + "Requirement already satisfied: multidict<7.0,>=4.5 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from aiohttp<4.0.0,>=3.8.3->langchain_community) (6.1.0)\n", + "Requirement already satisfied: propcache>=0.2.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from aiohttp<4.0.0,>=3.8.3->langchain_community) (0.3.1)\n", + "Requirement already satisfied: yarl<2.0,>=1.17.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from aiohttp<4.0.0,>=3.8.3->langchain_community) (1.18.0)\n", + "Requirement already satisfied: marshmallow<4.0.0,>=3.18.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from dataclasses-json<0.7.0,>=0.6.7->langchain_community) (3.26.2)\n", + "Requirement already satisfied: typing-inspect<1,>=0.4.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from dataclasses-json<0.7.0,>=0.6.7->langchain_community) (0.9.0)\n", + "Requirement already satisfied: langchain-text-splitters<2.0.0,>=1.1.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain-classic<2.0.0,>=1.0.0->langchain_community) (1.1.0)\n", + "Requirement already satisfied: python-dotenv>=0.21.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from pydantic-settings<3.0.0,>=2.10.1->langchain_community) (1.1.0)\n", + "Requirement already satisfied: typing-inspection>=0.4.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from pydantic-settings<3.0.0,>=2.10.1->langchain_community) (0.4.2)\n", + "Requirement already satisfied: charset_normalizer<4,>=2 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from requests>=2.0.0->langsmith<1.0.0,>=0.3.45->langchain-core<2.0.0,>=1.2.7->langchain) (3.3.2)\n", + "Requirement already satisfied: urllib3<3,>=1.21.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from requests>=2.0.0->langsmith<1.0.0,>=0.3.45->langchain-core<2.0.0,>=1.2.7->langchain) (2.3.0)\n", + "Requirement already satisfied: greenlet!=0.4.17 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from SQLAlchemy<3.0.0,>=1.4.0->langchain_community) (3.1.1)\n", + "Requirement already satisfied: mypy-extensions>=0.3.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from typing-inspect<1,>=0.4.0->dataclasses-json<0.7.0,>=0.6.7->langchain_community) (1.0.0)\n", + "Requirement already satisfied: sniffio>=1.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from anyio->httpx>=0.25.2->langgraph-sdk<0.4.0,>=0.3.0->langgraph<1.1.0,>=1.0.2->langchain) (1.3.0)\n", + "Note: you may need to restart the kernel to use updated packages.\n", + "Requirement already satisfied: termcolor in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (3.3.0)\n", + "Requirement already satisfied: langchain_openai in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (1.1.7)\n", + "Requirement already satisfied: langchain-huggingface in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (1.2.0)\n", + "Requirement already satisfied: sentence-transformers in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (5.2.0)\n", + "Requirement already satisfied: chromadb in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (1.4.1)\n", + "Requirement already satisfied: langchain_chroma in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (1.1.0)\n", + "Requirement already satisfied: tiktoken in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (0.12.0)\n", + "Requirement already satisfied: openai in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (2.15.0)\n", + "Requirement already satisfied: python-dotenv in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (1.1.0)\n", + "Requirement already satisfied: langchain-core<2.0.0,>=1.2.6 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain_openai) (1.2.7)\n", + "Requirement already satisfied: regex>=2022.1.18 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from tiktoken) (2024.11.6)\n", + "Requirement already satisfied: requests>=2.26.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from tiktoken) (2.32.5)\n", + "Requirement already satisfied: anyio<5,>=3.5.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from openai) (4.7.0)\n", + "Requirement already satisfied: distro<2,>=1.7.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from openai) (1.9.0)\n", + "Requirement already satisfied: httpx<1,>=0.23.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from openai) (0.28.1)\n", + "Requirement already satisfied: jiter<1,>=0.10.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from openai) (0.12.0)\n", + "Requirement already satisfied: pydantic<3,>=1.9.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from openai) (2.10.3)\n", + "Requirement already satisfied: sniffio in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from openai) (1.3.0)\n", + "Requirement already satisfied: tqdm>4 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from openai) (4.67.1)\n", + "Requirement already satisfied: typing-extensions<5,>=4.11 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from openai) (4.12.2)\n", + "Requirement already satisfied: idna>=2.8 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from anyio<5,>=3.5.0->openai) (3.7)\n", + "Requirement already satisfied: certifi in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from httpx<1,>=0.23.0->openai) (2025.7.14)\n", + "Requirement already satisfied: httpcore==1.* in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from httpx<1,>=0.23.0->openai) (1.0.9)\n", + "Requirement already satisfied: h11>=0.16 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from httpcore==1.*->httpx<1,>=0.23.0->openai) (0.16.0)\n", + "Requirement already satisfied: jsonpatch<2.0.0,>=1.33.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain-core<2.0.0,>=1.2.6->langchain_openai) (1.33)\n", + "Requirement already satisfied: langsmith<1.0.0,>=0.3.45 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain-core<2.0.0,>=1.2.6->langchain_openai) (0.6.4)\n", + "Requirement already satisfied: packaging<26.0.0,>=23.2.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain-core<2.0.0,>=1.2.6->langchain_openai) (24.2)\n", + "Requirement already satisfied: pyyaml<7.0.0,>=5.3.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain-core<2.0.0,>=1.2.6->langchain_openai) (6.0.2)\n", + "Requirement already satisfied: tenacity!=8.4.0,<10.0.0,>=8.1.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain-core<2.0.0,>=1.2.6->langchain_openai) (9.0.0)\n", + "Requirement already satisfied: uuid-utils<1.0,>=0.12.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain-core<2.0.0,>=1.2.6->langchain_openai) (0.14.0)\n", + "Requirement already satisfied: jsonpointer>=1.9 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from jsonpatch<2.0.0,>=1.33.0->langchain-core<2.0.0,>=1.2.6->langchain_openai) (2.1)\n", + "Requirement already satisfied: orjson>=3.9.14 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langsmith<1.0.0,>=0.3.45->langchain-core<2.0.0,>=1.2.6->langchain_openai) (3.11.5)\n", + "Requirement already satisfied: requests-toolbelt>=1.0.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langsmith<1.0.0,>=0.3.45->langchain-core<2.0.0,>=1.2.6->langchain_openai) (1.0.0)\n", + "Requirement already satisfied: zstandard>=0.23.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langsmith<1.0.0,>=0.3.45->langchain-core<2.0.0,>=1.2.6->langchain_openai) (0.23.0)\n", + "Requirement already satisfied: annotated-types>=0.6.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from pydantic<3,>=1.9.0->openai) (0.6.0)\n", + "Requirement already satisfied: pydantic-core==2.27.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from pydantic<3,>=1.9.0->openai) (2.27.1)\n", + "Requirement already satisfied: huggingface-hub<1.0.0,>=0.33.4 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain-huggingface) (0.36.0)\n", + "Requirement already satisfied: tokenizers<1.0.0,>=0.19.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from langchain-huggingface) (0.22.2)\n", + "Requirement already satisfied: filelock in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from huggingface-hub<1.0.0,>=0.33.4->langchain-huggingface) (3.17.0)\n", + "Requirement already satisfied: fsspec>=2023.5.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from huggingface-hub<1.0.0,>=0.33.4->langchain-huggingface) (2025.3.2)\n", + "Requirement already satisfied: transformers<6.0.0,>=4.41.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from sentence-transformers) (4.57.6)\n", + "Requirement already satisfied: torch>=1.11.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from sentence-transformers) (2.10.0)\n", + "Requirement already satisfied: scikit-learn in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from sentence-transformers) (1.6.1)\n", + "Requirement already satisfied: scipy in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from sentence-transformers) (1.15.3)\n", + "Requirement already satisfied: numpy>=1.17 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from transformers<6.0.0,>=4.41.0->sentence-transformers) (2.1.3)\n", + "Requirement already satisfied: safetensors>=0.4.3 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from transformers<6.0.0,>=4.41.0->sentence-transformers) (0.7.0)\n", + "Requirement already satisfied: build>=1.0.3 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from chromadb) (1.4.0)\n", + "Requirement already satisfied: pybase64>=1.4.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from chromadb) (1.4.3)\n", + "Requirement already satisfied: uvicorn>=0.18.3 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from uvicorn[standard]>=0.18.3->chromadb) (0.40.0)\n", + "Requirement already satisfied: posthog<6.0.0,>=2.4.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from chromadb) (5.4.0)\n", + "Requirement already satisfied: onnxruntime>=1.14.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from chromadb) (1.23.2)\n", + "Requirement already satisfied: opentelemetry-api>=1.2.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from chromadb) (1.39.1)\n", + "Requirement already satisfied: opentelemetry-exporter-otlp-proto-grpc>=1.2.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from chromadb) (1.39.1)\n", + "Requirement already satisfied: opentelemetry-sdk>=1.2.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from chromadb) (1.39.1)\n", + "Requirement already satisfied: pypika>=0.48.9 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from chromadb) (0.50.0)\n", + "Requirement already satisfied: overrides>=7.3.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from chromadb) (7.4.0)\n", + "Requirement already satisfied: importlib-resources in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from chromadb) (6.5.2)\n", + "Requirement already satisfied: grpcio>=1.58.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from chromadb) (1.76.0)\n", + "Requirement already satisfied: bcrypt>=4.0.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from chromadb) (4.3.0)\n", + "Requirement already satisfied: typer>=0.9.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from chromadb) (0.9.0)\n", + "Requirement already satisfied: kubernetes>=28.1.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from chromadb) (35.0.0)\n", + "Requirement already satisfied: mmh3>=4.0.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from chromadb) (5.2.0)\n", + "Requirement already satisfied: rich>=10.11.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from chromadb) (13.9.4)\n", + "Requirement already satisfied: jsonschema>=4.19.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from chromadb) (4.23.0)\n", + "Requirement already satisfied: six>=1.5 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from posthog<6.0.0,>=2.4.0->chromadb) (1.17.0)\n", + "Requirement already satisfied: python-dateutil>=2.2 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from posthog<6.0.0,>=2.4.0->chromadb) (2.9.0.post0)\n", + "Requirement already satisfied: backoff>=1.10.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from posthog<6.0.0,>=2.4.0->chromadb) (2.2.1)\n", + "Requirement already satisfied: charset_normalizer<4,>=2 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from requests>=2.26.0->tiktoken) (3.3.2)\n", + "Requirement already satisfied: urllib3<3,>=1.21.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from requests>=2.26.0->tiktoken) (2.3.0)\n", + "Requirement already satisfied: pyproject_hooks in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from build>=1.0.3->chromadb) (1.2.0)\n", + "Requirement already satisfied: colorama in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from build>=1.0.3->chromadb) (0.4.6)\n", + "Requirement already satisfied: attrs>=22.2.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from jsonschema>=4.19.0->chromadb) (24.3.0)\n", + "Requirement already satisfied: jsonschema-specifications>=2023.03.6 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from jsonschema>=4.19.0->chromadb) (2023.7.1)\n", + "Requirement already satisfied: referencing>=0.28.4 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from jsonschema>=4.19.0->chromadb) (0.30.2)\n", + "Requirement already satisfied: rpds-py>=0.7.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from jsonschema>=4.19.0->chromadb) (0.22.3)\n", + "Requirement already satisfied: websocket-client!=0.40.0,!=0.41.*,!=0.42.*,>=0.32.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from kubernetes>=28.1.0->chromadb) (1.8.0)\n", + "Requirement already satisfied: requests-oauthlib in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from kubernetes>=28.1.0->chromadb) (2.0.0)\n", + "Requirement already satisfied: durationpy>=0.7 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from kubernetes>=28.1.0->chromadb) (0.10)\n", + "Requirement already satisfied: coloredlogs in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from onnxruntime>=1.14.1->chromadb) (15.0.1)\n", + "Requirement already satisfied: flatbuffers in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from onnxruntime>=1.14.1->chromadb) (25.12.19)\n", + "Requirement already satisfied: protobuf in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from onnxruntime>=1.14.1->chromadb) (5.29.3)\n", + "Requirement already satisfied: sympy in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from onnxruntime>=1.14.1->chromadb) (1.13.3)\n", + "Requirement already satisfied: importlib-metadata<8.8.0,>=6.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from opentelemetry-api>=1.2.0->chromadb) (8.5.0)\n", + "Requirement already satisfied: zipp>=3.20 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from importlib-metadata<8.8.0,>=6.0->opentelemetry-api>=1.2.0->chromadb) (3.21.0)\n", + "Requirement already satisfied: googleapis-common-protos~=1.57 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from opentelemetry-exporter-otlp-proto-grpc>=1.2.0->chromadb) (1.72.0)\n", + "Requirement already satisfied: opentelemetry-exporter-otlp-proto-common==1.39.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from opentelemetry-exporter-otlp-proto-grpc>=1.2.0->chromadb) (1.39.1)\n", + "Requirement already satisfied: opentelemetry-proto==1.39.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from opentelemetry-exporter-otlp-proto-grpc>=1.2.0->chromadb) (1.39.1)\n", + "Requirement already satisfied: opentelemetry-semantic-conventions==0.60b1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from opentelemetry-sdk>=1.2.0->chromadb) (0.60b1)\n", + "Requirement already satisfied: markdown-it-py>=2.2.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from rich>=10.11.0->chromadb) (2.2.0)\n", + "Requirement already satisfied: pygments<3.0.0,>=2.13.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from rich>=10.11.0->chromadb) (2.19.1)\n", + "Requirement already satisfied: mdurl~=0.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from markdown-it-py>=2.2.0->rich>=10.11.0->chromadb) (0.1.0)\n", + "Requirement already satisfied: networkx>=2.5.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from torch>=1.11.0->sentence-transformers) (3.4.2)\n", + "Requirement already satisfied: jinja2 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from torch>=1.11.0->sentence-transformers) (3.1.6)\n", + "Requirement already satisfied: setuptools in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from torch>=1.11.0->sentence-transformers) (72.1.0)\n", + "Requirement already satisfied: mpmath<1.4,>=1.1.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from sympy->onnxruntime>=1.14.1->chromadb) (1.3.0)\n", + "Requirement already satisfied: click<9.0.0,>=7.1.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from typer>=0.9.0->chromadb) (8.1.8)\n", + "Requirement already satisfied: httptools>=0.6.3 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from uvicorn[standard]>=0.18.3->chromadb) (0.7.1)\n", + "Requirement already satisfied: watchfiles>=0.13 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from uvicorn[standard]>=0.18.3->chromadb) (1.1.1)\n", + "Requirement already satisfied: websockets>=10.4 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from uvicorn[standard]>=0.18.3->chromadb) (16.0)\n", + "Requirement already satisfied: humanfriendly>=9.1 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from coloredlogs->onnxruntime>=1.14.1->chromadb) (10.0)\n", + "Requirement already satisfied: pyreadline3 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from humanfriendly>=9.1->coloredlogs->onnxruntime>=1.14.1->chromadb) (3.5.4)\n", + "Requirement already satisfied: MarkupSafe>=2.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from jinja2->torch>=1.11.0->sentence-transformers) (3.0.2)\n", + "Requirement already satisfied: oauthlib>=3.0.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from requests-oauthlib->kubernetes>=28.1.0->chromadb) (3.3.1)\n", + "Requirement already satisfied: joblib>=1.2.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from scikit-learn->sentence-transformers) (1.4.2)\n", + "Requirement already satisfied: threadpoolctl>=3.1.0 in c:\\users\\vorpc\\anaconda3\\lib\\site-packages (from scikit-learn->sentence-transformers) (3.5.0)\n", + "Note: you may need to restart the kernel to use updated packages.\n" + ] + } + ], "source": [ "%pip install langchain langchain_community pypdf\n", "%pip install termcolor langchain_openai langchain-huggingface sentence-transformers chromadb langchain_chroma tiktoken openai python-dotenv\n" @@ -69,15 +238,15 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 2, "metadata": { "id": "6heKZkQUxYZr" }, "outputs": [], "source": [ "import os\n", - "from langchain.document_loaders import PyPDFLoader\n", - "from langchain.text_splitter import CharacterTextSplitter, RecursiveCharacterTextSplitter\n", + "from langchain_community.document_loaders import PyPDFLoader\n", + "from langchain_text_splitters import RecursiveCharacterTextSplitter,CharacterTextSplitter\n", "import warnings\n", "warnings.filterwarnings('ignore')\n" ] @@ -96,7 +265,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 3, "metadata": { "id": "cuREtJRixYZt" }, @@ -104,7 +273,7 @@ "source": [ "# File path for the document\n", "\n", - "file_path = \"LAB/ai-for-everyone.pdf\"" + "file_path = r\"C:\\Users\\VORPC\\Ironhack\\classes\\labs\\week 18\\lab-intro-rag\\ai-for-everyone.pdf\"" ] }, { @@ -122,12 +291,23 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 4, "metadata": { "id": "_b5Z_45UxYZu", "outputId": "a600d69f-14fe-4492-f236-97261d6ff36c" }, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "297" + ] + }, + "execution_count": 4, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# Load and split the document\n", "loader = PyPDFLoader(file_path)\n", @@ -168,9 +348,20 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 5, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "1096" + ] + }, + "execution_count": 5, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "text_splitter = RecursiveCharacterTextSplitter(\n", " chunk_size=1000,\n", @@ -285,31 +476,43 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 6, "metadata": { "id": "L0xDxElwxYZw" }, "outputs": [], "source": [ - "from langchain.embeddings import OpenAIEmbeddings\n", + "\n", + "from langchain_openai import OpenAIEmbeddings\n", "from dotenv import load_dotenv" ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 7, "metadata": { "id": "_WRIo3_0xYZx", "outputId": "78bfbbf3-9d25-4e31-bdbc-3e932e6bbfec" }, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "True" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "load_dotenv()" ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 8, "metadata": { "id": "MNZfTng5xYZz", "outputId": "db1a7c85-ef9f-447e-92cd-9d097e959847" @@ -343,25 +546,31 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 9, "metadata": { "id": "brKe6wUgxYZ0" }, "outputs": [], "source": [ - "from langchain.vectorstores import Chroma" + "\n", + "from langchain_chroma import Chroma" ] }, { "cell_type": "code", - "execution_count": null, - "metadata": { - "id": "VkjHR-RkxYZ0", - "outputId": "bc11bda9-f283-457a-f584-5a06b95c4dd9" - }, - "outputs": [], + "execution_count": 10, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "ChromaDB created with document embeddings.\n" + ] + } + ], "source": [ - "db = Chroma.from_documents(chunks, embeddings, persist_directory=\"./chroma_db_LAB\")\n", + "db = Chroma.from_documents(chunks, embeddings, persist_directory=\"./chroma_db_lesson\")\n", "print(\"ChromaDB created with document embeddings.\")" ] }, @@ -383,24 +592,63 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 18, "metadata": { "id": "XiLv-TfrxYZ1" }, "outputs": [], "source": [ - "user_question = \"\" # User question\n", + "user_question = \"How is AI quietly reshaping normal people’s lives without their consent or understanding?\" # User question\n", "retrieved_docs = db.similarity_search(user_question, k=10) # k is the number of documents to retrieve" ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 19, "metadata": { "id": "qgWsh50JxYZ1", "outputId": "c8640c5d-5955-471f-fdd2-37096f5f68c7" }, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Document 1:\n", + "nce because they are not the expression of a hypothesis but sim-\n", + "ply an extrapolation from a set of data points. And yet AI is performative; by \n", + "intervening in the world and reorganising the phenomena it claims to describe, \n", + "it brings our experience into closer alignment with its constructs (Mackenzie \n", + "2008). This invalidates the methods as a form of statistical insight but makes it \n", + "very effective as a mode of subjection.\n", + "Automated Segregation\n", + "As the logic of AI migrates from the abstract mathematical space of tensors \n", + "to the space of real social tensions, it comes to bear in specific ways. First and \n", + "foremost of these is automated segregation.\n", + "There is nothing personal about the predictions of AI – at root, they are always \n", + "some form of labelling in terms of ‘people/objects like you’ . As an offshoot of \n", + "the statistics family tree, machine learning’s classifications are governed by the\n", + "Document 2:\n", + "Coeckelbergh 2020, Ch. 8). It is often the case that we do \n", + "not understand how algorithms function and interrelate, what exactly their \n", + "operation encompasses, what impact they have on our lives and under what \n", + "conditions this happens. This is why algorithms can lead to results and con -\n", + "sequences that might not be intended in the first place and sometimes cannot \n", + "even be adequately explained.\n", + "There have been numerous cases of encoded biases in algorithms such as \n", + "racist profiling or sexism (Bridle 2018, 142), which were a consequence of \n", + "comparable biases historically existing in society. The poet Joy Buolamwini, for \n", + "example, criticized them in a project AI, Ain’t I A Woman (www.notflawless.ai), \n", + "which focused on grave failures of facial recognition when it came to black \n", + "women. A myriad of such incidents demonstrates both that algorithms are far \n", + "from neutral artefacts, a point I return to later, but also that even their designers\n", + "Document 3:\n", + "tends long-standing debates on modes of \n", + "capitalism that significantly shape the circumstances of working people whilst \n", + "limiting their ability to influence decisions that govern their lives.\n" + ] + } + ], "source": [ "# Display top results\n", "for i, doc in enumerate(retrieved_docs[:3]): # Display top 3 results\n", @@ -418,7 +666,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 20, "metadata": { "id": "2iB3lZqHxYZ2" }, @@ -434,12 +682,20 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 21, "metadata": { "id": "2okzmuADxYZ2", "outputId": "0aa6cdca-188d-40e0-f5b4-8888d3549ea4" }, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Context formatted for GPT model.\n" + ] + } + ], "source": [ "# Generate a formatted context from the retrieved documents\n", "formatted_context = _get_document_prompt(retrieved_docs)\n", @@ -464,7 +720,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 22, "metadata": { "id": "tqxVh9s3xYZ3", "outputId": "97cca95d-4ab3-44d8-a76c-5713aad387d8" @@ -473,13 +729,52 @@ "source": [ "prompt = f\"\"\"\n", "\n", + "## SYSTEM ROLE\n", + "You are a knowledgeable and factual chatbot designed to Explain this AI concept as if you are teaching an everyday person with no technical background.\n", + "Your answers must be based exclusively on provided content from technical books provided.\n", + "\n", + "## USER QUESTION\n", + "The user has asked:\n", + "\"{user_question}\"\n", + "\n", + "## CONTEXT\n", + "Here is the relevant content from the technical books:\n", + "'''\n", + "{formatted_context}\n", + "'''\n", + "\n", + "## GUIDELINES\n", + "1. **Accuracy**:\n", + " - Only use the content in the `CONTEXT` section to answer.\n", + " - If the answer cannot be found, explicitly state: \"The provided context does not contain this information.\"\n", + " - Show how this concept affects their daily life right now (work, money, creativity, or decisions).\n", + "\n", + "2. **Transparency**:\n", + " - Do not speculate or provide opinions.\n", "\n", + "3. **Clarity**:\n", + " - Use plain language, real-life examples, and zero jargon.\n", + " - Format your response in Markdown for readability.\n", + "\n", + "## TASK\n", + "1. Answer the user's question **directly** if possible.\n", + "2. Point the user to relevant parts of the documentation.\n", + "3. Provide the response in the following format:\n", + "\n", + "## RESPONSE FORMAT\n", + "'''\n", + "# [Brief Title of the Answer]\n", + "[Answer in simple, clear text.]\n", + "\n", + "**Source**:\n", + "• [Book Title], Page(s): [...]\n", + "'''\n", "\"\"\"\n" ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 23, "metadata": { "id": "0mjkQJ_ZxYZ3" }, @@ -497,7 +792,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 24, "metadata": { "id": "ylypRWRlxYZ4" }, @@ -507,11 +802,11 @@ "client = openai.OpenAI()\n", "model_params = {\n", " 'model': 'gpt-4o',\n", - " 'temperature': , # Increase creativity\n", - " 'max_tokens': , # Allow for longer responses\n", - " 'top_p': , # Use nucleus sampling\n", - " 'frequency_penalty': , # Reduce repetition\n", - " 'presence_penalty': # Encourage new topics\n", + " 'temperature':0.7 , # Increase creativity\n", + " 'max_tokens': 2000, # Allow for longer responses\n", + " 'top_p': 0.9 , # Use nucleus sampling\n", + " 'frequency_penalty':0.5 , # Reduce repetition\n", + " 'presence_penalty': 0.6 # Encourage new topics\n", "}" ] }, @@ -526,7 +821,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 25, "metadata": { "id": "4eXZO4pIxYZ4" }, @@ -538,12 +833,37 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 26, "metadata": { "id": "wLPAcchBxYZ5", "outputId": "976c7800-16ed-41fe-c4cf-58f60d3230d2" }, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "'''\n", + "# How AI Quietly Reshapes Our Lives\n", + "\n", + "Artificial Intelligence (AI) is influencing our everyday lives in ways that many people might not fully realize or understand. It’s working behind the scenes, impacting several areas:\n", + "\n", + "1. **Employment and Work**: AI is changing how jobs are organized and performed. For instance, algorithms are used in hiring processes and assessing performance, which can affect job opportunities and work evaluations without employees' direct awareness.\n", + "\n", + "2. **Automation**: AI systems are increasingly taking over tasks that humans used to do. This shift can lead to concerns about job security as machines handle more work efficiently, which may result in fewer available jobs for people.\n", + "\n", + "3. **Data Collection**: Companies collect vast amounts of data on individuals' activities both at work and in their personal lives. This data is used by machine learning systems to make decisions that influence how tasks are allocated and completed.\n", + "\n", + "4. **Biases in Algorithms**: There have been cases where AI systems reflect societal biases, such as racism or sexism, because they learn from historical data that contains these biases. This can lead to unfair treatment of certain groups without individuals being aware of the underlying causes.\n", + "\n", + "These examples show how AI integrates into various aspects of life — like employment and personal privacy — often without explicit consent or understanding from those affected.\n", + "\n", + "**Source**:\n", + "• \"AI for Everyone?\", Pages: 214-218\n", + "'''\n" + ] + } + ], "source": [ "answer = completion.choices[0].message.content\n", "print(answer)" @@ -595,7 +915,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 27, "metadata": { "id": "nCXL9Cz1xYaV" }, @@ -615,7 +935,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 28, "metadata": { "id": "9y3E0YWExYaV" }, @@ -636,14 +956,27 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 31, "metadata": { "id": "i7SkWPpnxYaW", "outputId": "28e82563-edba-4b41-acad-ec27e5ba134f" }, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Snippet 1:\n", + "70 AI for Everyone?\n", + "dilution of science because they are not the expression of a hypothesis but sim-\n", + "ply an extrapolation from a set of data points. And yet AI is performative; by \n", + "intervening in the \n", + "--------------------------------------------------------------------------------\n" + ] + } + ], "source": [ - "query_keywords = [] # add your keywords\n", + "query_keywords = [\"ai\", \"life\", \"everyone\"] # add your keywords\n", "for i, doc in enumerate(retrieved_docs[:1]):\n", " snippet = doc.page_content[:200]\n", " highlighted = highlight_keywords(snippet, query_keywords)\n", @@ -687,7 +1020,7 @@ "provenance": [] }, "kernelspec": { - "display_name": "llm", + "display_name": "base", "language": "python", "name": "python3" }, @@ -701,7 +1034,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.12.10" + "version": "3.13.5" } }, "nbformat": 4,