diff --git a/.github/workflows/publish_release.yml b/.github/workflows/publish_release.yml index fdb07cb5aae36..62e7457da3760 100644 --- a/.github/workflows/publish_release.yml +++ b/.github/workflows/publish_release.yml @@ -14,6 +14,7 @@ env: jobs: build-n-publish: name: Build and publish to PyPI + if: github.repository == 'run-llama/llama_index' runs-on: ubuntu-latest steps: diff --git a/.github/workflows/publish_sub_package.yml b/.github/workflows/publish_sub_package.yml new file mode 100644 index 0000000000000..3dd6ae4bc18cb --- /dev/null +++ b/.github/workflows/publish_sub_package.yml @@ -0,0 +1,43 @@ +name: Publish Sub-Package to PyPI if Needed + +on: + push: + branches: + - main + +env: + POETRY_VERSION: "1.6.1" + PYTHON_VERSION: "3.10" + +jobs: + publish_subpackage_if_needed: + if: github.repository == 'run-llama/llama_index' + runs-on: ubuntu-latest + steps: + - uses: actions/checkout@v3 + with: + fetch-depth: 0 + - name: Set up python ${{ env.PYTHON_VERSION }} + uses: actions/setup-python@v4 + with: + python-version: ${{ env.PYTHON_VERSION }} + - name: Install Poetry + uses: snok/install-poetry@v1 + with: + version: ${{ env.POETRY_VERSION }} + - name: Get changed pyproject files + id: changed-files + run: | + echo "changed_files=$(git diff --name-only ${{ github.event.before }} ${{ github.event.after }} | grep -v llama-index-core | grep llama-index | grep pyproject | xargs)" >> $GITHUB_OUTPUT + - name: Publish changed packages + env: + PYPI_TOKEN: ${{ secrets.LLAMA_INDEX_PYPI_TOKEN }} + run: | + for file in ${{ steps.changed-files.outputs.changed_files }}; do + cd `echo $file | sed 's/\/pyproject.toml//g'` + poetry lock + pip install -e . 
+ poetry config pypi-token.pypi $PYPI_TOKEN + poetry publish --build + cd - + done diff --git a/CHANGELOG.md b/CHANGELOG.md index 275302e0025e8..b2676ba77f4da 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,5 +1,43 @@ # ChangeLog +## [0.10.16] - 2024-03-05 + +### New Features + +- Anthropic support for new models (#11623, #11612) +- Easier creation of chat prompts (#11583) +- Added a raptor retriever llama-pack (#11527) +- Improve batch cohere embeddings through bedrock (#11572) +- Added support for vertex AI embeddings (#11561) + +### Bug Fixes / Nits + +- Ensure order in async embeddings generation (#11562) +- Fixed empty metadata for csv reader (#11563) +- Serializable fix for composable retrievers (#11617) +- Fixed milvus metadata filter support (#11566) +- Fixed pydantic import in clickhouse vector store (#11631) +- Fixed system prompts for gemini/vertex-gemini (#11511) + +## [0.10.15] - 2024-03-01 + +### New Features + +- Added FeishuWikiReader (#11491) +- Added videodb retriever integration (#11463) +- Added async to opensearch vector store (#11513) +- New LangFuse one-click callback handler (#11324) + +### Bug Fixes / Nits + +- Fixed deadlock issue with async chat streaming (#11548) +- Improved hidden file check in SimpleDirectoryReader (#11496) +- Fixed null values in document metadata when using SimpleDirectoryReader (#11501) +- Fix for sqlite utils in jsonalyze query engine (#11519) +- Added base url and timeout to ollama multimodal LLM (#11526) +- Updated duplicate handling in query fusion retriever (#11542) +- Fixed bug in kg index struct updating (#11475) + ## [0.10.14] - 2024-02-28 ### New Features diff --git a/docs/BUILD b/docs/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/docs/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/docs/community/integrations/uptrain.md b/docs/community/integrations/uptrain.md index d07e25fcbf1b5..da808ae3db271 100644 --- a/docs/community/integrations/uptrain.md +++ 
b/docs/community/integrations/uptrain.md @@ -1,89 +1,121 @@ # Perform Evaluations on LlamaIndex with UpTrain -**Overview**: In this example, we will see how to use UpTrain with LlamaIndex. +**Overview**: In this example, we will see how to use UpTrain with LlamaIndex. UpTrain ([github](https://github.com/uptrain-ai/uptrain) || [website](https://uptrain.ai/) || [docs](https://docs.uptrain.ai/)) is an open-source platform to evaluate and improve GenAI applications. It provides grades for 20+ preconfigured checks (covering language, code, embedding use cases), performs root cause analysis on failure cases and gives insights on how to resolve them. More details on UpTrain's evaluations can be found [here](https://github.com/uptrain-ai/uptrain?tab=readme-ov-file#pre-built-evaluations-we-offer-). -**Problem**: There are two main problems: +**Problem**: As an increasing number of companies are graduating their LLM prototypes to production-ready applications, their RAG pipelines are also getting complex. Developers are utilising modules like QueryRewrite, Context ReRank, etc., to enhance the accuracy of their RAG systems. -1. The data that most Large Language Models are trained on is not representative of the data that they are used on. This leads to a mismatch between the training and test distributions, which can lead to poor performance. -2. The results generated by Large Language Models are not always reliable. The responses might not be relevant to the prompt, not align with the desired tone or the context, or might be offensive etc. +With increasing complexity comes more points of failure. -**Solution**: The above two problems are solved by two different tools and we will show you how to use them together: +1. Advanced Evals are needed to evaluate the quality of these newer modules and determine if they actually improve the system's accuracy. +2. 
A robust experimentation framework is needed to systematically test different modules and make data-driven decisions. -1. LlamaIndex solves the first problem by allowing you to perform Retrieval Augmented Generation (RAG) with a retriever that is fine-tuned on your own data. This allows you to use your own data to fine-tune a retriever, and then use that retriever to perform RAG. -2. UpTrain solves the second problem by allowing you to perform evaluations on the generated responses. This helps you to ensure that the responses are relevant to the prompt, align with the desired tone or the context, and are not offensive etc. +**Solution**: UpTrain helps solve both: + +1. UpTrain provides a series of checks to evaluate the quality of the generated response, the retrieved context, and all the interim steps. The relevant checks are ContextRelevance, SubQueryCompleteness, ContextReranking, ContextConciseness, FactualAccuracy, ContextUtilization, ResponseCompleteness, ResponseConciseness, etc. +2. UpTrain also allows you to experiment with different embedding models and provides an "evaluate_experiments" method to compare different RAG configurations. # How to go about it? -There two ways you can use UpTrain with LlamaIndex: +There are two ways you can use UpTrain with LlamaIndex: -1. **Using the UpTrain Callback Handler**: This method allows you to seamlessly integrate UpTrain with LlamaIndex. You can simply add UpTrainCallbackHandler to your existing LlamaIndex pipeline and it will take care of sending the generated responses to the UpTrain Managed Service for evaluations. This is the recommended method as it is the easiest to use and provides you with dashboards and insights with minimal effort. +1. **Using the UpTrain Callback Handler**: This method allows you to seamlessly integrate UpTrain with LlamaIndex. You can simply add UpTrainCallbackHandler to your existing LlamaIndex pipeline and it will evaluate all components of your RAG pipeline. 
This is the recommended method as it is the easiest to use and provides you with dashboards and insights with minimal effort. 2. **Using UpTrain's EvalLlamaIndex**: This method allows you to use UpTrain to perform evaluations on the generated responses. You can use the EvalLlamaIndex object to generate responses for the queries and then perform evaluations on the responses. You can find a detailed tutorial on how to do this below. This method offers more flexibility and control over the evaluations, but requires more effort to set up and use. # 1. Using the UpTrain Callback Handler Open In Colab -Three additional evaluations for Llamaindex have been introduced, complementing existing ones. These evaluations run automatically, with results displayed in the output. More details on UpTrain's evaluations can be found [here](https://github.com/uptrain-ai/uptrain?tab=readme-ov-file#pre-built-evaluations-we-offer-). +Below is how to use UpTrain Callback Handler to evaluate different components of your RAG pipelines. + +## 1. **RAG Query Engine Evaluations**: + +The RAG query engine plays a crucial role in retrieving context and generating responses. To ensure its performance and response quality, we conduct the following evaluations: + +- **[Context Relevance](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-relevance)**: Determines if the retrieved context has sufficient information to answer the user query or not. +- **[Factual Accuracy](https://docs.uptrain.ai/predefined-evaluations/context-awareness/factual-accuracy)**: Assesses if the LLM's response can be verified via the retrieved context. +- **[Response Completeness](https://docs.uptrain.ai/predefined-evaluations/response-quality/response-completeness)**: Checks if the response contains all the information required to answer the user query comprehensively. + +## 2. 
**Sub-Question Query Generation Evaluation**: + +The SubQuestionQueryGeneration operator decomposes a question into sub-questions, generating responses for each using an RAG query engine. To measure its accuracy, we use: + +- **[Sub Query Completeness](https://docs.uptrain.ai/predefined-evaluations/query-quality/sub-query-completeness)**: Assures that the sub-questions accurately and comprehensively cover the original query. + +## 3. **Re-Ranking Evaluations**: + +Re-ranking involves reordering nodes based on relevance to the query and choosing the top nodes. Different evaluations are performed based on the number of nodes returned after re-ranking. + +a. Same Number of Nodes + +- **[Context Reranking](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-reranking)**: Checks if the order of re-ranked nodes is more relevant to the query than the original order. + +b. Different Number of Nodes: + +- **[Context Conciseness](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-conciseness)**: Examines whether the reduced number of nodes still provides all the required information. + +These evaluations collectively ensure the robustness and effectiveness of the RAG query engine, SubQuestionQueryGeneration operator, and the re-ranking process in the LlamaIndex pipeline. + +#### **Note:** -Selected operators from the LlamaIndex pipeline are highlighted for demonstration: +- We have performed evaluations using a basic RAG query engine; the same evaluations can be performed using the advanced RAG query engine as well. +- Same is true for Re-Ranking evaluations, we have performed evaluations using SentenceTransformerRerank, the same evaluations can be performed using other re-rankers as well. ## 1. **RAG Query Engine Evaluations**: The RAG query engine plays a crucial role in retrieving context and generating responses. 
To ensure its performance and response quality, we conduct the following evaluations: -- **Context Relevance**: Determines if the context extracted from the query is relevant to the response. -- **Factual Accuracy**: Assesses if the LLM is hallcuinating or providing incorrect information. -- **Response Completeness**: Checks if the response contains all the information requested by the query. +- **[Context Relevance](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-relevance)**: Determines if the retrieved context has sufficient information to answer the user query or not. +- **[Factual Accuracy](https://docs.uptrain.ai/predefined-evaluations/context-awareness/factual-accuracy)**: Assesses if the LLM's response can be verified via the retrieved context. +- **[Response Completeness](https://docs.uptrain.ai/predefined-evaluations/response-quality/response-completeness)**: Checks if the response contains all the information required to answer the user query comprehensively. ## 2. **Sub-Question Query Generation Evaluation**: -The SubQuestionQueryGeneration operator decomposes a question into sub-questions, generating responses for each using a RAG query engine. Given the complexity, we include the previous evaluations and add: +The SubQuestionQueryGeneration operator decomposes a question into sub-questions, generating responses for each using an RAG query engine. To measure its accuracy, we use: -- **Sub Query Completeness**: Assures that the sub-questions accurately and comprehensively cover the original query. +- **[Sub Query Completeness](https://docs.uptrain.ai/predefined-evaluations/query-quality/sub-query-completeness)**: Assures that the sub-questions accurately and comprehensively cover the original query. ## 3. **Re-Ranking Evaluations**: -Re-ranking involves reordering nodes based on relevance to the query and choosing top n nodes. Different evaluations are performed based on the number of nodes returned after re-ranking. 
+Re-ranking involves reordering nodes based on relevance to the query and choosing the top nodes. Different evaluations are performed based on the number of nodes returned after re-ranking. a. Same Number of Nodes -- **Context Reranking**: Checks if the order of re-ranked nodes is more relevant to the query than the original order. +- **[Context Reranking](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-reranking)**: Checks if the order of re-ranked nodes is more relevant to the query than the original order. b. Different Number of Nodes: -- **Context Conciseness**: Examines whether the reduced number of nodes still provides all the required information. +- **[Context Conciseness](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-conciseness)**: Examines whether the reduced number of nodes still provides all the required information. These evaluations collectively ensure the robustness and effectiveness of the RAG query engine, SubQuestionQueryGeneration operator, and the re-ranking process in the LlamaIndex pipeline. #### **Note:** - We have performed evaluations using basic RAG query engine, the same evaluations can be performed using the advanced RAG query engine as well. -- Same is true for Re-Ranking evaluations, we have performed evaluations using CohereRerank, the same evaluations can be performed using other re-rankers as well. +- Same is true for Re-Ranking evaluations, we have performed evaluations using SentenceTransformerRerank, the same evaluations can be performed using other re-rankers as well. ## Install Dependencies and Import Libraries Install notebook dependencies. ```bash -pip install -q html2text llama-index pandas tqdm uptrain cohere +%pip install llama-index-readers-web +%pip install llama-index-callbacks-uptrain +%pip install -q html2text llama-index pandas tqdm uptrain torch sentence-transformers ``` Import libraries. 
```python -from llama_index import ( - ServiceContext, - VectorStoreIndex, -) -from llama_index.node_parser import SentenceSplitter -from llama_index.readers import SimpleWebPageReader -from llama_index.callbacks import CallbackManager, UpTrainCallbackHandler -from llama_index.postprocessor.cohere_rerank import CohereRerank -from llama_index.service_context import set_global_service_context -from llama_index.query_engine.sub_question_query_engine import ( - SubQuestionQueryEngine, -) -from llama_index.tools.query_engine import QueryEngineTool -from llama_index.tools.types import ToolMetadata +from llama_index.core import Settings, VectorStoreIndex +from llama_index.core.node_parser import SentenceSplitter +from llama_index.readers.web import SimpleWebPageReader +from llama_index.core.callbacks import CallbackManager +from llama_index.callbacks.uptrain.base import UpTrainCallbackHandler +from llama_index.core.query_engine import SubQuestionQueryEngine +from llama_index.core.tools import QueryEngineTool, ToolMetadata +from llama_index.core.postprocessor import SentenceTransformerRerank +from llama_index.llms.openai import OpenAI + +import os ``` ## Setup @@ -123,16 +155,17 @@ Parameters: **Note:** The `project_name_prefix` will be used as prefix for the project names in the UpTrain dashboard. These will be different for different types of evals. For example, if you set project_name_prefix="llama" and perform the sub_question evaluation, the project name will be "llama_sub_question_answering". 
```python +os.environ[ + "OPENAI_API_KEY" +] = "sk-***********" # Replace with your OpenAI API key + callback_handler = UpTrainCallbackHandler( key_type="openai", - api_key="sk-******************************", + api_key=os.environ["OPENAI_API_KEY"], project_name_prefix="llama", ) -callback_manager = CallbackManager([callback_handler]) -service_context = ServiceContext.from_defaults( - callback_manager=callback_manager -) -set_global_service_context(service_context) + +Settings.callback_manager = CallbackManager([callback_handler]) ``` ## Load and Parse Documents @@ -158,13 +191,13 @@ nodes = parser.get_nodes_from_documents(documents) UpTrain callback handler will automatically capture the query, context and response once generated and will run the following three evaluations _(Graded from 0 to 1)_ on the response: -- **Context Relevance**: Check if the context extractedfrom the query is relevant to the response. -- **Factual Accuracy**: Check how factually accurate the response is. -- **Response Completeness**: Check if the response contains all the information that the query is asking for. +- **[Context Relevance](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-relevance)**: Determines if the retrieved context has sufficient information to answer the user query or not. +- **[Factual Accuracy](https://docs.uptrain.ai/predefined-evaluations/context-awareness/factual-accuracy)**: Assesses if the LLM's response can be verified via the retrieved context. +- **[Response Completeness](https://docs.uptrain.ai/predefined-evaluations/response-quality/response-completeness)**: Checks if the response contains all the information required to answer the user query comprehensively. ```python index = VectorStoreIndex.from_documents( - documents, service_context=service_context + documents, ) query_engine = index.as_query_engine() @@ -181,55 +214,66 @@ for query in queries: ``` Question: What did Paul Graham do growing up? 
+ Response: Paul Graham wrote short stories and started programming on the IBM 1401 in 9th grade using an early version of Fortran. Later, he convinced his father to buy a TRS-80, where he wrote simple games, a program to predict rocket heights, and a word processor. + Context Relevance Score: 0.0 Factual Accuracy Score: 1.0 - Response Completeness Score: 0.0 + Response Completeness Score: 1.0 Question: When and how did Paul Graham's mother die? + Response: Paul Graham's mother died when he was 18 years old, from a brain tumor. + Context Relevance Score: 0.0 - Factual Accuracy Score: 1.0 - Response Completeness Score: 0.0 + Factual Accuracy Score: 0.0 + Response Completeness Score: 1.0 Question: What, in Paul Graham's opinion, is the most distinctive thing about YC? - Context Relevance Score: 1.0 - Factual Accuracy Score: 1.0 + Response: The most distinctive thing about Y Combinator, according to Paul Graham, is that instead of deciding for himself what to work on, the problems come to him. Every 6 months, a new batch of startups brings their problems, which then become the focus of YC's work. + + Context Relevance Score: 0.0 + Factual Accuracy Score: 0.5 Response Completeness Score: 1.0 Question: When and how did Paul Graham meet Jessica Livingston? + Response: Paul Graham met Jessica Livingston at a big party at his house in October 2003. + Context Relevance Score: 1.0 - Factual Accuracy Score: 1.0 - Response Completeness Score: 0.5 + Factual Accuracy Score: 0.5 + Response Completeness Score: 1.0 Question: What is Bel, and when and where was it written? + Response: Bel is a new Lisp that was written in Arc. It was developed over a period of 4 years, from March 26, 2015 to October 12, 2019. Most of the work on Bel was done in England, where the author had moved to in the summer of 2016. 
+ Context Relevance Score: 1.0 Factual Accuracy Score: 1.0 - Response Completeness Score: 0.0 + Response Completeness Score: 1.0 Here's an example of the dashboard showing how you can filter and drill down to the failing cases and get insights on the failing cases: ![image-2.png](https://uptrain-assets.s3.ap-south-1.amazonaws.com/images/llamaindex/image-2.png) # 2. Sub-Question Query Engine Evaluation -The **sub question query engine** is used to tackle the problem of answering a complex query using multiple data sources. It first breaks down the complex query into sub questions for each relevant data source, then gather all the intermediate responses and synthesizes a final response. +The **sub-question query engine** is used to tackle the problem of answering a complex query using multiple data sources. It first breaks down the complex query into sub-questions for each relevant data source, then gathers all the intermediate responses and synthesizes a final response. UpTrain callback handler will automatically capture the sub-question and the responses for each of them once generated and will run the following three evaluations _(Graded from 0 to 1)_ on the response: -- **Context Relevance**: Check if the context extractedfrom the query is relevant to the response. -- **Factual Accuracy**: Check how factually accurate the response is. -- **Response Completeness**: Check if the response contains all the information that the query is asking for. +- **[Context Relevance](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-relevance)**: Determines if the retrieved context has sufficient information to answer the user query or not. +- **[Factual Accuracy](https://docs.uptrain.ai/predefined-evaluations/context-awareness/factual-accuracy)**: Assesses if the LLM's response can be verified via the retrieved context. 
+- **[Response Completeness](https://docs.uptrain.ai/predefined-evaluations/response-quality/response-completeness)**: Checks if the response contains all the information required to answer the user query comprehensively. In addition to the above evaluations, the callback handler will also run the following evaluation: -- **Sub Query Completeness**: Checks if the sub-questions accurately and completely cover the original query. +- **[Sub Query Completeness](https://docs.uptrain.ai/predefined-evaluations/query-quality/sub-query-completeness)**: Assures that the sub-questions accurately and comprehensively cover the original query. ```python # build index and query engine vector_query_engine = VectorStoreIndex.from_documents( - documents=documents, use_async=True, service_context=service_context + documents=documents, + use_async=True, ).as_query_engine() query_engine_tools = [ @@ -244,7 +288,6 @@ query_engine_tools = [ query_engine = SubQuestionQueryEngine.from_defaults( query_engine_tools=query_engine_tools, - service_context=service_context, use_async=True, ) @@ -253,22 +296,38 @@ response = query_engine.query( ) ``` - Question: What did Paul Graham work on during YC? - Context Relevance Score: 0.5 + Generated 3 sub questions. + [documents] Q: What did Paul Graham work on before Y Combinator? + [documents] Q: What did Paul Graham work on during Y Combinator? + [documents] Q: What did Paul Graham work on after Y Combinator? + [documents] A: Paul Graham worked on a project with Robert and Trevor after Y Combinator. + [documents] A: Paul Graham worked on projects with his colleagues Robert and Trevor before Y Combinator. + [documents] A: Paul Graham worked on writing essays and working on Y Combinator during his time at Y Combinator. +  + + + Question: What did Paul Graham work on after Y Combinator? + Response: Paul Graham worked on a project with Robert and Trevor after Y Combinator. 
+ + Context Relevance Score: 0.0 Factual Accuracy Score: 1.0 Response Completeness Score: 0.5 - Question: What did Paul Graham work on after YC? - Context Relevance Score: 0.5 + Question: What did Paul Graham work on before Y Combinator? + Response: Paul Graham worked on projects with his colleagues Robert and Trevor before Y Combinator. + + Context Relevance Score: 0.0 Factual Accuracy Score: 1.0 Response Completeness Score: 0.5 - Question: What did Paul Graham work on before YC? - Context Relevance Score: 1.0 - Factual Accuracy Score: 1.0 - Response Completeness Score: 0.0 + Question: What did Paul Graham work on during Y Combinator? + Response: Paul Graham worked on writing essays and working on Y Combinator during his time at Y Combinator. + + Context Relevance Score: 0.0 + Factual Accuracy Score: 0.5 + Response Completeness Score: 0.5 Question: How was Paul Grahams life different before, during, and after YC? @@ -280,7 +339,7 @@ Here's an example of the dashboard visualizing the scores of the sub-questions i # 3. Re-ranking -Re-ranking is the process of reordering the nodes based on their relevance to the query. There are multiple classes of re-ranking algorithms offered by Llamaindex. We have used CohereRerank for this example. +Re-ranking is the process of reordering the nodes based on their relevance to the query. There are multiple classes of re-ranking algorithms offered by LlamaIndex. We have used SentenceTransformerRerank for this example. The re-ranker allows you to enter the number of top n nodes that will be returned after re-ranking. If this value remains the same as the original number of nodes, the re-ranker will only re-rank the nodes and not change the number of nodes. Otherwise, it will re-rank the nodes and return the top n nodes. 
@@ -290,22 +349,28 @@ We will perform different evaluations based on the number of nodes returned afte If the number of nodes returned after re-ranking is the same as the original number of nodes, the following evaluation will be performed: -- **Context Reranking**: Check if the order of the re-ranked nodes is more relevant to the query than the original order. +- **[Context Reranking](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-reranking)**: Checks if the order of re-ranked nodes is more relevant to the query than the original order. ```python -api_key = "**********************************" # Insert cohere API key here -cohere_rerank = CohereRerank( - api_key=api_key, top_n=5 -) # In this example, the number of nodes before re-ranking is 5 and after re-ranking is also 5. +callback_handler = UpTrainCallbackHandler( + key_type="openai", + api_key=os.environ["OPENAI_API_KEY"], + project_name_prefix="llama", +) +Settings.callback_manager = CallbackManager([callback_handler]) + +rerank_postprocessor = SentenceTransformerRerank( + top_n=3, # number of nodes after reranking + keep_retrieval_score=True, +) index = VectorStoreIndex.from_documents( - documents=documents, service_context=service_context + documents=documents, ) query_engine = index.as_query_engine( - similarity_top_k=10, - node_postprocessors=[cohere_rerank], - service_context=service_context, + similarity_top_k=3, # number of nodes before reranking + node_postprocessors=[rerank_postprocessor], ) response = query_engine.query( @@ -316,25 +381,39 @@ response = query_engine.query( Question: What did Sam Altman do in this essay? Context Reranking Score: 0.0 + + Question: What did Sam Altman do in this essay? + Response: Sam Altman was asked to become the president of Y Combinator after the original founders decided to step back and reorganize the company for long-term sustainability. 
+ + Context Relevance Score: 1.0 + Factual Accuracy Score: 1.0 + Response Completeness Score: 0.5 + # 3b. Re-ranking (With different number of nodes) If the number of nodes returned after re-ranking is the lesser as the original number of nodes, the following evaluation will be performed: -- **Context Conciseness**: If the re-ranked nodes are able to provide all the information required by the query. +- **[Context Conciseness](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-conciseness)**: Examines whether the reduced number of nodes still provides all the required information. ```python -api_key = "**********************************" # insert cohere API key here -cohere_rerank = CohereRerank( - api_key=api_key, top_n=2 -) # In this example, the number of nodes before re-ranking is 5 and after re-ranking is 2. +callback_handler = UpTrainCallbackHandler( + key_type="openai", + api_key=os.environ["OPENAI_API_KEY"], + project_name_prefix="llama", +) +Settings.callback_manager = CallbackManager([callback_handler]) + +rerank_postprocessor = SentenceTransformerRerank( + top_n=2, # Number of nodes after re-ranking + keep_retrieval_score=True, +) index = VectorStoreIndex.from_documents( - documents=documents, service_context=service_context + documents=documents, ) query_engine = index.as_query_engine( - similarity_top_k=10, - node_postprocessors=[cohere_rerank], - service_context=service_context, + similarity_top_k=5, # Number of nodes before re-ranking + node_postprocessors=[rerank_postprocessor], ) # Use your advanced RAG @@ -344,18 +423,20 @@ response = query_engine.query( ``` Question: What did Sam Altman do in this essay? - Context Conciseness Score: 1.0 + Context Conciseness Score: 0.0 -# UpTrain's Managed Service Dashboard and Insights -The UpTrain Managed Service offers the following features: + Question: What did Sam Altman do in this essay? 
+ Response: Sam Altman offered unsolicited advice to the author during a visit to California for interviews. + + + Context Relevance Score: 1.0 + Factual Accuracy Score: 1.0 + Response Completeness Score: 0.5 -1. Advanced dashboards with drill-down and filtering options. -1. Identification of insights and common themes among unsuccessful cases. -1. Real-time observability and monitoring of production data. -1. Integration with CI/CD pipelines for seamless regression testing. +# UpTrain's Managed Service Dashboard and Insights -To define the UpTrain callback handler, the only change required is to set the `key_type` and `api_key` parameters. The rest of the code remains the same. +To use the UpTrain's managed service via the UpTrain callback handler, the only change required is to set the `key_type` and `api_key` parameters. The rest of the code remains the same. ```python callback_handler = UpTrainCallbackHandler( @@ -380,12 +461,13 @@ pip install uptrain llama_index ## Import required libraries ```python +import httpx import os import openai import pandas as pd -from llama_index.core import VectorStoreIndex, SimpleDirectoryReader -from uptrain import Evals, EvalLlamaIndex, Settings +from llama_index.core import VectorStoreIndex, SimpleDirectoryReader, Settings +from uptrain import Evals, EvalLlamaIndex, Settings as UpTrainSettings ``` ## Create the dataset folder for the query engine @@ -399,8 +481,6 @@ if not os.path.exists("nyc_wikipedia"): dataset_path = os.path.join("./nyc_wikipedia", "nyc_text.txt") if not os.path.exists(dataset_path): - import httpx - r = httpx.get(url) with open(dataset_path, "wb") as f: f.write(r.content) @@ -436,8 +516,6 @@ openai.api_key = "sk-************************" # your OpenAI API key Let's create a vector store index using LLamaIndex and then use that as a query engine to retrieve relevant sections from the documentation. 
```python -from llama_index.core import Settings - Settings.chunk_size = 512 documents = SimpleDirectoryReader("./nyc_wikipedia/").load_data() @@ -452,7 +530,7 @@ query_engine = vector_index.as_query_engine() # Alternative 1: Evaluate using UpTrain's Open-Source Software (OSS) ```python -settings = Settings( +settings = UpTrainSettings( openai_api_key=openai.api_key, ) ``` @@ -502,7 +580,7 @@ You can create a free UpTrain account [here](https://uptrain.ai/) and get free t UPTRAIN_API_KEY = "up-**********************" # your UpTrain API key # We use `uptrain_access_token` parameter instead of 'openai_api_key' in settings in this case -settings = Settings( +settings = UpTrainSettings( uptrain_access_token=UPTRAIN_API_KEY, ) ``` diff --git a/docs/cookbooks/mixedbread_reranker.ipynb b/docs/cookbooks/mixedbread_reranker.ipynb new file mode 100644 index 0000000000000..1f95a31e234ba --- /dev/null +++ b/docs/cookbooks/mixedbread_reranker.ipynb @@ -0,0 +1,280 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "964030f7-40e4-4398-a5ab-668aabcf3bad", + "metadata": {}, + "source": [ + "\"Open" + ] + }, + { + "cell_type": "markdown", + "id": "360313ab-9393-430e-9647-e0d5545809b9", + "metadata": {}, + "source": [ + "# mixedbread Rerank Cookbook\n", + "\n", + "mixedbread.ai has released three fully open-source reranker models under the Apache 2.0 license. For more in-depth information, you can check out their detailed [blog post](https://www.mixedbread.ai/blog/mxbai-rerank-v1). The following are the three models:\n", + "\n", + "1. `mxbai-rerank-xsmall-v1`\n", + "2. `mxbai-rerank-base-v1`\n", + "3. `mxbai-rerank-large-v1`\n", + "\n", + "In this notebook, we'll demonstrate how to use the `mxbai-rerank-base-v1` model with the `SentenceTransformerRerank` module in LlamaIndex. This setup allows you to seamlessly swap in any reranker model of your choice using the `SentenceTransformerRerank` module to enhance your RAG pipeline." 
+ ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "856ecfdc-04fa-4fe9-a81c-9a5858cd4a6d", + "metadata": {}, + "source": [ + "### Installation" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "bfb5314f-e6c7-409c-86df-8e1a5ca59adb", + "metadata": {}, + "outputs": [], + "source": [ + "!pip install llama-index\n", + "!pip install sentence-transformers" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "5f5393fb-b410-4769-9380-0ef90a33b82e", + "metadata": {}, + "source": [ + "### Set API Keys" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a9782acf-b0ab-4933-bb41-27cd2a02b5dd", + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + "\n", + "os.environ[\"OPENAI_API_KEY\"] = \"YOUR OPENAI API KEY\"" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "b7596ddf-e1de-4098-81f3-fce504d2da94", + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.core import (\n", + " VectorStoreIndex,\n", + " SimpleDirectoryReader,\n", + ")\n", + "\n", + "from llama_index.core.postprocessor import SentenceTransformerRerank" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "8011ff9c-2b82-47b4-983f-4fafc29e3127", + "metadata": {}, + "source": [ + "### Download Data" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "6dd335cb-900b-462f-987a-d4af2aac88fa", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "--2024-03-01 09:52:09-- https://raw.githubusercontent.com/run-llama/llama_index/main/docs/examples/data/paul_graham/paul_graham_essay.txt\n", + "Resolving raw.githubusercontent.com (raw.githubusercontent.com)... 185.199.110.133, 185.199.108.133, 185.199.109.133, ...\n", + "Connecting to raw.githubusercontent.com (raw.githubusercontent.com)|185.199.110.133|:443... connected.\n", + "HTTP request sent, awaiting response... 
200 OK\n", + "Length: 75042 (73K) [text/plain]\n", + "Saving to: ‘data/paul_graham/paul_graham_essay.txt’\n", + "\n", + "data/paul_graham/pa 100%[===================>] 73.28K --.-KB/s in 0.007s \n", + "\n", + "2024-03-01 09:52:09 (9.86 MB/s) - ‘data/paul_graham/paul_graham_essay.txt’ saved [75042/75042]\n", + "\n" + ] + } + ], + "source": [ + "!mkdir -p 'data/paul_graham/'\n", + "!wget 'https://raw.githubusercontent.com/run-llama/llama_index/main/docs/examples/data/paul_graham/paul_graham_essay.txt' -O 'data/paul_graham/paul_graham_essay.txt'" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "e482b09c-a0df-4788-a75b-a33ade7001d1", + "metadata": {}, + "source": [ + "### Load Documents" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "342c91b8-301f-40ed-9d09-9acdb1bbdc44", + "metadata": {}, + "outputs": [], + "source": [ + "documents = SimpleDirectoryReader(\"./data/paul_graham/\").load_data()" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "8afdfeb1-57ae-4d2b-ae73-683db205be32", + "metadata": {}, + "source": [ + "### Build Index" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "47c335e9-dd4d-475c-bade-e2a588e33294", + "metadata": {}, + "outputs": [], + "source": [ + "index = VectorStoreIndex.from_documents(documents=documents)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "f1ab8157-dbcb-4588-9b3c-5bd2fc4a721e", + "metadata": {}, + "source": [ + "### Define postprocessor for `mxbai-rerank-base-v1` reranker" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "3fcc5590-2e58-4a7e-8b18-a7153c06d1ff", + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.core.postprocessor import SentenceTransformerRerank\n", + "\n", + "postprocessor = SentenceTransformerRerank(\n", + " model=\"mixedbread-ai/mxbai-rerank-base-v1\", top_n=2\n", + ")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": 
"c7c81b0d-0449-4092-80cb-88080e69f980", + "metadata": {}, + "source": [ + "### Create Query Engine\n", + "\n", + "We will first retrieve 10 relevant nodes and pick top-2 nodes using the defined postprocessor." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "e1b23700-15ae-4f1a-9443-43eb1eecab5f", + "metadata": {}, + "outputs": [], + "source": [ + "query_engine = index.as_query_engine(\n", + " similarity_top_k=10,\n", + " node_postprocessors=[postprocessor],\n", + ")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "93871f9c-8871-4f43-8ee9-b3ca4e403d86", + "metadata": {}, + "source": [ + "### Test Queries" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "658d3092-7d86-4520-83a2-c3e630dc02b6", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Sam Altman initially declined the offer of becoming president of Y Combinator because he wanted to start a startup focused on making nuclear reactors.\n" + ] + } + ], + "source": [ + "response = query_engine.query(\n", + " \"Why did Sam Altman decline the offer of becoming president of Y Combinator?\",\n", + ")\n", + "\n", + "print(response)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "497e715e-3f7a-4140-a3ba-34356e473702", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Paul Graham started YC because he and his partners wanted to create an investment firm where they could implement their own ideas and provide the kind of support to startups that they felt was lacking when they were founders themselves. 
They aimed to not only make seed investments but also assist startups with various aspects of setting up a company, similar to the help they had received from others in the past.\n" + ] + } + ], + "source": [ + "response = query_engine.query(\n", + " \"Why did Paul Graham start YC?\",\n", + ")\n", + "\n", + "print(response)" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/docs/examples/agent/custom_agent.ipynb b/docs/examples/agent/custom_agent.ipynb index 7a26db4db1cfe..729d6cec4dd41 100644 --- a/docs/examples/agent/custom_agent.ipynb +++ b/docs/examples/agent/custom_agent.ipynb @@ -79,7 +79,7 @@ " Task,\n", " AgentChatResponse,\n", ")\n", - "from typing import Dict, Any, List, Tuple\n", + "from typing import Dict, Any, List, Tuple, Optional\n", "from llama_index.core.tools import BaseTool, QueryEngineTool\n", "from llama_index.core.program import LLMTextCompletionProgram\n", "from llama_index.core.output_parsers import PydanticOutputParser\n", @@ -200,7 +200,7 @@ " return {\"count\": 0, \"current_reasoning\": []}\n", "\n", " def _run_step(\n", - " self, state: Dict[str, Any], task: Task\n", + " self, state: Dict[str, Any], task: Task, input: Optional[str] = None\n", " ) -> Tuple[AgentChatResponse, bool]:\n", " \"\"\"Run step.\n", "\n", diff --git a/docs/examples/callbacks/LangfuseCallbackHandler.ipynb b/docs/examples/callbacks/LangfuseCallbackHandler.ipynb new file mode 100644 index 0000000000000..639178110583d --- /dev/null +++ b/docs/examples/callbacks/LangfuseCallbackHandler.ipynb @@ -0,0 +1,288 @@ +{ + "cells": [ + { + "attachments": {}, + "cell_type": "markdown", + "id": "d6509c3a", 
+ "metadata": {}, + "source": [ + "\"Open" + ] + }, + { + "cell_type": "markdown", + "id": "c0d8b66c", + "metadata": {}, + "source": [ + "# Langfuse Callback Handler\n", + "\n", + "[Langfuse](https://langfuse.com/docs) is an open source LLM engineering platform to help teams collaboratively debug, analyze and iterate on their LLM Applications.\n", + "\n", + "The `LangfuseCallbackHandler` is integrated with Langfuse and empowers you to seamlessly track and monitor performance, traces, and metrics of your LlamaIndex application. Detailed traces of the LlamaIndex context augmentation and the LLM querying processes are captured and can be inspected directly in the Langfuse UI." + ] + }, + { + "cell_type": "markdown", + "id": "4a59a00e", + "metadata": {}, + "source": [ + "![langfuse-tracing](https://static.langfuse.com/llamaindex-langfuse-docs.gif)" + ] + }, + { + "cell_type": "markdown", + "id": "3b9057da", + "metadata": {}, + "source": [ + "## Setup" + ] + }, + { + "cell_type": "markdown", + "id": "5d9dfc7f", + "metadata": {}, + "source": [ + "### Install packages" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "49c3527e", + "metadata": {}, + "outputs": [], + "source": [ + "%pip install llama-index llama-index-callbacks-langfuse" + ] + }, + { + "cell_type": "markdown", + "id": "bc10630b", + "metadata": {}, + "source": [ + "### Configure environment" + ] + }, + { + "cell_type": "markdown", + "id": "4c256817", + "metadata": {}, + "source": [ + "If you haven't done yet, [sign up on Langfuse](https://cloud.langfuse.com/auth/sign-up) and obtain your API keys from the project settings." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "787e836d", + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + "\n", + "# Langfuse\n", + "os.environ[\"LANGFUSE_SECRET_KEY\"] = \"sk-lf-...\"\n", + "os.environ[\"LANGFUSE_PUBLIC_KEY\"] = \"pk-lf-...\"\n", + "os.environ[\n", + " \"LANGFUSE_HOST\"\n", + "] = \"https://cloud.langfuse.com\" # 🇪🇺 EU region, 🇺🇸 US region: \"https://us.cloud.langfuse.com\"\n", + "\n", + "# OpenAI\n", + "os.environ[\"OPENAI_API_KEY\"] = \"sk-...\"" + ] + }, + { + "cell_type": "markdown", + "id": "1fe2ba01", + "metadata": {}, + "source": [ + "### Register the Langfuse callback handler" + ] + }, + { + "cell_type": "markdown", + "id": "cfef9ddc", + "metadata": {}, + "source": [ + "#### Option 1: Set global LlamaIndex handler" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "72afb2b9", + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.core import global_handler, set_global_handler\n", + "\n", + "set_global_handler(\"langfuse\")\n", + "langfuse_callback_handler = global_handler" + ] + }, + { + "cell_type": "markdown", + "id": "0e6557d2", + "metadata": {}, + "source": [ + "#### Option 2: Use Langfuse callback directly" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "4bdd95bf", + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.core import Settings\n", + "from llama_index.core.callbacks import CallbackManager\n", + "from langfuse.llama_index import LlamaIndexCallbackHandler\n", + "\n", + "langfuse_callback_handler = LlamaIndexCallbackHandler()\n", + "Settings.callback_manager = CallbackManager([langfuse_callback_handler])" + ] + }, + { + "cell_type": "markdown", + "id": "e3e03ce7", + "metadata": {}, + "source": [ + "### Flush events to Langfuse" + ] + }, + { + "cell_type": "markdown", + "id": "e2c811ec", + "metadata": {}, + "source": [ + "The Langfuse SDKs queue and batch events in the background to reduce the number of
network requests and improve overall performance. Before exiting your application, make sure all queued events have been flushed to Langfuse servers." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "4e28876c", + "metadata": {}, + "outputs": [], + "source": [ + "# ... your LlamaIndex calls here ...\n", + "\n", + "langfuse_callback_handler.flush()" + ] + }, + { + "cell_type": "markdown", + "id": "6b86f1b5", + "metadata": {}, + "source": [ + "Done!✨ Traces and metrics from your LlamaIndex application are now automatically tracked in Langfuse. If you construct a new index or query an LLM with your documents in context, your traces and metrics are immediately visible in the Langfuse UI. Next, let's take a look at how traces will look in Langfuse." + ] + }, + { + "cell_type": "markdown", + "id": "1f0d4465", + "metadata": {}, + "source": [ + "## Example" + ] + }, + { + "cell_type": "markdown", + "id": "8a9f3428", + "metadata": {}, + "source": [ + "Fetch and save example data." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "aa303ae3", + "metadata": {}, + "outputs": [], + "source": [ + "!mkdir -p 'data/'\n", + "!wget 'https://raw.githubusercontent.com/run-llama/llama_index/main/docs/examples/data/paul_graham/paul_graham_essay.txt' -O 'data/paul_graham_essay.txt'" + ] + }, + { + "cell_type": "markdown", + "id": "9f053996", + "metadata": {}, + "source": [ + "Run an example index construction, query, and chat." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "983cbedd", + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.core import SimpleDirectoryReader, VectorStoreIndex\n", + "\n", + "# Create index\n", + "documents = SimpleDirectoryReader(\"data\").load_data()\n", + "index = VectorStoreIndex.from_documents(documents)\n", + "\n", + "# Execute query\n", + "query_engine = index.as_query_engine()\n", + "query_response = query_engine.query(\"What did the author do growing up?\")\n", + "print(query_response)\n", + "\n", + "# Execute chat query\n", + "chat_engine = index.as_chat_engine()\n", + "chat_response = chat_engine.chat(\"What did the author do growing up?\")\n", + "print(chat_response)\n", + "\n", + "# As we want to immediately see result in Langfuse, we need to flush the callback handler\n", + "langfuse_callback_handler.flush()" + ] + }, + { + "cell_type": "markdown", + "id": "d5cdd88f", + "metadata": {}, + "source": [ + "Done!✨ You will now see traces of your index and query in your Langfuse project.\n", + "\n", + "Example traces (public links):\n", + "1. [Index construction](https://cloud.langfuse.com/project/clsuh9o2y0000mbztvdptt1mh/traces/1294ed01-8193-40a5-bb4e-2f0723d2c827)\n", + "2. [Query Engine](https://cloud.langfuse.com/project/clsuh9o2y0000mbztvdptt1mh/traces/eaa4ea74-78e0-42ef-ace0-7aa02c6fbbc6)\n", + "3. [Chat Engine](https://cloud.langfuse.com/project/clsuh9o2y0000mbztvdptt1mh/traces/d95914f5-66eb-4520-b996-49e84fd7f323)" + ] + }, + { + "cell_type": "markdown", + "id": "0b50845f", + "metadata": {}, + "source": [ + "## 📚 More details\n", + "\n", + "Check out the full [Langfuse documentation](https://langfuse.com/docs) for more details on Langfuse's tracing and analytics capabilities and how to make the most of this integration."
+ ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/docs/examples/callbacks/UpTrainCallback.ipynb b/docs/examples/callbacks/UpTrainCallback.ipynb index 7ccc72565c127..d4fb0947a7a31 100644 --- a/docs/examples/callbacks/UpTrainCallback.ipynb +++ b/docs/examples/callbacks/UpTrainCallback.ipynb @@ -13,30 +13,30 @@ "source": [ "# UpTrain Callback Handler\n", "\n", - "This notebook showcases the UpTrain callback handler seamlessly integrating into your pipeline, facilitating diverse evaluations. Three additional evaluations for Llamaindex have been introduced, complementing existing ones. These evaluations run automatically, with results displayed in the output. More details on UpTrain's evaluations can be found [here](https://github.com/uptrain-ai/uptrain?tab=readme-ov-file#pre-built-evaluations-we-offer-). \n", + "UpTrain ([github](https://github.com/uptrain-ai/uptrain) || [website](https://uptrain.ai/) || [docs](https://docs.uptrain.ai/)) is an open-source platform to evaluate and improve GenAI applications. It provides grades for 20+ preconfigured checks (covering language, code, embedding use cases), performs root cause analysis on failure cases and gives insights on how to resolve them. \n", "\n", - "Selected operators from the LlamaIndex pipeline are highlighted for demonstration:\n", + "This notebook showcases how to use UpTrain Callback Handler to evaluate different components of your RAG pipelines.\n", "\n", "## 1. **RAG Query Engine Evaluations**:\n", "The RAG query engine plays a crucial role in retrieving context and generating responses.
To ensure its performance and response quality, we conduct the following evaluations:\n", "\n", - "- **Context Relevance**: Determines if the context extracted from the query is relevant to the response.\n", - "- **Factual Accuracy**: Assesses if the LLM is hallcuinating or providing incorrect information.\n", - "- **Response Completeness**: Checks if the response contains all the information requested by the query.\n", + "- **[Context Relevance](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-relevance)**: Determines if the retrieved context has sufficient information to answer the user query or not.\n", + "- **[Factual Accuracy](https://docs.uptrain.ai/predefined-evaluations/context-awareness/factual-accuracy)**: Assesses if the LLM's response can be verified via the retrieved context.\n", + "- **[Response Completeness](https://docs.uptrain.ai/predefined-evaluations/response-quality/response-completeness)**: Checks if the response contains all the information required to answer the user query comprehensively.\n", "\n", "## 2. **Sub-Question Query Generation Evaluation**:\n", - "The SubQuestionQueryGeneration operator decomposes a question into sub-questions, generating responses for each using a RAG query engine. Given the complexity, we include the previous evaluations and add:\n", + "The SubQuestionQueryGeneration operator decomposes a question into sub-questions, generating responses for each using a RAG query engine. To measure its accuracy, we use:\n", "\n", - "- **Sub Query Completeness**: Assures that the sub-questions accurately and comprehensively cover the original query.\n", + "- **[Sub Query Completeness](https://docs.uptrain.ai/predefined-evaluations/query-quality/sub-query-completeness)**: Assures that the sub-questions accurately and comprehensively cover the original query.\n", "\n", "## 3. **Re-Ranking Evaluations**:\n", - "Re-ranking involves reordering nodes based on relevance to the query and chosing top n nodes.
Different evaluations are performed based on the number of nodes returned after re-ranking.\n", + "Re-ranking involves reordering nodes based on relevance to the query and choosing the top nodes. Different evaluations are performed based on the number of nodes returned after re-ranking.\n", "\n", "a. Same Number of Nodes\n", - "- **Context Reranking**: Checks if the order of re-ranked nodes is more relevant to the query than the original order.\n", + "- **[Context Reranking](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-reranking)**: Checks if the order of re-ranked nodes is more relevant to the query than the original order.\n", "\n", "b. Different Number of Nodes:\n", - "- **Context Conciseness**: Examines whether the reduced number of nodes still provides all the required information.\n", + "- **[Context Conciseness](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-conciseness)**: Examines whether the reduced number of nodes still provides all the required information.\n", "\n", "These evaluations collectively ensure the robustness and effectiveness of the RAG query engine, SubQuestionQueryGeneration operator, and the re-ranking process in the LlamaIndex pipeline." ] @@ -47,7 +47,7 @@ "source": [ "#### **Note:** \n", "- We have performed evaluations using basic RAG query engine, the same evaluations can be performed using the advanced RAG query engine as well.\n", - "- Same is true for Re-Ranking evaluations, we have performed evaluations using CohereRerank, the same evaluations can be performed using other re-rankers as well." + "- Same is true for Re-Ranking evaluations, we have performed evaluations using SentenceTransformerRerank, the same evaluations can be performed using other re-rankers as well." 
] }, { @@ -65,10 +65,9 @@ "metadata": {}, "outputs": [], "source": [ - "%pip install llama-index-postprocessor-cohere-rerank\n", "%pip install llama-index-readers-web\n", - "%pip install llama-index-callback-uptrain\n", - "%pip install -q html2text llama-index pandas tqdm uptrain cohere" + "%pip install llama-index-callbacks-uptrain\n", + "%pip install -q html2text llama-index pandas tqdm uptrain torch sentence-transformers" ] }, { @@ -84,15 +83,14 @@ "metadata": {}, "outputs": [], "source": [ - "from llama_index.core.settings import Settings\n", - "from llama_index.core import VectorStoreIndex\n", + "from llama_index.core import Settings, VectorStoreIndex\n", "from llama_index.core.node_parser import SentenceSplitter\n", "from llama_index.readers.web import SimpleWebPageReader\n", "from llama_index.core.callbacks import CallbackManager\n", "from llama_index.callbacks.uptrain.base import UpTrainCallbackHandler\n", "from llama_index.core.query_engine import SubQuestionQueryEngine\n", "from llama_index.core.tools import QueryEngineTool, ToolMetadata\n", - "from llama_index.core.postprocessor.llm_rerank import LLMRerank\n", + "from llama_index.core.postprocessor import SentenceTransformerRerank\n", "from llama_index.llms.openai import OpenAI\n", "\n", "import os" @@ -141,11 +139,16 @@ "metadata": {}, "outputs": [], "source": [ + "os.environ[\n", + " \"OPENAI_API_KEY\"\n", + "] = \"sk-************\" # Replace with your OpenAI API key\n", + "\n", "callback_handler = UpTrainCallbackHandler(\n", " key_type=\"openai\",\n", - " api_key=\"sk-...\", # replace with your OpenAI API key\n", + " api_key=os.environ[\"OPENAI_API_KEY\"],\n", " project_name_prefix=\"llama\",\n", ")\n", + "\n", "Settings.callback_manager = CallbackManager([callback_handler])" ] }, @@ -200,9 +203,9 @@ "metadata": {}, "source": [ "UpTrain callback handler will automatically capture the query, context and response once generated and will run the following three evaluations *(Graded from 0 to 1)* on the 
response:\n", - "- **Context Relevance**: Check if the context extractedfrom the query is relevant to the response.\n", - "- **Factual Accuracy**: Check how factually accurate the response is.\n", - "- **Response Completeness**: Check if the response contains all the information that the query is asking for." + "- **[Context Relevance](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-relevance)**: Determines if the retrieved context has sufficient information to answer the user query or not.\n", + "- **[Factual Accuracy](https://docs.uptrain.ai/predefined-evaluations/context-awareness/factual-accuracy)**: Assesses if the LLM's response can be verified via the retrieved context.\n", + "- **[Response Completeness](https://docs.uptrain.ai/predefined-evaluations/response-quality/response-completeness)**: Checks if the response contains all the information required to answer the user query comprehensively." ] }, { @@ -214,7 +217,10 @@ "name": "stderr", "output_type": "stream", "text": [ - "\u001b[32m2024-02-14 16:04:09.869\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36muptrain.framework.evalllm\u001b[0m:\u001b[36mevaluate\u001b[0m:\u001b[36m110\u001b[0m - \u001b[1mSending evaluation request for rows 0 to <50 to the Uptrain\u001b[0m\n" + "100%|██████████| 1/1 [00:01<00:00, 1.33s/it]\n", + "100%|██████████| 1/1 [00:01<00:00, 1.36s/it]\n", + "100%|██████████| 1/1 [00:03<00:00, 3.50s/it]\n", + "100%|██████████| 1/1 [00:01<00:00, 1.32s/it]\n" ] }, { @@ -223,8 +229,9 @@ "text": [ "\n", "Question: What did Paul Graham do growing up?\n", - "Response: Growing up, Paul Graham worked on writing and programming. He wrote short stories and also tried his hand at programming on the IBM 1401 computer that his school district had. 
He later got a microcomputer, a TRS-80, and started programming more extensively, creating simple games and even a word processor.\n", - "Context Relevance Score: 0.5\n", + "Response: Growing up, Paul Graham worked on writing short stories and programming. He started programming on an IBM 1401 in 9th grade using an early version of Fortran. Later, he got a TRS-80 computer and wrote simple games, a rocket prediction program, and a word processor. Despite his interest in programming, he initially planned to study philosophy in college before eventually switching to AI.\n", + "\n", + "Context Relevance Score: 0.0\n", "Factual Accuracy Score: 1.0\n", "Response Completeness Score: 1.0\n", "\n" @@ -234,7 +241,10 @@ "name": "stderr", "output_type": "stream", "text": [ - "\u001b[32m2024-02-14 16:04:36.895\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36muptrain.framework.evalllm\u001b[0m:\u001b[36mevaluate\u001b[0m:\u001b[36m110\u001b[0m - \u001b[1mSending evaluation request for rows 0 to <50 to the Uptrain\u001b[0m\n" + "100%|██████████| 1/1 [00:01<00:00, 1.59s/it]\n", + "100%|██████████| 1/1 [00:00<00:00, 1.01it/s]\n", + "100%|██████████| 1/1 [00:01<00:00, 1.76s/it]\n", + "100%|██████████| 1/1 [00:01<00:00, 1.28s/it]\n" ] }, { @@ -243,10 +253,11 @@ "text": [ "\n", "Question: When and how did Paul Graham's mother die?\n", - "Response: The context information does not provide any information about Paul Graham's mother or her death.\n", + "Response: Paul Graham's mother died when he was 18 years old, from a brain tumor.\n", + "\n", "Context Relevance Score: 0.0\n", "Factual Accuracy Score: 0.0\n", - "Response Completeness Score: 0.0\n", + "Response Completeness Score: 0.5\n", "\n" ] }, @@ -254,7 +265,10 @@ "name": "stderr", "output_type": "stream", "text": [ - "\u001b[32m2024-02-14 16:04:55.245\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36muptrain.framework.evalllm\u001b[0m:\u001b[36mevaluate\u001b[0m:\u001b[36m110\u001b[0m - \u001b[1mSending evaluation request for rows 0 to 
<50 to the Uptrain\u001b[0m\n" + "100%|██████████| 1/1 [00:01<00:00, 1.75s/it]\n", + "100%|██████████| 1/1 [00:01<00:00, 1.55s/it]\n", + "100%|██████████| 1/1 [00:03<00:00, 3.39s/it]\n", + "100%|██████████| 1/1 [00:01<00:00, 1.48s/it]\n" ] }, { @@ -263,10 +277,11 @@ "text": [ "\n", "Question: What, in Paul Graham's opinion, is the most distinctive thing about YC?\n", - "Response: The most distinctive thing about YC, according to Paul Graham's opinion, is that it provides a sense of community and support for startup founders. It solves the problem of isolation that founders often face by connecting them with colleagues who understand the challenges they are going through and can offer guidance and support. Additionally, YC fosters a tight-knit alumni community where startups can help each other and even become each other's customers.\n", - "Context Relevance Score: 0.0\n", - "Factual Accuracy Score: 1.0\n", - "Response Completeness Score: 0.5\n", + "Response: The most distinctive thing about Y Combinator, according to Paul Graham, is that instead of deciding for himself what to work on, the problems come to him. Every 6 months, a new batch of startups brings their problems, which then become the focus of YC. 
This engagement with a variety of startup problems and the direct involvement in solving them is what Graham finds most unique about Y Combinator.\n", + "\n", + "Context Relevance Score: 1.0\n", + "Factual Accuracy Score: 0.3333333333333333\n", + "Response Completeness Score: 1.0\n", "\n" ] }, @@ -274,7 +289,10 @@ "name": "stderr", "output_type": "stream", "text": [ - "\u001b[32m2024-02-14 16:05:24.705\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36muptrain.framework.evalllm\u001b[0m:\u001b[36mevaluate\u001b[0m:\u001b[36m110\u001b[0m - \u001b[1mSending evaluation request for rows 0 to <50 to the Uptrain\u001b[0m\n" + "100%|██████████| 1/1 [00:01<00:00, 1.92s/it]\n", + "100%|██████████| 1/1 [00:00<00:00, 1.20it/s]\n", + "100%|██████████| 1/1 [00:02<00:00, 2.15s/it]\n", + "100%|██████████| 1/1 [00:01<00:00, 1.08s/it]\n" ] }, { @@ -283,9 +301,10 @@ "text": [ "\n", "Question: When and how did Paul Graham meet Jessica Livingston?\n", - "Response: Paul Graham met Jessica Livingston at a party at his house in October 2003. They were introduced to each other by a mutual friend named Maria Daniels. 
A couple of days later, Paul asked Jessica out and they started dating.\n", - "Context Relevance Score: 0.5\n", - "Factual Accuracy Score: 1.0\n", + "Response: Paul Graham met Jessica Livingston at a big party at his house in October 2003.\n", + "\n", + "Context Relevance Score: 1.0\n", + "Factual Accuracy Score: 0.5\n", "Response Completeness Score: 1.0\n", "\n" ] @@ -294,7 +313,10 @@ "name": "stderr", "output_type": "stream", "text": [ - "\u001b[32m2024-02-14 16:05:52.062\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36muptrain.framework.evalllm\u001b[0m:\u001b[36mevaluate\u001b[0m:\u001b[36m110\u001b[0m - \u001b[1mSending evaluation request for rows 0 to <50 to the Uptrain\u001b[0m\n" + "100%|██████████| 1/1 [00:01<00:00, 1.82s/it]\n", + "100%|██████████| 1/1 [00:01<00:00, 1.14s/it]\n", + "100%|██████████| 1/1 [00:03<00:00, 3.19s/it]\n", + "100%|██████████| 1/1 [00:01<00:00, 1.50s/it]" ] }, { @@ -303,10 +325,18 @@ "text": [ "\n", "Question: What is Bel, and when and where was it written?\n", - "Response: Bel is a new Lisp that was written in Arc. It was written over a period of 4 years, from March 26, 2015, to October 12, 2019. The majority of Bel was written in England, as the author moved there in the summer of 2016.\n", + "Response: Bel is a new Lisp that was written in Arc. It was developed over a period of 4 years, from March 26, 2015 to October 12, 2019. The majority of Bel was written in England.\n", + "\n", "Context Relevance Score: 1.0\n", "Factual Accuracy Score: 1.0\n", - "Response Completeness Score: 0.5\n", + "Response Completeness Score: 1.0\n", + "\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ "\n" ] } @@ -348,15 +378,15 @@ "source": [ "# 2. Sub-Question Query Engine Evaluation\n", "\n", - "The **sub question query engine** is used to tackle the problem of answering a complex query using multiple data sources. 
It first breaks down the complex query into sub questions for each relevant data source, then gather all the intermediate reponses and synthesizes a final response.\n", + "The **sub-question query engine** is used to tackle the problem of answering a complex query using multiple data sources. It first breaks down the complex query into sub-questions for each relevant data source, then gathers all the intermediate responses and synthesizes a final response.\n", "\n", "UpTrain callback handler will automatically capture the sub-question and the responses for each of them once generated and will run the following three evaluations *(Graded from 0 to 1)* on the response:\n", - "- **Context Relevance**: Check if the context extractedfrom the query is relevant to the response.\n", - "- **Factual Accuracy**: Check how factually accurate the response is.\n", - "- **Response Completeness**: Check if the response contains all the information that the query is asking for.\n", + "- **[Context Relevance](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-relevance)**: Determines if the retrieved context has sufficient information to answer the user query or not.\n", + "- **[Factual Accuracy](https://docs.uptrain.ai/predefined-evaluations/context-awareness/factual-accuracy)**: Assesses if the LLM's response can be verified via the retrieved context.\n", + "- **[Response Completeness](https://docs.uptrain.ai/predefined-evaluations/response-quality/response-completeness)**: Checks if the response contains all the information required to answer the user query comprehensively.\n", "\n", "In addition to the above evaluations, the callback handler will also run the following evaluation:\n", - "- **Sub Query Completeness**: Checks if the sub-questions accurately and completely cover the original query." 
+ "- **[Sub Query Completeness](https://docs.uptrain.ai/predefined-evaluations/query-quality/sub-query-completeness)**: Assures that the sub-questions accurately and comprehensively cover the original query." ] }, { @@ -372,9 +402,9 @@ "\u001b[1;3;38;2;237;90;200m[documents] Q: What did Paul Graham work on before YC?\n", "\u001b[0m\u001b[1;3;38;2;90;149;237m[documents] Q: What did Paul Graham work on during YC?\n", "\u001b[0m\u001b[1;3;38;2;11;159;203m[documents] Q: What did Paul Graham work on after YC?\n", - "\u001b[0m\u001b[1;3;38;2;237;90;200m[documents] A: Before Y Combinator (YC), Paul Graham worked on a startup called Viaweb.\n", - "\u001b[0m\u001b[1;3;38;2;11;159;203m[documents] A: After leaving Y Combinator, Paul Graham focused on painting. He wanted to see how good he could get at painting if he dedicated his time and effort to it. He spent most of 2014 working on his painting skills, but eventually ran out of steam in November.\n", - "\u001b[0m\u001b[1;3;38;2;90;149;237m[documents] A: During his time at Y Combinator (YC), Paul Graham worked on various projects. He initially intended to work on three things: hacking, writing essays, and working on YC. However, as YC grew and he became more excited about it, it started to take up a lot more of his attention. 
He also worked on writing essays and was responsible for writing all of YC's internal software in Arc.\n", + "\u001b[0m\u001b[1;3;38;2;11;159;203m[documents] A: After Y Combinator, Paul Graham decided to focus on painting as his next endeavor.\n", + "\u001b[0m\u001b[1;3;38;2;90;149;237m[documents] A: Paul Graham worked on writing essays and working on Y Combinator during YC.\n", + "\u001b[0m\u001b[1;3;38;2;237;90;200m[documents] A: Before Y Combinator, Paul Graham worked on projects with his colleagues Robert and Trevor.\n", "\u001b[0m" ] }, @@ -382,40 +412,65 @@ "name": "stderr", "output_type": "stream", "text": [ - "\u001b[32m2024-02-14 08:24:08.958\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36muptrain.framework.evalllm\u001b[0m:\u001b[36mevaluate\u001b[0m:\u001b[36m110\u001b[0m - \u001b[1mSending evaluation request for rows 0 to <50 to the Uptrain\u001b[0m\n", - "\u001b[32m2024-02-14 08:24:34.450\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36muptrain.framework.evalllm\u001b[0m:\u001b[36mevaluate\u001b[0m:\u001b[36m110\u001b[0m - \u001b[1mSending evaluation request for rows 0 to <50 to the Uptrain\u001b[0m\n" + "100%|██████████| 3/3 [00:02<00:00, 1.47it/s]\n", + "100%|██████████| 3/3 [00:00<00:00, 3.28it/s]\n", + "100%|██████████| 3/3 [00:01<00:00, 1.68it/s]\n", + "100%|██████████| 3/3 [00:01<00:00, 2.28it/s]\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\n", - "Question: What did Paul Graham work on before YC?\n", - "Response: Before Y Combinator (YC), Paul Graham worked on a startup called Viaweb.\n", - "Context Relevance Score: 0.0\n", - "Factual Accuracy Score: 1.0\n", - "Response Completeness Score: 0.5\n", - "\n", "\n", "Question: What did Paul Graham work on after YC?\n", - "Response: After leaving Y Combinator, Paul Graham focused on painting. He wanted to see how good he could get at painting if he dedicated his time and effort to it. 
He spent most of 2014 working on his painting skills, but eventually ran out of steam in November.\n", - "Context Relevance Score: 1.0\n", + "Response: After Y Combinator, Paul Graham decided to focus on painting as his next endeavor.\n", + "\n", + "Context Relevance Score: 0.0\n", "Factual Accuracy Score: 0.0\n", - "Response Completeness Score: 0.0\n", + "Response Completeness Score: 0.5\n", "\n", "\n", "Question: What did Paul Graham work on during YC?\n", - "Response: During his time at Y Combinator (YC), Paul Graham worked on various projects. He initially intended to work on three things: hacking, writing essays, and working on YC. However, as YC grew and he became more excited about it, it started to take up a lot more of his attention. He also worked on writing essays and was responsible for writing all of YC's internal software in Arc.\n", - "Context Relevance Score: 0.5\n", + "Response: Paul Graham worked on writing essays and working on Y Combinator during YC.\n", + "\n", + "Context Relevance Score: 0.0\n", "Factual Accuracy Score: 1.0\n", "Response Completeness Score: 0.5\n", "\n", + "\n", + "Question: What did Paul Graham work on before YC?\n", + "Response: Before Y Combinator, Paul Graham worked on projects with his colleagues Robert and Trevor.\n", + "\n", + "Context Relevance Score: 0.0\n", + "Factual Accuracy Score: 0.0\n", + "Response Completeness Score: 0.5\n", + "\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "100%|██████████| 1/1 [00:01<00:00, 1.24s/it]" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ "\n", "Question: How was Paul Grahams life different before, during, and after YC?\n", "Sub Query Completeness Score: 1.0\n", "\n" ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "\n" + ] } ], "source": [ @@ -465,7 +520,7 @@ "source": [ "# 3. Re-ranking \n", "\n", - "Re-ranking is the process of reordering the nodes based on their relevance to the query. 
There are multiple classes of re-ranking algorithms offered by Llamaindex. We have used CohereRerank for this example.\n", + "Re-ranking is the process of reordering the nodes based on their relevance to the query. There are multiple classes of re-ranking algorithms offered by Llamaindex. We have used LLMRerank for this example.\n", "\n", "The re-ranker allows you to enter the number of top n nodes that will be returned after re-ranking. If this value remains the same as the original number of nodes, the re-ranker will only re-rank the nodes and not change the number of nodes. Otherwise, it will re-rank the nodes and return the top n nodes.\n", "\n", @@ -479,7 +534,8 @@ "## 3a. Re-ranking (With same number of nodes)\n", "\n", "If the number of nodes returned after re-ranking is the same as the original number of nodes, the following evaluation will be performed:\n", - "- **Context Reranking**: Check if the order of the re-ranked nodes is more relevant to the query than the original order." + "\n", + "- **[Context Reranking](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-reranking)**: Checks if the order of re-ranked nodes is more relevant to the query than the original order." 
] }, { @@ -491,7 +547,7 @@ "name": "stderr", "output_type": "stream", "text": [ - "\u001b[32m2024-02-13 20:00:17.459\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36muptrain.framework.evalllm\u001b[0m:\u001b[36mevaluate\u001b[0m:\u001b[36m110\u001b[0m - \u001b[1mSending evaluation request for rows 0 to <50 to the Uptrain\u001b[0m\n" + "100%|██████████| 1/1 [00:01<00:00, 1.89s/it]\n" ] }, { @@ -500,28 +556,62 @@ "text": [ "\n", "Question: What did Sam Altman do in this essay?\n", + "Context Reranking Score: 1.0\n", + "\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "100%|██████████| 1/1 [00:01<00:00, 1.88s/it]\n", + "100%|██████████| 1/1 [00:01<00:00, 1.44s/it]\n", + "100%|██████████| 1/1 [00:02<00:00, 2.77s/it]\n", + "100%|██████████| 1/1 [00:01<00:00, 1.45s/it]" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "Question: What did Sam Altman do in this essay?\n", + "Response: Sam Altman was asked to become the president of Y Combinator after the original founders decided to step down and reorganize the company for long-term sustainability.\n", + "\n", "Context Relevance Score: 1.0\n", "Factual Accuracy Score: 1.0\n", - "Response Completeness Score: 1.0\n", + "Response Completeness Score: 0.5\n", + "\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ "\n" ] } ], "source": [ - "os.environ[\"OPENAI_API_KEY\"] = \"sk-...\" # Replace with your OpenAI API key\n", - "llm = OpenAI(model=\"gpt-4-turbo-preview\")\n", + "callback_handler = UpTrainCallbackHandler(\n", + " key_type=\"openai\",\n", + " api_key=os.environ[\"OPENAI_API_KEY\"],\n", + " project_name_prefix=\"llama\",\n", + ")\n", + "Settings.callback_manager = CallbackManager([callback_handler])\n", "\n", - "cohere_rerank = LLMRerank(\n", - " llm=llm, top_n=5\n", - ") # In this example, the number of nodes before re-ranking is 5 and after re-ranking is also 5.\n", + "rerank_postprocessor = SentenceTransformerRerank(\n", + " top_n=3, 
# number of nodes after reranking\n", + " keep_retrieval_score=True,\n", + ")\n", "\n", "index = VectorStoreIndex.from_documents(\n", " documents=documents,\n", ")\n", "\n", "query_engine = index.as_query_engine(\n", - " similarity_top_k=10,\n", - " node_postprocessors=[cohere_rerank],\n", + " similarity_top_k=3, # number of nodes before reranking\n", + " node_postprocessors=[rerank_postprocessor],\n", ")\n", "\n", "response = query_engine.query(\n", @@ -536,7 +626,8 @@ "# 3b. Re-ranking (With different number of nodes)\n", "\n", "If the number of nodes returned after re-ranking is the lesser as the original number of nodes, the following evaluation will be performed:\n", - "- **Context Conciseness**: If the re-ranked nodes are able to provide all the information required by the query." + "\n", + "- **[Context Conciseness](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-conciseness)**: Examines whether the reduced number of nodes still provides all the required information." 
] }, { @@ -548,7 +639,27 @@ "name": "stderr", "output_type": "stream", "text": [ - "\u001b[32m2024-02-13 20:01:39.343\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36muptrain.framework.evalllm\u001b[0m:\u001b[36mevaluate\u001b[0m:\u001b[36m110\u001b[0m - \u001b[1mSending evaluation request for rows 0 to <50 to the Uptrain\u001b[0m\n" + "100%|██████████| 1/1 [00:02<00:00, 2.22s/it]\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "Question: What did Sam Altman do in this essay?\n", + "Context Conciseness Score: 0.0\n", + "\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "100%|██████████| 1/1 [00:01<00:00, 1.58s/it]\n", + "100%|██████████| 1/1 [00:00<00:00, 1.19it/s]\n", + "100%|██████████| 1/1 [00:01<00:00, 1.62s/it]\n", + "100%|██████████| 1/1 [00:01<00:00, 1.42s/it]" ] }, { @@ -557,27 +668,41 @@ "text": [ "\n", "Question: What did Sam Altman do in this essay?\n", - "Context Relevance Score: 0.5\n", + "Response: Sam Altman offered unsolicited advice to the author during a visit to California for interviews.\n", + "\n", + "Context Relevance Score: 0.0\n", "Factual Accuracy Score: 1.0\n", - "Response Completeness Score: 1.0\n", + "Response Completeness Score: 0.5\n", + "\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ "\n" ] } ], "source": [ - "os.environ[\"OPENAI_API_KEY\"] = \"sk-...\" # Replace with your OpenAI API key\n", - "llm = OpenAI(model=\"gpt-4-turbo-preview\")\n", + "callback_handler = UpTrainCallbackHandler(\n", + " key_type=\"openai\",\n", + " api_key=os.environ[\"OPENAI_API_KEY\"],\n", + " project_name_prefix=\"llama\",\n", + ")\n", + "Settings.callback_manager = CallbackManager([callback_handler])\n", "\n", - "cohere_rerank = LLMRerank(\n", - " llm=llm, top_n=2\n", - ") # In this example, the number of nodes before re-ranking is 5 and after re-ranking is 2.\n", + "rerank_postprocessor = SentenceTransformerRerank(\n", + " top_n=2, # Number of nodes after 
re-ranking\n", + " keep_retrieval_score=True,\n", + ")\n", "\n", "index = VectorStoreIndex.from_documents(\n", " documents=documents,\n", ")\n", "query_engine = index.as_query_engine(\n", - " similarity_top_k=10,\n", - " node_postprocessors=[cohere_rerank],\n", + " similarity_top_k=5, # Number of nodes before re-ranking\n", + " node_postprocessors=[rerank_postprocessor],\n", ")\n", "\n", "# Use your advanced RAG\n", @@ -592,14 +717,7 @@ "source": [ "# UpTrain's Managed Service Dashboard and Insights\n", "\n", - "The UpTrain Managed Service offers the following features:\n", - "\n", - "1. Advanced dashboards with drill-down and filtering options.\n", - "1. Identification of insights and common themes among unsuccessful cases.\n", - "1. Real-time observability and monitoring of production data.\n", - "1. Integration with CI/CD pipelines for seamless regression testing.\n", - "\n", - "To define the UpTrain callback handler, the only change required is to set the `key_type` and `api_key` parameters. The rest of the code remains the same.\n", + "To use the UpTrain's managed service via the UpTrain callback handler, the only change required is to set the `key_type` and `api_key` parameters. 
The rest of the code remains the same.\n", "\n", "```python\n", "callback_handler = UpTrainCallbackHandler(\n", @@ -622,7 +740,7 @@ ], "metadata": { "kernelspec": { - "display_name": "phoenixdev", + "display_name": "Python 3 (ipykernel)", "language": "python", "name": "python3" }, @@ -639,5 +757,5 @@ } }, "nbformat": 4, - "nbformat_minor": 2 + "nbformat_minor": 4 } diff --git a/docs/examples/customization/prompts/chat_prompts.ipynb b/docs/examples/customization/prompts/chat_prompts.ipynb index 8efc743c68d8c..18a4408e92d4c 100644 --- a/docs/examples/customization/prompts/chat_prompts.ipynb +++ b/docs/examples/customization/prompts/chat_prompts.ipynb @@ -8,7 +8,6 @@ ] }, { - "attachments": {}, "cell_type": "markdown", "metadata": {}, "source": [ @@ -41,13 +40,51 @@ ] }, { - "attachments": {}, "cell_type": "markdown", "metadata": {}, "source": [ "## Prompt Setup\n", "\n", - "Below, we take the default prompts and customize them to always answer, even if the context is not helpful." + "Below, we take the default prompts and customize them to always answer, even if the context is not helpful.\n", + "\n", + "We show two ways of setting up the prompts:\n", + "1. Explicitly define ChatMessage and MessageRole objects.\n", + "2. 
Call ChatPromptTemplate.from_messages" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "qa_prompt_str = (\n", + " \"Context information is below.\\n\"\n", + " \"---------------------\\n\"\n", + " \"{context_str}\\n\"\n", + " \"---------------------\\n\"\n", + " \"Given the context information and not prior knowledge, \"\n", + " \"answer the question: {query_str}\\n\"\n", + ")\n", + "\n", + "refine_prompt_str = (\n", + " \"We have the opportunity to refine the original answer \"\n", + " \"(only if needed) with some more context below.\\n\"\n", + " \"------------\\n\"\n", + " \"{context_msg}\\n\"\n", + " \"------------\\n\"\n", + " \"Given the new context, refine the original answer to better \"\n", + " \"answer the question: {query_str}. \"\n", + " \"If the context isn't useful, output the original answer again.\\n\"\n", + " \"Original Answer: {existing_answer}\"\n", + ")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### 1. 
Explicitly Define `ChatMessage` and `MessageRole` objects" ] }, { @@ -67,17 +104,7 @@ " \"Always answer the question, even if the context isn't helpful.\"\n", " ),\n", " ),\n", - " ChatMessage(\n", - " role=MessageRole.USER,\n", - " content=(\n", - " \"Context information is below.\\n\"\n", - " \"---------------------\\n\"\n", - " \"{context_str}\\n\"\n", - " \"---------------------\\n\"\n", - " \"Given the context information and not prior knowledge, \"\n", - " \"answer the question: {query_str}\\n\"\n", - " ),\n", - " ),\n", + " ChatMessage(role=MessageRole.USER, content=qa_prompt_str),\n", "]\n", "text_qa_template = ChatPromptTemplate(chat_text_qa_msgs)\n", "\n", @@ -89,26 +116,50 @@ " \"Always answer the question, even if the context isn't helpful.\"\n", " ),\n", " ),\n", - " ChatMessage(\n", - " role=MessageRole.USER,\n", - " content=(\n", - " \"We have the opportunity to refine the original answer \"\n", - " \"(only if needed) with some more context below.\\n\"\n", - " \"------------\\n\"\n", - " \"{context_msg}\\n\"\n", - " \"------------\\n\"\n", - " \"Given the new context, refine the original answer to better \"\n", - " \"answer the question: {query_str}. \"\n", - " \"If the context isn't useful, output the original answer again.\\n\"\n", - " \"Original Answer: {existing_answer}\"\n", - " ),\n", - " ),\n", + " ChatMessage(role=MessageRole.USER, content=refine_prompt_str),\n", "]\n", "refine_template = ChatPromptTemplate(chat_refine_msgs)" ] }, { - "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "#### 2. Call `ChatPromptTemplate.from_messages`\n", + "\n", + "`from_messages` is syntatic sugar that allows you to define a chat prompt template as a list of tuples, with each tuple corresponding to a chat message (\"role\", \"message\"). 
" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.core import ChatPromptTemplate\n", + "\n", + "# Text QA Prompt\n", + "chat_text_qa_msgs = [\n", + " (\n", + " \"system\",\n", + " \"Always answer the question, even if the context isn't helpful.\",\n", + " ),\n", + " (\"user\", qa_prompt_str),\n", + "]\n", + "text_qa_template = ChatPromptTemplate.from_messages(chat_text_qa_msgs)\n", + "\n", + "# Refine Prompt\n", + "chat_refine_msgs = [\n", + " (\n", + " \"system\",\n", + " \"Always answer the question, even if the context isn't helpful.\",\n", + " ),\n", + " (\"user\", refine_prompt_str),\n", + "]\n", + "refine_template = ChatPromptTemplate.from_messages(chat_refine_msgs)" + ] + }, + { "cell_type": "markdown", "metadata": {}, "source": [ @@ -165,7 +216,6 @@ ] }, { - "attachments": {}, "cell_type": "markdown", "metadata": {}, "source": [ @@ -181,7 +231,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "I'm sorry, but the given context does not provide any information about Joe Biden.\n" + "I'm unable to provide an answer to that question based on the context information provided.\n" ] } ], @@ -190,7 +240,6 @@ ] }, { - "attachments": {}, "cell_type": "markdown", "metadata": {}, "source": [ @@ -206,7 +255,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "Joe Biden is the 46th President of the United States.\n" + "Joe Biden is the current President of the United States, having taken office in January 2021. 
He previously served as Vice President under President Barack Obama from 2009 to 2017.\n" ] } ], @@ -223,9 +272,9 @@ ], "metadata": { "kernelspec": { - "display_name": "Python 3 (ipykernel)", + "display_name": "llama_index_v3", "language": "python", - "name": "python3" + "name": "llama_index_v3" }, "language_info": { "codemirror_mode": { diff --git a/docs/examples/discover_llamaindex/document_management/BUILD b/docs/examples/discover_llamaindex/document_management/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/docs/examples/discover_llamaindex/document_management/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/docs/examples/embeddings/bedrock.ipynb b/docs/examples/embeddings/bedrock.ipynb index ef727d08147c5..45bcc63e8328e 100644 --- a/docs/examples/embeddings/bedrock.ipynb +++ b/docs/examples/embeddings/bedrock.ipynb @@ -41,12 +41,12 @@ "metadata": {}, "outputs": [], "source": [ - "embed_model = BedrockEmbedding.from_credentials(\n", + "embed_model = BedrockEmbedding(\n", " aws_access_key_id=os.getenv(\"AWS_ACCESS_KEY_ID\"),\n", " aws_secret_access_key=os.getenv(\"AWS_SECRET_ACCESS_KEY\"),\n", " aws_session_token=os.getenv(\"AWS_SESSION_TOKEN\"),\n", - " aws_region=\"\",\n", - " aws_profile=\"\",\n", + " region_name=\"\",\n", + " profile_name=\"\",\n", ")" ] }, @@ -97,9 +97,7 @@ "source": [ "from llama_index.embeddings.bedrock import BedrockEmbedding\n", "\n", - "model = BedrockEmbedding().from_credentials(\n", - " model_name=\"amazon.titan-embed-g1-text-02\"\n", - ")\n", + "model = BedrockEmbedding(model=\"amazon.titan-embed-g1-text-02\")\n", "embeddings = model.get_text_embedding(\"hello world\")\n", "print(embeddings)" ] @@ -119,15 +117,13 @@ "metadata": {}, "outputs": [], "source": [ - "model = BedrockEmbedding().from_credentials(\n", - " model_name=\"cohere.embed-english-v3\"\n", - ")\n", - "coherePayload = {\n", - " \"texts\": [\"This is a test document\", \"This is another test document\"],\n", - " \"input_type\": 
\"search_document\",\n", - " \"truncate\": \"NONE\",\n", - "}\n", - "embeddings = model.get_text_embedding(coherePayload)\n", + "model = BedrockEmbedding(model=\"cohere.embed-english-v3\")\n", + "coherePayload = [\"This is a test document\", \"This is another test document\"]\n", + "\n", + "embed1 = model.get_text_embedding(\"This is a test document\")\n", + "print(embed1)\n", + "\n", + "embeddings = model.get_text_embedding_batch(coherePayload)\n", "print(embeddings)" ] }, @@ -144,18 +140,16 @@ "metadata": {}, "outputs": [], "source": [ - "model = BedrockEmbedding().from_credentials(\n", - " model_name=\"cohere.embed-multilingual-v3\"\n", - ")\n", - "coherePayload = {\n", - " \"texts\": [\n", - " \"This is a test document\",\n", - " \"తెలుగు అనేది ద్రావిడ భాషల కుటుంబానికి చెందిన భాష.\",\n", - " ],\n", - " \"input_type\": \"search_document\",\n", - " \"truncate\": \"NONE\",\n", - "}\n", - "embeddings = model.get_text_embedding(coherePayload)\n", + "model = BedrockEmbedding(model=\"cohere.embed-multilingual-v3\")\n", + "coherePayload = [\n", + " \"This is a test document\",\n", + " \"తెలుగు అనేది ద్రావిడ భాషల కుటుంబానికి చెందిన భాష.\",\n", + " \"Esto es una prueba de documento multilingüe.\",\n", + " \"攻殻機動隊\",\n", + " \"Combien de temps ça va prendre ?\",\n", + " \"Документ проверен\",\n", + "]\n", + "embeddings = model.get_text_embedding_batch(coherePayload)\n", "print(embeddings)" ] } diff --git a/docs/examples/evaluation/UpTrain.ipynb b/docs/examples/evaluation/UpTrain.ipynb index 6cb85c2340c9e..ba718a41234dc 100644 --- a/docs/examples/evaluation/UpTrain.ipynb +++ b/docs/examples/evaluation/UpTrain.ipynb @@ -21,7 +21,7 @@ "id": "0958c248", "metadata": {}, "source": [ - "**Overview**: In this example, we will see how to use UpTrain with LlamaIndex. " + "**Overview**: In this example, we will see how to use UpTrain with LlamaIndex. 
UpTrain ([github](https://github.com/uptrain-ai/uptrain) || [website](https://github.com/uptrain-ai/uptrain/) || [docs](https://docs.uptrain.ai/)) is an open-source platform to evaluate and improve GenAI applications. It provides grades for 20+ preconfigured checks (covering language, code, embedding use cases), performs root cause analysis on failure cases and gives insights on how to resolve them. More details on UpTrain's evaluations can be found [here](https://github.com/uptrain-ai/uptrain?tab=readme-ov-file#pre-built-evaluations-we-offer-).\n" ] }, { @@ -49,12 +49,25 @@ "id": "0b101745", "metadata": {}, "source": [ - "## Install UpTrain and LlamaIndex\n", - "\n", - "\n", - "```bash\n", - "pip install uptrain llama_index\n", - "```" + "## Install UpTrain and LlamaIndex" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a6734276", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Note: you may need to restart the kernel to use updated packages.\n" + ] + } + ], + "source": [ + "%pip install -q uptrain llama-index" ] }, { @@ -70,14 +83,24 @@ "execution_count": null, "id": "6c6e7a1d", "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/Users/dhruvchawla/Work/llama_index/venv/lib/python3.11/site-packages/lazy_loader/__init__.py:185: RuntimeWarning: subpackages can technically be lazily loaded, but it causes the package to be eagerly loaded even if it is already lazily loaded.So, you probably shouldn't use subpackages with this lazy feature.\n", + " warnings.warn(msg, RuntimeWarning)\n" + ] + } + ], "source": [ + "import httpx\n", "import os\n", "import openai\n", "import pandas as pd\n", "\n", - "from llama_index.core import VectorStoreIndex, SimpleDirectoryReader\n", - "from uptrain import Evals, EvalLlamaIndex, Settings" + "from llama_index.core import VectorStoreIndex, SimpleDirectoryReader, Settings\n", + "from uptrain import 
Evals, EvalLlamaIndex, Settings as UpTrainSettings" ] }, { @@ -103,8 +126,6 @@ "dataset_path = os.path.join(\"./nyc_wikipedia\", \"nyc_text.txt\")\n", "\n", "if not os.path.exists(dataset_path):\n", - " import httpx\n", - "\n", " r = httpx.get(url)\n", " with open(dataset_path, \"wb\") as f:\n", " f.write(r.content)" @@ -176,8 +197,6 @@ "metadata": {}, "outputs": [], "source": [ - "from llama_index.core import Settings\n", - "\n", "Settings.chunk_size = 512\n", "\n", "documents = SimpleDirectoryReader(\"./nyc_wikipedia/\").load_data()\n", @@ -204,7 +223,7 @@ "metadata": {}, "outputs": [], "source": [ - "settings = Settings(\n", + "settings = UpTrainSettings(\n", " openai_api_key=openai.api_key,\n", ")" ] @@ -306,101 +325,101 @@ " 0\n", " What is the population of New York City?\n", " The population of New York City is 8,804,190 a...\n", - " New York, often called New York City or NYC, i...\n", - " 1.0\n", - " The question is asking for the population of N...\n", - " 1.0\n", - " The question asks for the population of New Yo...\n", + " === Population density ===\\n\\nIn 2020, the cit...\n", + " None\n", + " None\n", + " None\n", + " None\n", " \n", " \n", " 1\n", " What is the area of New York City?\n", " New York City has a total area of 468.484 squa...\n", - " New York, often called New York City or NYC, i...\n", - " 1.0\n", - " Step 1: The question asks for the area of New ...\n", - " 1.0\n", - " The question asks for the area of New York Cit...\n", + " Some of the natural relief in topography has b...\n", + " None\n", + " None\n", + " None\n", + " None\n", " \n", " \n", " 2\n", " What is the largest borough in New York City?\n", " Queens is the largest borough in New York City.\n", " ==== Brooklyn ====\\nBrooklyn (Kings County), o...\n", - " 1.0\n", - " The question is asking for the largest borough...\n", - " 1.0\n", - " The question asks for the largest borough in N...\n", + " None\n", + " None\n", + " None\n", + " None\n", " \n", " \n", " 3\n", " What is the 
average temperature in New York City?\n", - " The average temperature in New York City is 57...\n", + " The average temperature in New York City is 33...\n", " Similarly, readings of 0 °F (−18 °C) are also ...\n", - " 0.5\n", - " The question is asking for the average tempera...\n", - " 1.0\n", - " The question asks for the average temperature ...\n", + " None\n", + " None\n", + " None\n", + " None\n", " \n", " \n", " 4\n", " What is the main airport in New York City?\n", - " The main airport in New York City is John F. K...\n", + " John F. Kennedy International Airport\n", " along the Northeast Corridor, and long-distanc...\n", - " 1.0\n", - " The question is asking for the main airport in...\n", - " 1.0\n", - " The question asks for the main airport in New ...\n", + " None\n", + " None\n", + " None\n", + " None\n", " \n", " \n", " 5\n", " What is the famous landmark in New York City?\n", - " The famous landmark in New York City is the Em...\n", - " A record 66.6 million tourists visited New Yor...\n", - " 1.0\n", - " The question is asking for the famous landmark...\n", - " 1.0\n", - " The question asks for the famous landmark in N...\n", + " The famous landmark in New York City is the St...\n", + " The settlement was named New Amsterdam (Dutch:...\n", + " None\n", + " None\n", + " None\n", + " None\n", " \n", " \n", " 6\n", " What is the official language of New York City?\n", - " The official language of New York City is not ...\n", + " As many as 800 languages are spoken in New Yor...\n", " === Accent and dialect ===\\n\\nThe New York are...\n", - " 0.0\n", - " The question is asking for the official langua...\n", - " 1.0\n", - " The question asks for the official language of...\n", + " None\n", + " None\n", + " None\n", + " None\n", " \n", " \n", " 7\n", " What is the currency used in New York City?\n", - " The currency used in New York City is the Unit...\n", + " The currency used in New York City is the US D...\n", " === Real estate ===\\n\\nReal estate is 
a major ...\n", - " 0.0\n", - " The question is asking for the currency used i...\n", - " 1.0\n", - " The question asks specifically for the currenc...\n", + " None\n", + " None\n", + " None\n", + " None\n", " \n", " \n", " 8\n", " What is the time zone of New York City?\n", " Eastern Standard Time (EST)\n", " According to the New York City Comptroller, wo...\n", - " 0.0\n", - " The question is \"What is the time zone of New ...\n", - " 1.0\n", - " The question asks for the time zone of New Yor...\n", + " None\n", + " None\n", + " None\n", + " None\n", " \n", " \n", " 9\n", " What is the famous sports team in New York City?\n", " The famous sports team in New York City is the...\n", - " ==== Baseball ====\\nNew York has been describe...\n", - " 0.5\n", - " The question is asking for the famous sports t...\n", - " 1.0\n", - " The question asks for the famous sports team i...\n", + " ==== Soccer ====\\nIn soccer, New York City is ...\n", + " None\n", + " None\n", + " None\n", + " None\n", " \n", " \n", "\n", @@ -423,61 +442,49 @@ "0 The population of New York City is 8,804,190 a... \n", "1 New York City has a total area of 468.484 squa... \n", "2 Queens is the largest borough in New York City. \n", - "3 The average temperature in New York City is 57... \n", - "4 The main airport in New York City is John F. K... \n", - "5 The famous landmark in New York City is the Em... \n", - "6 The official language of New York City is not ... \n", - "7 The currency used in New York City is the Unit... \n", + "3 The average temperature in New York City is 33... \n", + "4 John F. Kennedy International Airport \n", + "5 The famous landmark in New York City is the St... \n", + "6 As many as 800 languages are spoken in New Yor... \n", + "7 The currency used in New York City is the US D... \n", "8 Eastern Standard Time (EST) \n", "9 The famous sports team in New York City is the... 
\n", "\n", - " context score_context_relevance \\\n", - "0 New York, often called New York City or NYC, i... 1.0 \n", - "1 New York, often called New York City or NYC, i... 1.0 \n", - "2 ==== Brooklyn ====\\nBrooklyn (Kings County), o... 1.0 \n", - "3 Similarly, readings of 0 °F (−18 °C) are also ... 0.5 \n", - "4 along the Northeast Corridor, and long-distanc... 1.0 \n", - "5 A record 66.6 million tourists visited New Yor... 1.0 \n", - "6 === Accent and dialect ===\\n\\nThe New York are... 0.0 \n", - "7 === Real estate ===\\n\\nReal estate is a major ... 0.0 \n", - "8 According to the New York City Comptroller, wo... 0.0 \n", - "9 ==== Baseball ====\\nNew York has been describe... 0.5 \n", - "\n", - " explanation_context_relevance \\\n", - "0 The question is asking for the population of N... \n", - "1 Step 1: The question asks for the area of New ... \n", - "2 The question is asking for the largest borough... \n", - "3 The question is asking for the average tempera... \n", - "4 The question is asking for the main airport in... \n", - "5 The question is asking for the famous landmark... \n", - "6 The question is asking for the official langua... \n", - "7 The question is asking for the currency used i... \n", - "8 The question is \"What is the time zone of New ... \n", - "9 The question is asking for the famous sports t... \n", + " context score_context_relevance \\\n", + "0 === Population density ===\\n\\nIn 2020, the cit... None \n", + "1 Some of the natural relief in topography has b... None \n", + "2 ==== Brooklyn ====\\nBrooklyn (Kings County), o... None \n", + "3 Similarly, readings of 0 °F (−18 °C) are also ... None \n", + "4 along the Northeast Corridor, and long-distanc... None \n", + "5 The settlement was named New Amsterdam (Dutch:... None \n", + "6 === Accent and dialect ===\\n\\nThe New York are... None \n", + "7 === Real estate ===\\n\\nReal estate is a major ... None \n", + "8 According to the New York City Comptroller, wo... 
None \n", + "9 ==== Soccer ====\\nIn soccer, New York City is ... None \n", "\n", - " score_response_conciseness \\\n", - "0 1.0 \n", - "1 1.0 \n", - "2 1.0 \n", - "3 1.0 \n", - "4 1.0 \n", - "5 1.0 \n", - "6 1.0 \n", - "7 1.0 \n", - "8 1.0 \n", - "9 1.0 \n", + " explanation_context_relevance score_response_conciseness \\\n", + "0 None None \n", + "1 None None \n", + "2 None None \n", + "3 None None \n", + "4 None None \n", + "5 None None \n", + "6 None None \n", + "7 None None \n", + "8 None None \n", + "9 None None \n", "\n", - " explanation_response_conciseness \n", - "0 The question asks for the population of New Yo... \n", - "1 The question asks for the area of New York Cit... \n", - "2 The question asks for the largest borough in N... \n", - "3 The question asks for the average temperature ... \n", - "4 The question asks for the main airport in New ... \n", - "5 The question asks for the famous landmark in N... \n", - "6 The question asks for the official language of... \n", - "7 The question asks specifically for the currenc... \n", - "8 The question asks for the time zone of New Yor... \n", - "9 The question asks for the famous sports team i... 
" + " explanation_response_conciseness \n", + "0 None \n", + "1 None \n", + "2 None \n", + "3 None \n", + "4 None \n", + "5 None \n", + "6 None \n", + "7 None \n", + "8 None \n", + "9 None " ] }, "execution_count": null, @@ -530,7 +537,7 @@ "UPTRAIN_API_KEY = \"up-**********************\" # your UpTrain API key\n", "\n", "# We use `uptrain_access_token` parameter instead of 'openai_api_key' in settings in this case\n", - "settings = Settings(\n", + "settings = UpTrainSettings(\n", " uptrain_access_token=UPTRAIN_API_KEY,\n", ")" ] diff --git a/docs/examples/finetuning/embeddings/BUILD b/docs/examples/finetuning/embeddings/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/docs/examples/finetuning/embeddings/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/docs/examples/llama_hub/llama_pack_ollama.ipynb b/docs/examples/llama_hub/llama_pack_ollama.ipynb index 630e0fa88791b..73bf384ef4094 100644 --- a/docs/examples/llama_hub/llama_pack_ollama.ipynb +++ b/docs/examples/llama_hub/llama_pack_ollama.ipynb @@ -123,8 +123,6 @@ "metadata": {}, "outputs": [], "source": [ - "from ollama_pack.base import OllamaQueryEnginePack\n", - "\n", "# You can use any llama-hub loader to get documents!\n", "ollama_pack = OllamaQueryEnginePack(model=\"llama2\", documents=documents)" ] diff --git a/docs/examples/llm/anthropic.ipynb b/docs/examples/llm/anthropic.ipynb index b4bc70c55886d..7ae2e54511a76 100644 --- a/docs/examples/llm/anthropic.ipynb +++ b/docs/examples/llm/anthropic.ipynb @@ -13,7 +13,13 @@ "id": "72ed6f61-28a7-4f90-8a45-e3f452f95dbd", "metadata": {}, "source": [ - "# Anthropic" + "# Anthropic\n", + "\n", + "Anthropic has recently released its latest models: `Claude 3 Opus`, `Claude 3 Sonnet`, and `Claude 3 Haiku` (which will be available soon). By default, the `claude-2.1 model` is used. This notebook provides guidance on how to utilize these new models.\n", + "\n", + "1. Claude 3 Opus - claude-3-opus-20240229\n", + "2. 
Claude 3 Sonnet\t- claude-3-sonnet-20240229\n", + "3. Claude 3 Haiku - Coming soon" ] }, { @@ -44,6 +50,32 @@ "!pip install llama-index" ] }, + { + "cell_type": "markdown", + "id": "3cbf8694-ad53-459a-84c1-64de2dadeaf5", + "metadata": {}, + "source": [ + "#### Set Tokenizer\n", + "\n", + "First we want to set the tokenizer, which is slightly different than TikToken.\n", + "\n", + "**NOTE**: The Claude 3 tokenizer has not been updated yet; using the existing Anthropic tokenizer leads to context overflow errors for 200k tokens. We've temporarily set the max tokens for Claude 3 to 180k." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "c6ac37cb-b588-44c7-8fd9-8eab454900a5", + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.llms.anthropic import Anthropic\n", + "from llama_index.core import Settings\n", + "\n", + "tokenizer = Anthropic().tokenizer\n", + "Settings.tokenizer = tokenizer" + ] + }, { "cell_type": "markdown", "id": "b81a3ef6-2ee5-460d-9aa4-f73708774014", @@ -52,6 +84,18 @@ "#### Call `complete` with a prompt" ] }, + { + "cell_type": "code", + "execution_count": null, + "id": "85fbba23", + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + "\n", + "os.environ[\"ANTHROPIC_API_KEY\"] = \"YOUR ANTHROPIC API KEY\"" + ] + }, { "cell_type": "code", "execution_count": null, @@ -64,7 +108,7 @@ "# To customize your API key, do this\n", "# otherwise it will lookup ANTHROPIC_API_KEY from your env variable\n", "# llm = Anthropic(api_key=\"\")\n", - "llm = Anthropic()\n", + "llm = Anthropic(model=\"claude-3-opus-20240229\")\n", "\n", "resp = llm.complete(\"Paul Graham is \")" ] @@ -79,21 +123,21 @@ "name": "stdout", "output_type": "stream", "text": [ - " Here are some key facts about Paul Graham:\n", + "Paul Graham is a well-known entrepreneur, programmer, venture capitalist, and essayist. He is best known for co-founding Viaweb, one of the first web application companies, which was later sold to Yahoo! 
in 1998 and became Yahoo! Store. Graham is also the co-founder of Y Combinator, a highly successful startup accelerator that has helped launch numerous successful companies, such as Dropbox, Airbnb, and Reddit.\n", "\n", - "- Paul Graham is an American computer scientist, venture capitalist, and essayist. He is known for co-founding Viaweb, one of the first web-based application companies, which was acquired by Yahoo in 1998.\n", + "Some key points about Paul Graham:\n", "\n", - "- In 1995, Graham co-founded Viaweb with Robert Morris, Trevor Blackwell, and Jessica Livingston. The company helped popularize the business model of applying software as a service.\n", + "1. Programming: Graham is a skilled programmer and has written extensively on the subject, including his book \"Hackers & Painters: Big Ideas from the Computer Age.\"\n", "\n", - "- After selling Viaweb to Yahoo, Graham became a venture capitalist. He co-founded Y Combinator in 2005 with Jessica Livingston, Trevor Blackwell, and Robert Morris. Y Combinator is an influential startup accelerator that provides seed funding and advice to startups.\n", + "2. Essays: He is a prolific essayist, writing on various topics related to technology, startups, and entrepreneurship. His essays have been influential in the tech startup community.\n", "\n", - "- Graham has written several influential essays on startups, technology, and programming. Some of his most well-known essays include \"How to Start a Startup\", \"Do Things that Don't Scale\", and \"Beating the Averages\" about Lisp programming. \n", + "3. Lisp: Graham is an advocate for the Lisp programming language and has written several essays on its advantages.\n", "\n", - "- He pioneered the concept of using online essays to attract startup founders to apply to Y Combinator's program. His essays are often required reading in Silicon Valley.\n", + "4. 
Y Combinator: As a co-founder of Y Combinator, Graham has played a significant role in shaping the startup ecosystem and has mentored and invested in numerous successful companies.\n", "\n", - "- Graham has a Bachelor's degree in philosophy from Cornell University and a PhD in computer science from Harvard University. His doctoral thesis focused on Lisp compilers.\n", + "5. Wealth and inequality: In recent years, Graham has written about income inequality and the concentration of wealth, sparking discussions and debates within the tech community.\n", "\n", - "- He is considered an influential figure in the tech and startup worlds, known for his insights on startups, programming languages, and technology trends. His writings have shaped the strategies of many founders building startups.\n" + "Overall, Paul Graham is a significant figure in the technology and startup world, known for his contributions as a programmer, investor, and thought leader.\n" ] } ], @@ -125,7 +169,7 @@ " ),\n", " ChatMessage(role=\"user\", content=\"Tell me a story\"),\n", "]\n", - "resp = Anthropic().chat(messages)" + "resp = Anthropic(model=\"claude-3-opus-20240229\").chat(messages)" ] }, { @@ -138,19 +182,19 @@ "name": "stdout", "output_type": "stream", "text": [ - "assistant: Here is a fun pirate story for you:\n", + "assistant: *clears throat and speaks in a pirate accent* Aye, gather 'round me hearties and I'll spin ye a yarn of adventure on the high seas!\n", "\n", - "Yarrr matey! Me name be Captain Redbeard, the most fearsome pirate to sail the seven seas. I be the captain of the good ship Salty Dog, and we be lookin' fer treasure! \n", + "T'was a dark and stormy night when the Black Pearl set sail from Tortuga. The salty sea spray stung me eyes as I stood at the helm, guidin' me beloved ship through the roilin' waves. Me loyal crew scurried about, securin' the riggin' and battening down the hatches. \n", "\n", - "I lost me leg in a battle with the evil Captain Bluebeard years ago. 
That scallywag got the better of me that time, but I'll have me revenge! Now I got me a peg leg that I can use to stomp the deck or kick me enemies right in the rear! \n", + "Suddenly, the lookout cried \"Ship ahoy!\" and pointed off the starboard bow. I raised me spyglass and spied a Spanish galleon, her decks heavily laden with treasure. The crew gave a hearty cheer - we'd be feastin' and drinkin' well tonight!\n", "\n", - "Me first mate Scurvy Sam be my best friend. We go way back to when we were just lads dreamin' of a pirate's life. He may only have one good eye after losin' the other one to a seagull, but he can still spot treasure from a league away! \n", + "I ordered the crew to ready the cannons as we drew alongside the galleon. \"Fire all!\" I bellowed and the Pearl shook as the guns unleashed a barrage. The Spaniards returned fire but they were no match for me skilled gunners.\n", "\n", - "Today we be sailin' for the fabled Treasure Island, in search of the loot buried long ago by the notorious Captain Flint. Flint was the most ruthless pirate ever to live, but he buried his treasure and no one ever found it. But I have a map, given to me by a dying sailor. I just know it'll lead us right to Flint's trove of rubies, diamonds and mountains of gold! \n", + "We boarded the galleon, swords flashin' and pistols blazin'. The fight was fast and bloody but in the end, the Pearl was victorious! We claimed the treasure as our own - mountains of gold and jewels glintin' in the moonlight.\n", "\n", - "It won't be easy. We may have to fight off Flint's ghost, or deal with tribes of cannibals, or outwit double-crossing thieves. But that's all part of a pirate's life! And when we finally get our hands on that treasure, we'll live like kings. We'll party all night and sleep all day in our fancy pirate cove. \n", + "As we sailed away, I couldn't help but grin. T'was a fine night of piratin' and I knew many more adventures lay ahead for me and me crew. 
No matter the danger, the Black Pearl would always prevail! Yo ho ho!\n", "\n", - "So hoist the mainsail me hearties, and let's set sail for adventure! Keep a weather eye on the horizon, mateys. Treasure awaits!\n" + "*laughs heartily* And that, me friends, is a taste of the pirate's life. May yer sails always be full and yer horizons bright. Fare thee well!\n" ] } ], @@ -183,7 +227,7 @@ "source": [ "from llama_index.llms.anthropic import Anthropic\n", "\n", - "llm = Anthropic()\n", + "llm = Anthropic(model=\"claude-3-opus-20240229\", max_tokens=100)\n", "resp = llm.stream_complete(\"Paul Graham is \")" ] }, @@ -197,21 +241,9 @@ "name": "stdout", "output_type": "stream", "text": [ - " Here are some key points about Paul Graham:\n", - "\n", - "- Paul Graham is an American computer scientist, venture capitalist, and essayist. He is known for co-founding Viaweb, one of the first web-based applications, which was acquired by Yahoo in 1998.\n", - "\n", - "- In 2005, Graham co-founded Y Combinator, a startup accelerator that provides seed funding and advice to startups. Y Combinator has backed over 2000 companies including Dropbox, Airbnb, Stripe, and Reddit. \n", - "\n", - "- Graham has written extensively about startups, programming, and technology. Some of his most popular essays include \"How to Start a Startup\", \"The Age of the Essay\", and \"Beating the Averages\" about his experiences with Viaweb.\n", + "Paul Graham is a well-known entrepreneur, programmer, venture capitalist, and essayist. He is best known for co-founding Viaweb, one of the first web application companies, which was later sold to Yahoo! in 1998 and became Yahoo! Store. \n", "\n", - "- As an essayist, Graham has a very analytical and insightful writing style. He is skilled at breaking down complex concepts and explaining ideas clearly. 
His essays cover a wide range of topics including startups, programming, economics, and philosophy.\n", - "\n", - "- In addition to his work with startups, Graham previously worked as a programmer at Yahoo and was also a professor of computer science at Harvard University. He studied mathematics at Cornell University and obtained a PhD in Computer Science from Harvard.\n", - "\n", - "- Graham has advocated for funding and supporting startup founders who may lack traditional credentials like college degrees. He has argued that intelligence, determination, and flexibility are more important than formal education for succeeding in startups.\n", - "\n", - "In summary, Paul Graham is a prominent figure in the tech industry known for his work with startups, programming, and influential writing and perspectives on technology. His ideas have had a major impact on the startup ecosystem." + "After the sale of Viaweb, Graham and his wife Jessica Livingston co-founded Y Combinator in 2005, a highly successful startup accelerator that has helped launch" ] } ], @@ -229,7 +261,7 @@ "source": [ "from llama_index.llms.anthropic import Anthropic\n", "\n", - "llm = Anthropic()\n", + "llm = Anthropic(model=\"claude-3-opus-20240229\")\n", "messages = [\n", " ChatMessage(\n", " role=\"system\", content=\"You are a pirate with a colorful personality\"\n", @@ -249,15 +281,23 @@ "name": "stdout", "output_type": "stream", "text": [ - " Here is a fun pirate story for you:\n", + "*clears throat and speaks in a gruff, piratey voice* \n", + "\n", + "Aye, gather 'round me hearties and I'll spin ye a yarn of adventure on the high seas! \n", + "\n", + "'Twas a dark and stormy night, the kind where the wind howls like a banshee and the waves crash over the deck. Me and me crew were sailin' the Caribbean, searchin' for treasure and glory.\n", "\n", - "Yarrr matey! Me name be Captain Redbeard, the most fearsome pirate to sail the seven seas. 
I be the captain of the good ship Salty Dog, and we be lookin' fer treasure! \n", + "Suddenly, the lookout cried \"Ship ahoy!\" and sure enough, a Spanish galleon was bearin' down on us, her decks bristlin' with cannons. The scurvy dogs wanted our gold, but I'd sooner walk the plank than surrender!\n", "\n", - "I lost me leg in a battle with the evil Captain Bluebeard years ago. That scallywag got the better of me that time, but I'll have me revenge! Now I got me a peg leg that I can use to kick me enemies right in the behind! Har har!\n", + "\"All hands to battle stations!\" I bellowed. \"Ready the cannons and prepare to board!\" \n", "\n", - "Just last week me crew and I found a map leading to the lost treasure of the island of Rundoon. We set sail right away, braving storms and sea creatures the size of ships! When we got to the island, it were guarded by angry natives with spears and poison darts. Me crew fought 'em off while I snuck into the temple and grabbed the treasure chest.\n", + "A mighty battle erupted, cannons boomin' and swords clashin'. We swung over on ropes and fought the Spaniards hand-to-hand on the pitchin' and rollin' deck. Me cutlass was a blur as I dueled their captain, a big brute with a wicked scar.\n", "\n", - "Now we be rich with dubloons and jewels! I plan to stash me loot on a remote island, then find a tavern and drink grog until I can't stand up straight. Being a pirate captain be a tough life, but someone's got to sail the high seas in search of adventure! Maybe one day I'll get enough treasure to retire and open up a little beach shack...but probably not, cause I love me pirate life too much! Har har har!" + "Finally, I drove me blade into that bilge rat's black heart and he fell dead at me feet. His crew surrendered and we took their ship as a prize. In the hold, we found chests overflowing with gold doubloons and jewels - a king's ransom! 
\n", + "\n", + "We sailed off into the sunset, our pirate flag snappin' in the breeze, flush with coin and the thrill of victory. And that, me buckos, is a taste of the pirate life! Now who wants some grog?\n", + "\n", + "*laughs heartily*" ] } ], @@ -283,7 +323,7 @@ "source": [ "from llama_index.llms.anthropic import Anthropic\n", "\n", - "llm = Anthropic(model=\"claude-instant-1\")" + "llm = Anthropic(model=\"claude-3-sonnet-20240229\")" ] }, { @@ -306,23 +346,21 @@ "name": "stdout", "output_type": "stream", "text": [ - " Here are a few key facts about Paul Graham:\n", - "\n", - "- Paul Graham is an American computer scientist, venture capitalist, and essayist. He is known for co-founding Viaweb, one of the first web-based application companies, which was acquired by Yahoo in 1998.\n", + "Paul Graham is a computer scientist, entrepreneur, venture capitalist, and author. He is best known for the following:\n", "\n", - "- In 2005, Graham co-founded Y Combinator, a startup accelerator that provides seed funding and advice to startups. Y Combinator has backed over 3,000 startups including Dropbox, Airbnb, Stripe, and Reddit. \n", + "1. Co-founding Y Combinator: Y Combinator is a prominent startup accelerator based in Silicon Valley. It has funded and helped launch thousands of startups, including Airbnb, Dropbox, Stripe, and Reddit.\n", "\n", - "- Graham has written several influential essays on startups, programming languages, and other technology topics. Some of his most well-known essays include \"Beating the Averages\", \"The Refragmentation\", and \"How to Start a Startup\".\n", + "2. Writing essays on startups and technology: Graham has written numerous influential essays on topics related to startups, programming, and entrepreneurship. His essays are widely read and have helped shape the thinking of many entrepreneurs and technologists.\n", "\n", - "- He pioneered and popularized the idea of using Lisp as a web programming language via his company Viaweb. 
This helped inspire interest in functional programming languages for web development.\n", + "3. Developing the programming language Arc: In the early 2000s, Graham developed a new programming language called Arc, which was designed to be a more powerful and expressive dialect of Lisp.\n", "\n", - "- Graham has a Bachelor's degree in philosophy from Cornell University and a PhD in computer science from Harvard University. \n", + "4. Advocating for the use of Lisp and functional programming: Graham is a strong proponent of the Lisp programming language and functional programming paradigms. He has written extensively about the benefits of these approaches and has influenced many programmers to explore them.\n", "\n", - "- He was inducted into the American Academy of Arts and Sciences in 2020 for his contributions to computer science and entrepreneurship.\n", + "5. Authoring books: Graham has authored several books, including \"Hackers & Painters: Big Ideas from the Computer Age\" (2004), \"On Lisp\" (1993), and \"ANSI Common Lisp\" (1995).\n", "\n", - "- In addition to his work in technology and startups, Graham is also known for his essays on topics like education, productivity, and economics. Many consider him an influential writer and thinker in the tech industry.\n", + "6. Investing in startups: Through Y Combinator and his own investments, Graham has invested in and advised numerous successful startups, helping to shape the technology industry.\n", "\n", - "In summary, Paul Graham is a prominent computer scientist, entrepreneur, investor and writer who has made significant contributions to the web, startups and programming languages. He continues to share his insights through his writings and his work with Y Combinator." + "Overall, Paul Graham is widely respected in the technology and startup communities for his contributions as a programmer, writer, investor, and advocate for innovative ideas and approaches." 
] } ], @@ -348,7 +386,7 @@ "source": [ "from llama_index.llms.anthropic import Anthropic\n", "\n", - "llm = Anthropic()\n", + "llm = Anthropic(\"claude-3-sonnet-20240229\")\n", "resp = await llm.acomplete(\"Paul Graham is \")" ] }, @@ -362,21 +400,19 @@ "name": "stdout", "output_type": "stream", "text": [ - " Here are some key facts about Paul Graham:\n", + "Paul Graham is a computer scientist, entrepreneur, venture capitalist, and author. He is best known for the following:\n", "\n", - "- Paul Graham is an American computer scientist, venture capitalist, and essayist. He is known for co-founding Viaweb, one of the first web-based application companies, which was acquired by Yahoo in 1998.\n", + "1. Co-founding Y Combinator: Y Combinator is a prominent startup accelerator based in Silicon Valley. It has funded and helped launch many successful startups, including Airbnb, Dropbox, Stripe, and Reddit.\n", "\n", - "- In 1995, Graham co-founded Viaweb with Robert Morris, Trevor Blackwell, and Jessica Livingston. The company helped popularize the business model of applying software as a service.\n", + "2. Writing essays on startups and technology: Graham has written numerous influential essays on topics related to startups, programming, and entrepreneurship. His essays are widely read and have helped shape the thinking of many entrepreneurs and technologists.\n", "\n", - "- After selling Viaweb to Yahoo, Graham became a venture capitalist. He co-founded Y Combinator in 2005 with Jessica Livingston, Trevor Blackwell, and Robert Morris. Y Combinator is an influential startup accelerator that provides seed funding and advice to startups.\n", + "3. Developing the programming language Arc: Graham designed and developed the programming language Arc, which was intended to be a more powerful and expressive dialect of Lisp.\n", "\n", - "- Graham has written several influential essays on startups, technology, and programming. 
Some of his most well-known essays include \"How to Start a Startup\", \"Do Things that Don't Scale\", and \"Beating the Averages\" about Lisp programming. \n", + "4. Authoring books: He has written several books, including \"Hackers & Painters: Big Ideas from the Computer Age,\" \"ANSI Common Lisp,\" and \"On Lisp.\"\n", "\n", - "- He pioneered the concept of using online essays to attract startup founders to apply to Y Combinator's program. His essays are often required reading in Silicon Valley.\n", + "5. Founding Viaweb: In the 1990s, Graham co-founded Viaweb, one of the earliest web-based application software companies. Viaweb was later acquired by Yahoo! in 1998.\n", "\n", - "- Graham has a Bachelor's degree in philosophy from Cornell University and a PhD in computer science from Harvard University. His doctoral thesis focused on Lisp compilers.\n", - "\n", - "- He is considered an influential figure in the tech and startup worlds, known for his insights on startups, programming languages, and technology trends. 
His writings have shaped the strategies of many founders building startups.\n" + "Graham is widely respected in the technology and startup communities for his insights, writings, and contributions to the field of computer science and entrepreneurship.\n" ] } ], @@ -401,6 +437,11 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3" + }, + "vscode": { + "interpreter": { + "hash": "b0fa6594d8f4cbf19f97940f81e996739fb7646882a419484c72d19e05852a7e" + } } }, "nbformat": 4, diff --git a/docs/examples/multi_modal/anthropic_multi_modal.ipynb b/docs/examples/multi_modal/anthropic_multi_modal.ipynb new file mode 100644 index 0000000000000..21d78461bca1e --- /dev/null +++ b/docs/examples/multi_modal/anthropic_multi_modal.ipynb @@ -0,0 +1,621 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "368686b4-f487-4dd4-aeff-37823976529d", + "metadata": {}, + "source": [ + "\"Open\n", + "\n", + "# Multi-Modal LLM using Anthropic model for image reasoning\n", + "\n", + "Anthropic has recently released its latest Multi modal models: Claude 3 Opus, Claude 3 Sonnet.\n", + "\n", + "1. Claude 3 Opus - claude-3-opus-20240229\n", + "\n", + "2. 
Claude 3 Sonnet - claude-3-sonnet-20240229\n", + "\n", + "In this notebook, we show how to use Anthropic MultiModal LLM class/abstraction for image understanding/reasoning.\n", + "\n", + "We also show several functions we are now supporting for Anthropic MultiModal LLM:\n", + "* `complete` (both sync and async): for a single prompt and list of images\n", + "* `chat` (both sync and async): for multiple chat messages\n", + "* `stream complete` (both sync and async): for streaming output of complete\n", + "* `stream chat` (both sync and async): for streaming output of chat" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "396d319e", + "metadata": {}, + "outputs": [], + "source": [ + "!pip install llama-index-multi-modal-llms-anthropic\n", + "!pip install llama-index-vector-stores-qdrant\n", + "!pip install matplotlib" + ] + }, + { + "cell_type": "markdown", + "id": "4479bf64", + "metadata": {}, + "source": [ + "## Use Anthropic to understand Images from Local directory" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "5455d8c6", + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + "\n", + "os.environ[\"ANTHROPIC_API_KEY\"] = \"\" # Your ANTHROPIC API key here" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "4990a807", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "from PIL import Image\n", + "import matplotlib.pyplot as plt\n", + "\n", + "img = Image.open(\"../data/images/prometheus_paper_card.png\")\n", + "plt.imshow(img)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "e9fab9ec", + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.core import SimpleDirectoryReader\n", + "from llama_index.multi_modal_llms.anthropic import AnthropicMultiModal\n", + "\n", + "# put your local directory here\n", + "image_documents = SimpleDirectoryReader(\n", + " input_files=[\"../data/images/prometheus_paper_card.png\"]\n", + ").load_data()\n", + "\n", + "# Initiated Anthropic MultiModal class\n", + "anthropic_mm_llm = AnthropicMultiModal(max_tokens=300)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "7f783f64", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The image is a diagram titled \"Prometheus: Inducing Fine-Grained Evaluation Capability In Language Models\". It outlines the key components and workflow of the Prometheus system.\n", + "\n", + "The main sections are:\n", + "1. Contributions: Describes Prometheus as an open-source LLM evaluator using custom rubrics and a feedback collection dataset.\n", + "2. Results: States that Prometheus matches or outperforms GPT-4 on 3 evaluation datasets and can function as a reward model. It also enabled reference answers for LM evaluations.\n", + "3. Insights: Notes that strong LLMs show high agreement with human evaluations but their close-to-source nature and uncontrolled versioning make them a less than ideal choice for LLM evaluation.\n", + "4.
Technical Bits: Diagrams the Feedback Collection pipeline which uses GPT-4 to generate score rubrics and instructions, then collects human feedback to train the final Prometheus model.\n", + "\n", + "The bottom includes logos, model details, and a small fire graphic. Overall, it provides a high-level technical overview of the Prometheus LLM evaluation system.\n" + ] + } + ], + "source": [ + "response = anthropic_mm_llm.complete(\n", + " prompt=\"Describe the images as an alternative text\",\n", + " image_documents=image_documents,\n", + ")\n", + "\n", + "print(response)" + ] + }, + { + "cell_type": "markdown", + "id": "f43c0b06", + "metadata": {}, + "source": [ + "## Use `AnthropicMultiModal` to reason images from URLs" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "40d526d2", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "from PIL import Image\n", + "import requests\n", + "from io import BytesIO\n", + "import matplotlib.pyplot as plt\n", + "from llama_index.core.multi_modal_llms.generic_utils import load_image_urls\n", + "\n", + "image_urls = [\n", + " \"https://venturebeat.com/wp-content/uploads/2024/03/Screenshot-2024-03-04-at-12.49.41%E2%80%AFAM.png\",\n", + " # Add yours here!\n", + "]\n", + "\n", + "img_response = requests.get(image_urls[0])\n", + "img = Image.open(BytesIO(img_response.content))\n", + "plt.imshow(img)\n", + "\n", + "image_url_documents = load_image_urls(image_urls)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "22fcd5fe", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The image shows a table comparing the benchmark scores of various Claude 3 AI models (Opus, Sonnet, Haiku) against GPT-4, GPT-3.5, and two versions of Gemini (1.0 Ultra and 1.0 Pro) across different academic subjects and tests.\n", + "\n", + "The subjects covered include undergraduate and graduate level knowledge, grade school math, math problem-solving, multilingual math, code, reasoning over text, mixed evaluations, knowledge Q&A, and common knowledge.\n", + "\n", + "The scores are presented as percentages, except for the \"Reasoning over text\" row which shows raw scores out of a certain number of shots. 
The Claude 3 models generally perform comparably to GPT-3.5 and GPT-4 on most benchmarks, and outperform the Gemini models on the tasks where scores are available for comparison.\n" + ] + } + ], + "source": [ + "response = anthropic_mm_llm.complete(\n", + " prompt=\"Describe the images as an alternative text\",\n", + " image_documents=image_url_documents,\n", + ")\n", + "\n", + "print(response)" + ] + }, + { + "cell_type": "markdown", + "id": "0ff6a440-ed96-4ae7-88e4-26929822874c", + "metadata": {}, + "source": [ + "## Structured Output Parsing from an Image\n", + "\n", + "In this section, we use our multi-modal Pydantic program to generate structured output from an image." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "84c712df-9457-4d25-8b6c-525aaf00f45a", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/Users/jerryliu/Programming/gpt_index/.venv/lib/python3.10/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n", + " from .autonotebook import tqdm as notebook_tqdm\n" + ] + } + ], + "source": [ + "from llama_index.core import SimpleDirectoryReader\n", + "\n", + "# put your local directory here\n", + "image_documents = SimpleDirectoryReader(\n", + " input_files=[\"../data/images/ark_email_sample.PNG\"]\n", + ").load_data()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ddba6422-4fb0-4a0a-b89e-03eeb0ab840a", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "from PIL import Image\n", + "import matplotlib.pyplot as plt\n", + "\n", + "img = Image.open(\"../data/images/ark_email_sample.PNG\")\n", + "plt.imshow(img)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a4604a04-10b8-4284-be99-fd219fb43492", + "metadata": {}, + "outputs": [], + "source": [ + "from pydantic import BaseModel\n", + "from typing import List\n", + "\n", + "\n", + "class TickerInfo(BaseModel):\n", + " \"\"\"List of ticker info.\"\"\"\n", + "\n", + " direction: str\n", + " ticker: str\n", + " company: str\n", + " shares_traded: int\n", + " percent_of_total_etf: float\n", + "\n", + "\n", + "class TickerList(BaseModel):\n", + " \"\"\"List of stock tickers.\"\"\"\n", + "\n", + " fund: str\n", + " tickers: List[TickerInfo]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "b6f87b00-b8f1-4455-97b3-6384429364e2", + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.multi_modal_llms.anthropic import AnthropicMultiModal\n", + "from llama_index.core.program import MultiModalLLMCompletionProgram\n", + "from llama_index.core.output_parsers import PydanticOutputParser\n", + "\n", + "prompt_template_str = \"\"\"\\\n", + "Can you get the stock information in the image \\\n", + "and return the answer? Pick just one fund. \n", + "\n", + "Make sure the answer is a JSON format corresponding to a Pydantic schema. 
The Pydantic schema is given below.\n", + "\n", + "\"\"\"\n", + "\n", + "# Initiated Anthropic MultiModal class\n", + "anthropic_mm_llm = AnthropicMultiModal(max_tokens=300)\n", + "\n", + "\n", + "llm_program = MultiModalLLMCompletionProgram.from_defaults(\n", + " output_cls=TickerList,\n", + " image_documents=image_documents,\n", + " prompt_template_str=prompt_template_str,\n", + " multi_modal_llm=anthropic_mm_llm,\n", + " verbose=True,\n", + ")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "1b2985e5-c4b8-4860-9140-bba9813e345b", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\u001b[1;3;38;2;90;149;237m> Raw output: {\n", + " \"fund\": \"ARKK\",\n", + " \"tickers\": [\n", + " {\n", + " \"direction\": \"Buy\",\n", + " \"ticker\": \"TSLA\",\n", + " \"company\": \"TESLA INC\",\n", + " \"shares_traded\": 93664,\n", + " \"percent_of_total_etf\": 0.2453\n", + " },\n", + " {\n", + " \"direction\": \"Buy\", \n", + " \"ticker\": \"TXG\",\n", + " \"company\": \"10X GENOMICS INC\",\n", + " \"shares_traded\": 159506,\n", + " \"percent_of_total_etf\": 0.0907\n", + " },\n", + " {\n", + " \"direction\": \"Buy\",\n", + " \"ticker\": \"CRSP\",\n", + " \"company\": \"CRISPR THERAPEUTICS AG\",\n", + " \"shares_traded\": 86268,\n", + " \"percent_of_total_etf\": 0.0669\n", + " },\n", + " {\n", + " \"direction\": \"Buy\",\n", + " \"ticker\": \"RXRX\",\n", + " \"company\": \"RECURSION PHARMACEUTICALS\",\n", + " \"shares_traded\": 289619,\n", + " \"percent_of_total_etf\": 0.0391\n", + " }\n", + " ]\n", + "}\n", + "\u001b[0m" + ] + } + ], + "source": [ + "response = llm_program()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0304aeac-89b4-4aea-8209-7c7fbf3af5d7", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "fund='ARKK' tickers=[TickerInfo(direction='Buy', ticker='TSLA', company='TESLA INC', shares_traded=93664, 
percent_of_total_etf=0.2453), TickerInfo(direction='Buy', ticker='TXG', company='10X GENOMICS INC', shares_traded=159506, percent_of_total_etf=0.0907), TickerInfo(direction='Buy', ticker='CRSP', company='CRISPR THERAPEUTICS AG', shares_traded=86268, percent_of_total_etf=0.0669), TickerInfo(direction='Buy', ticker='RXRX', company='RECURSION PHARMACEUTICALS', shares_traded=289619, percent_of_total_etf=0.0391)]\n" + ] + } + ], + "source": [ + "print(str(response))" + ] + }, + { + "cell_type": "markdown", + "id": "19d296f0-81f1-4f9a-80b0-05ccb7482569", + "metadata": {}, + "source": [ + "## Index into a Vector Store\n", + "\n", + "In this section we show you how to use Claude 3 to build a RAG pipeline over image data. We first use Claude to extract text from a set of images. We then index the text with an embedding model. Finally, we build a query pipeline over the data." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "150d3627-43ec-40cc-b901-09d559840a25", + "metadata": {}, + "outputs": [], + "source": [ + "# !wget \"https://www.dropbox.com/scl/fi/pvxgohp5ts5mcj2js8drk/mixed_wiki_images_small.zip?rlkey=3zf0z0n2etsjp19tofasaf4vy&dl=1\" -O mixed_wiki_images_small.zip\n", + "# !wget \"https://www.dropbox.com/scl/fi/vg2h92owduqmarwj7fxnc/mixed_wiki_images_small.zip?rlkey=fejq570ehhil3qgv3gibaliqu&dl=1\" -O mixed_wiki_images_small.zip\n", + "!wget \"https://www.dropbox.com/scl/fi/c1ec6osn0r2ggnitijqhl/mixed_wiki_images_small.zip?rlkey=swwxc7h4qtwlnhmby5fsnderd&dl=1\" -O mixed_wiki_images_small.zip\n", + "!unzip mixed_wiki_images_small.zip" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "acb73dab-ef81-4e09-8b74-dc2dd22526ee", + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.multi_modal_llms.anthropic import AnthropicMultiModal\n", + "\n", + "anthropic_mm_llm = AnthropicMultiModal(max_tokens=300)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "b84bdfe2-0907-4c61-bad3-19d924787e19", + 
"metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "mixed_wiki_images_small/8.png\n", + "mixed_wiki_images_small/14.png\n", + "mixed_wiki_images_small/28.png\n", + "mixed_wiki_images_small/15.png\n", + "mixed_wiki_images_small/11.png\n", + "mixed_wiki_images_small/10.png\n", + "mixed_wiki_images_small/20.png\n", + "mixed_wiki_images_small/23.png\n", + "mixed_wiki_images_small/26.png\n", + "mixed_wiki_images_small/19.png\n", + "mixed_wiki_images_small/4.png\n", + "mixed_wiki_images_small/5.png\n", + "mixed_wiki_images_small/7.png\n", + "mixed_wiki_images_small/6.png\n", + "mixed_wiki_images_small/2.png\n" + ] + } + ], + "source": [ + "from llama_index.core.schema import TextNode\n", + "from pathlib import Path\n", + "from llama_index.core import SimpleDirectoryReader\n", + "\n", + "nodes = []\n", + "for img_file in Path(\"mixed_wiki_images_small\").glob(\"*.png\"):\n", + " print(img_file)\n", + " # load the current image file as an image document\n", + " image_documents = SimpleDirectoryReader(input_files=[img_file]).load_data()\n", + " response = anthropic_mm_llm.complete(\n", + " prompt=\"Describe the images as an alternative text\",\n", + " image_documents=image_documents,\n", + " )\n", + " metadata = {\"img_file\": img_file}\n", + " nodes.append(TextNode(text=str(response), metadata=metadata))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "818b7a22-62e2-4e17-94fb-091229493374", + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.core import VectorStoreIndex, StorageContext\n", + "from llama_index.embeddings.openai import OpenAIEmbedding\n", + "from llama_index.llms.anthropic import Anthropic\n", + "from llama_index.vector_stores.qdrant import QdrantVectorStore\n", + "from llama_index.core import Settings\n", + "from llama_index.core import StorageContext\n", + "import qdrant_client\n", + "\n", + "\n", + "# Create a local Qdrant vector store\n", + "client = 
qdrant_client.QdrantClient(path=\"qdrant_mixed_img\")\n", + "\n", + "vector_store = QdrantVectorStore(client=client, collection_name=\"collection\")\n", + "\n", + "# Use OpenAI as the embedding model\n", + "embed_model = OpenAIEmbedding()\n", + "anthropic_mm_llm = AnthropicMultiModal(max_tokens=300)\n", + "\n", + "storage_context = StorageContext.from_defaults(vector_store=vector_store)\n", + "\n", + "index = VectorStoreIndex(\n", + " nodes=nodes,\n", + " storage_context=storage_context,\n", + ")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a89b3256-f361-4ef9-8ed1-55a26b9430ce", + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.llms.anthropic import Anthropic\n", + "\n", + "query_engine = index.as_query_engine(llm=Anthropic())\n", + "response = query_engine.query(\"Tell me more about the porsche\")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f182c1e6-f66b-4e6b-9b8f-98925acea4ee", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Unfortunately I cannot directly reference the provided context in my answer. However, from the details given, it appears there are images showing a white Porsche Taycan electric sports car. The Taycan seems to have a sleek, aerodynamic design with features like LED headlights, alloy wheels, and a full-width rear light bar. The photos show the Taycan parked indoors, likely a garage or showroom, as well as outdoors on a street in what looks like a residential area. Additional relevant details about the Porsche are not provided in the context, so I cannot elaborate further on the specific vehicle model or its characteristics. 
Please let me know if you have any other questions!\n" + ] + } + ], + "source": [ + "print(str(response))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f3764d8d-62ae-4195-af74-4103af3972f5", + "metadata": {}, + "outputs": [ + { + "data": { + "text/markdown": [ + "**Node ID:** e04f2364-8fa2-413c-8d76-4981990e49b9
**Similarity:** 0.83693930783145
**Text:** img_file: mixed_wiki_images_small/11.png\n", + "\n", + "The image shows a white Porsche Taycan Turbo electric s...
" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/markdown": [ + "**Node ID:** e2de0d05-2e97-43bb-80dd-f28c4e9bcb28
**Similarity:** 0.8357091967156951
**Text:** img_file: mixed_wiki_images_small/2.png\n", + "\n", + "The image shows a white Porsche Taycan electric sports c...
" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "from llama_index.core.response.notebook_utils import display_source_node\n", + "\n", + "for n in response.source_nodes:\n", + " display_source_node(n, metadata_mode=\"all\")" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "venv", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/docs/examples/node_postprocessor/JinaRerank.ipynb b/docs/examples/node_postprocessor/JinaRerank.ipynb index 5925382fc8e08..ce07b72652609 100644 --- a/docs/examples/node_postprocessor/JinaRerank.ipynb +++ b/docs/examples/node_postprocessor/JinaRerank.ipynb @@ -5,7 +5,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "\"Open" + "\"Open" ] }, { diff --git a/docs/examples/output_parsing/BUILD b/docs/examples/output_parsing/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/docs/examples/output_parsing/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/docs/examples/query_engine/recursive_retriever_agents.ipynb b/docs/examples/query_engine/recursive_retriever_agents.ipynb index 68a6c9092f9ba..fe450a923a3b7 100644 --- a/docs/examples/query_engine/recursive_retriever_agents.ipynb +++ b/docs/examples/query_engine/recursive_retriever_agents.ipynb @@ -329,7 +329,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "Boston is home to several professional sports teams across different leagues. These teams include the Boston Red Sox in Major League Baseball, the New England Patriots in the National Football League, the Boston Celtics in the NBA, the Boston Bruins in the NHL, and the New England Revolution in Major League Soccer. 
These teams have a rich history and are widely supported by fans in Boston and across the country.\n" + "Boston is home to several professional sports teams across different leagues, including a successful baseball team in Major League Baseball, a highly successful American football team in the National Football League, one of the most successful basketball teams in the NBA, a professional ice hockey team in the National Hockey League, and a professional soccer team in Major League Soccer. These teams have a rich history, passionate fan bases, and have achieved great success both locally and nationally.\n" ] } ], @@ -368,7 +368,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "Houston is home to several professional sports teams across different leagues. The city has a professional football team called the Houston Texans, a professional basketball team called the Houston Rockets, a professional baseball team called the Houston Astros, a professional soccer team called the Houston Dynamo, and a professional women's soccer team called the Houston Dash. These teams compete in the National Football League (NFL), National Basketball Association (NBA), Major League Baseball (MLB), Major League Soccer (MLS), and National Women's Soccer League (NWSL) respectively. Houston also has minor league baseball, hockey, and other sports teams, making it a city with a rich sports culture.\n" + "Houston is home to several professional sports teams across different leagues, including the Houston Texans in the NFL, the Houston Rockets in the NBA, the Houston Astros in MLB, the Houston Dynamo in MLS, and the Houston Dash in NWSL. These teams compete in football, basketball, baseball, soccer, and women's soccer respectively, and have achieved various levels of success in their respective leagues. 
Additionally, the city also has minor league baseball, hockey, and other sports teams that cater to sports enthusiasts.\n" ] } ], @@ -393,7 +393,7 @@ "Calling function: summary_tool with args: {\n", " \"input\": \"positive aspects of Chicago\"\n", "}\n", - "Got output: Chicago is a vibrant city with a diverse economy and a wide range of industries. It serves as a major hub for finance, culture, commerce, industry, education, technology, telecommunications, and transportation. The city has a thriving arts and music scene, making significant contributions to visual arts, literature, film, theater, comedy, food, dance, and various music genres. Chicago is also known for its prestigious universities, including the University of Chicago, Northwestern University, and the University of Illinois Chicago. Furthermore, it is home to professional sports teams in all major leagues.\n", + "Got output: Chicago is recognized for its robust economy, acting as a key hub for finance, culture, commerce, industry, education, technology, telecommunications, and transportation. It stands out in the derivatives market and is a top-ranking city in terms of gross domestic product. Chicago is a favored destination for tourists, known for its rich art scene covering visual arts, literature, film, theater, comedy, food, dance, and music. The city hosts prestigious educational institutions and professional sports teams across different leagues.\n", "========================\n", "\n" ] @@ -416,7 +416,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "Chicago is a vibrant city with a diverse economy and a wide range of industries. It serves as a major hub for finance, culture, commerce, industry, education, technology, telecommunications, and transportation. The city has a thriving arts and music scene, making significant contributions to visual arts, literature, film, theater, comedy, food, dance, and various music genres. 
Chicago is also known for its prestigious universities, including the University of Chicago, Northwestern University, and the University of Illinois Chicago. Furthermore, it is home to professional sports teams in all major leagues.\n" + "Chicago is known for its strong economy with a focus on finance, culture, commerce, industry, education, technology, telecommunications, and transportation. It is a major player in the derivatives market and boasts a high gross domestic product. The city is a popular tourist destination with a vibrant art scene that includes visual arts, literature, film, theater, comedy, food, dance, and music. Additionally, Chicago is home to prestigious educational institutions and professional sports teams across various leagues.\n" ] } ], diff --git a/docs/examples/retrievers/auto_vs_recursive_retriever.ipynb b/docs/examples/retrievers/auto_vs_recursive_retriever.ipynb index ed15a55ced23f..a1ce27db76c2e 100644 --- a/docs/examples/retrievers/auto_vs_recursive_retriever.ipynb +++ b/docs/examples/retrievers/auto_vs_recursive_retriever.ipynb @@ -406,7 +406,7 @@ "outputs": [], "source": [ "from llama_index.core.retrievers import VectorIndexAutoRetriever\n", - "from llama_index.core.vector_stores import MetadataInfo, VectorStoreInfo\n", + "from llama_index.core.vector_stores.types import MetadataInfo, VectorStoreInfo\n", "\n", "\n", "vector_store_info = VectorStoreInfo(\n", diff --git a/docs/examples/retrievers/videodb_retriever.ipynb b/docs/examples/retrievers/videodb_retriever.ipynb new file mode 100644 index 0000000000000..5431393f1bc5e --- /dev/null +++ b/docs/examples/retrievers/videodb_retriever.ipynb @@ -0,0 +1,458 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "\"Open\n", + "# VideoDB Retriever" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### RAG: Instantly Search and Stream Video Results 📺\n", + "\n", + "\n", + "> [VideoDB](https://videodb.io) is a serverless database 
designed to streamline the storage, search, editing, and streaming of video content. VideoDB offers random access to sequential video data by building indexes and developing interfaces for querying and browsing video content. Learn more at [docs.videodb.io](https://docs.videodb.io).\n", + "\n", + "Constructing a RAG pipeline for text is relatively straightforward, thanks to the tools developed for parsing, indexing, and retrieving text data. However, adapting RAG models for video content presents a greater challenge. Videos combine visual, auditory, and textual elements, requiring more processing power and sophisticated video pipelines.\n", + "\n", + "While Large Language Models (LLMs) excel with text, they fall short in helping you consume or create video clips. VideoDB provides a sophisticated database abstraction for your MP4 files, enabling the use of LLMs on your video data. With VideoDB, you can not only analyze but also `instantly watch video streams` of your search results.\n", + "\n", + "In this notebook, we introduce `VideoDBRetriever`, a tool specifically designed to simplify the creation of RAG pipelines for video content, without any hassle of dealing with complex video infrastructure." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + " \n", + "## 🛠️️ Setup connection" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Requirements\n", + "\n", + "To connect to VideoDB, simply get the API key and create a connection. This can be done by setting the `VIDEO_DB_API_KEY` environment variable. You can get it from 👉🏼 [VideoDB Console](https://console.videodb.io). 
( Free for first 50 uploads, **No credit card required!** )\n", + "\n", + "Get your `OPENAI_API_KEY` from OpenAI platform for `llama_index` response synthesizer.\n", + "\n", + "" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + "\n", + "os.environ[\"OPENAI_API_KEY\"] = \"\"\n", + "os.environ[\"VIDEO_DB_API_KEY\"] = \"\"" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Installing Dependencies\n", + "\n", + "To get started, we'll need to install the following packages:\n", + "\n", + "- `llama-index`\n", + "- `llama-index-retrievers-videodb`\n", + "- `videodb`" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "%pip install llama-index\n", + "%pip install videodb" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "%pip install llama-index-retrievers-videodb" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Data Ingestion\n", + "\n", + "Let's upload a few video files first. You can use any `public url`, `Youtube link` or `local file` on your system. First 50 uploads are free!" 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "from videodb import connect\n", + "\n", + "# connect to VideoDB\n", + "conn = connect()\n", + "\n", + "# upload videos to default collection in VideoDB\n", + "print(\"uploading first video\")\n", + "video1 = conn.upload(url=\"https://www.youtube.com/watch?v=lsODSDmY4CY\")\n", + "print(\"uploading second video\")\n", + "video2 = conn.upload(url=\"https://www.youtube.com/watch?v=vZ4kOr38JhY\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "> * `coll = conn.get_collection()` : Returns the default collection object.\n", + "> * `coll.get_videos()` : Returns a list of all the videos in the collection.\n", + "> * `coll.get_video(video_id)`: Returns the Video object for the given `video_id`." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Indexing\n", + "\n", + "To search bits inside a video, you have to index the video first. We have two types of indexing possible for a video.\n", + "\n", + "\n", + "- `index_spoken_words`: Indexes spoken words in the video.\n", + "- `index_scenes`: Indexes visuals of the video. 
`(Note: This feature is currently available only for beta users, join our discord for early access)` https://discord.gg/py9P639jGz " + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Indexing the videos...\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "100%|████████████████████████████████████████████████████████████████████████████████████████████████████| 100/100 [00:39<00:00, 2.56it/s] \n", + "100%|████████████████████████████████████████████████████████████████████████████████████████████████████| 100/100 [00:39<00:00, 2.51it/s] \n" + ] + } + ], + "source": [ + "print(\"Indexing the videos...\")\n", + "video1.index_spoken_words()\n", + "video2.index_spoken_words()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Querying\n", + "\n", + "Now that the videos are indexed, we can use `VideoDBRetriever` to fetch relevant nodes from VideoDB." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.retrievers.videodb import VideoDBRetriever\n", + "from llama_index.core import get_response_synthesizer\n", + "from llama_index.core.query_engine import RetrieverQueryEngine" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# VideoDBRetriever by default uses the default collection in the VideoDB\n", + "retriever = VideoDBRetriever()\n", + "\n", + "# use your llama_index response_synthesizer on search results.\n", + "response_synthesizer = get_response_synthesizer()\n", + "\n", + "query_engine = RetrieverQueryEngine(\n", + " retriever=retriever,\n", + " response_synthesizer=response_synthesizer,\n", + ")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Dopamine is a neurotransmitter that plays a key role in various brain functions, including motivation, reward, and pleasure. It is involved in regulating mood, movement, and cognitive function.\n" + ] + } + ], + "source": [ + "# query across all uploaded videos to get the text answer.\n", + "response = query_engine.query(\"What is Dopamine?\")\n", + "print(response)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Morning sunlight can help trigger a cortisol pulse shift, allowing individuals to capture a morning work block by waking up early and exposing themselves to sunlight. 
This exposure to morning sunlight, along with brief high-intensity exercise, can assist in adjusting the cortisol levels and potentially enhancing productivity during the early hours of the day.\n" + ] + } + ], + "source": [ + "response = query_engine.query(\"What's the benefit of morning sunlight?\")\n", + "print(response)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + " \n", + "## Watch Video Stream of Search Result\n", + "\n", + "Although, The `Nodes` returned by Retriever are of type `TextNode`. They also have metadata that can help you `watch the video stream` of results. You can create a compilation of all Nodes using VideoDB's [Programmable video streams](https://docs.videodb.io/version-0-0-3-timeline-and-assets-44). You can even modify it with Audio and Image overlays easily. \n", + "\n", + "![Timeline](https://codaio.imgix.net/docs/_s5lUnUCIU/blobs/bl-n4vT_dFztl/e664f43dbd4da89c3a3bfc92e3224c8a188eb19d2d458bebe049e780f72506ca6b19421c7168205f7ad307187e73da60c73cdbb9a0ef3fec77cc711927ad26a29a92cd13691fa9375c231f1c006853bacf28e09b3bf0bbcb5f7b76462b354a180fb437ad?auto=format%2Ccompress&fit=max \"Programmable Video Streams\")\n", + "\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "from videodb import connect, play_stream\n", + "from videodb.timeline import Timeline\n", + "from videodb.asset import VideoAsset" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "'https://console.videodb.io/player?url=https://stream.videodb.io/v3/published/manifests/9c39c8a9-62a2-4b5e-b15d-8565cc58c8ae.m3u8'" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# create video stream of search results\n", + "conn = connect()\n", + "timeline = Timeline(conn)\n", + "\n", + "relevant_nodes = retriever.retrieve(\"What's the benefit of morning 
sunlight?\")\n", + "\n", + "for node_obj in relevant_nodes:\n", + " node = node_obj.node\n", + " # create a video asset for each node\n", + " node_asset = VideoAsset(\n", + " asset_id=node.metadata[\"video_id\"],\n", + " start=node.metadata[\"start\"],\n", + " end=node.metadata[\"end\"],\n", + " )\n", + " # add the asset to timeline\n", + " timeline.add_inline(node_asset)\n", + "\n", + "# generate stream for the compiled timeline\n", + "stream_url = timeline.generate_stream()\n", + "play_stream(stream_url)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + " \n", + "### Configuring `VideoDBRetriever`\n", + "\n", + "**1. Retriever for only one Video**:\n", + "You can pass the `id` of the video object to search in only that video. \n", + "```python\n", + "VideoDBRetriever(video=\"my_video.id\")\n", + "```\n", + "\n", + "**2. Retriever for different types of indexes**:\n", + "```python\n", + "# VideoDBRetriever that uses keyword search - Matches exact occurrences of words and sentences. It only supports a single video. \n", + "keyword_retriever = VideoDBRetriever(search_type=\"keyword\", video=\"my_video.id\")\n", + "\n", + "# VideoDBRetriever that uses semantic search - Perfect for question-answering queries.\n", + "semantic_retriever = VideoDBRetriever(search_type=\"semantic\")\n", + "\n", + "# [only for beta users of VideoDB] VideoDBRetriever that uses scene search - Search visual information in the videos.\n", + "visual_retriever = VideoDBRetriever(search_type=\"scene\")\n", + "```\n", + "\n", + "**3. 
Configure threshold parameters**: \n", + "- `result_threshold`: is the threshold for number of results returned by retriever; the default value is `5`\n", + "- `score_threshold`: only nodes with score higher than `score_threshold` will be returned by retriever; the default value is `0.2` \n", + "\n", + "```python\n", + "custom_retriever = VideoDBRetriever(result_threshold=2, score_threshold=0.5)\n", + "```" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### View Specific Node\n", + "\n", + "To watch stream of each retrieved node, you can directly generate the stream of that part directly from `video` object of VideoDB. \n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "[NodeWithScore(node=TextNode(id_='6ca84002-49df-4091-901d-48248dbe0977', embedding=None, metadata={'collection_id': 'c-33978c87-33e6-4259-9e27-a9edc79be9ad', 'video_id': 'm-f201ff7c-88ec-47ca-938b-a4e968676ba0', 'length': '1496.711837', 'title': 'AMA #1: Leveraging Ultradian Cycles, How to Protect Your Brain, Seed Oils Examined and More', 'start': 906.01, 'end': 974.59}, excluded_embed_metadata_keys=[], excluded_llm_metadata_keys=[], relationships={}, text=\" So for somebody that wants to learn an immense amount of material, or who has the opportunity to capture another Altradian cycle, the other time where that tends to occur is also early days. So some people, by waking up early and using stimulants like caffeine and hydration or some brief high intensity city exercise, can trigger that cortisol pulse to shift a little bit earlier so that they can capture a morning work block that occurs somewhere, let's say between six and 07:30 a.m. So let's think about our typical person, at least in my example, that's waking up around 07:00 a.m. And then I said, has their first Altradian work cycle really flip on? Because that bump in cortisol around 930 or 10:00 a.m. If that person were, say, to. 
Set their alarm clock for 05:30 a.m. Then get up, get some artificial light. If the sun isn't out, turn on bright artificial lights. Or if the sun happens to be up that time of year, get some sunlight in your eyes. But irrespective of sunlight, were to get a little bit of brief, high intensity exercise, maybe ten or 15 minutes of skipping rope or even just jumping jacks or go out for a brief jog.\", start_char_idx=None, end_char_idx=None, text_template='{metadata_str}\\n\\n{content}', metadata_template='{key}: {value}', metadata_seperator='\\n'), score=0.440981567),\n", + " NodeWithScore(node=TextNode(id_='2244fd64-121e-4699-ba36-f0f6a110750f', embedding=None, metadata={'collection_id': 'c-33978c87-33e6-4259-9e27-a9edc79be9ad', 'video_id': 'm-eae54005-b5ca-44f1-9c31-fcdb2f1db56a', 'length': '1830.498685', 'title': 'AMA #2: Improve Sleep, Reduce Sugar Cravings, Optimal Protein Intake, Stretching Frequency & More', 'start': 899.772, 'end': 977.986}, excluded_embed_metadata_keys=[], excluded_llm_metadata_keys=[], relationships={}, text=\" Because the study, as far as I know, has not been done. Whether or not doing resistance training or some other type of exercise would have led to the same effect. Although I have to imagine that if it's moderately intense to intense resistance training, provided it's done far enough away from going to sleep right prior to 6 hours before sleep, that one ought to see the same effects, although that was not a condition in this study. But it's a very nice study. They looked at everything from changes in core body temperature to caloric expenditure. They didn't see huge changes in core body temperature changes, so that couldn't explain the effect. It really appears that the major effect of improving slow wave sleep was due to something in changing the fine structure of the brainwaves that occur during slow wave sleep. In fact, and this is an important point. 
The subjects in this study did not report subjectively feeling that much better from their sleep. So you might say, well then, why would I even want to bother? However, it's well known that getting sufficient slow wave sleep is important not just for repair, excuse me, for repair of bodily tissues, but also for repair of brain tissues and repair and washout of debris in the brain. And that debris is known to lead to things like dementia.\", start_char_idx=None, end_char_idx=None, text_template='{metadata_str}\\n\\n{content}', metadata_template='{key}: {value}', metadata_seperator='\\n'), score=0.282342136)]" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "relevant_nodes" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "'https://console.videodb.io/player?url=https://stream.videodb.io/v3/published/manifests/b7201145-7302-4ec5-b87c-d1a4c6592f69.m3u8'" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "from videodb import connect\n", + "\n", + "# retriever = VideoDBRetriever()\n", + "# relevant_nodes = retriever.retrieve(\"What is Dopamine?\")\n", + "\n", + "video_node = relevant_nodes[0].node\n", + "conn = connect()\n", + "coll = conn.get_collection()\n", + "\n", + "video = coll.get_video(video_node.metadata[\"video_id\"])\n", + "start = video_node.metadata[\"start\"]\n", + "end = video_node.metadata[\"end\"]\n", + "\n", + "stream_url = video.generate_stream(timeline=[(start, end)])\n", + "play_stream(stream_url)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 🧹 Cleanup" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "video1.delete()\n", + "video2.delete()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 👨‍👩‍👧‍👦 Support & 
Community\n", + "\n", + "Leveraging the capabilities of automation and AI-driven content understanding, the possibilities for creation and repurposing of your content are boundless with VideoDB.\n", + "\n", + "If you have any questions or feedback, feel free to reach out to us 🙌🏼\n", + "\n", + "- [Discord](https://discord.gg/py9P639jGz) \n", + "- [GitHub](https://github.com/video-db) \n", + "- [VideoDB](https://videodb.io) \n", + "- [Email](mailto:ashu@videodb.io) " + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3" + } + }, + "nbformat": 4, + "nbformat_minor": 4 +} diff --git a/docs/examples/vector_stores/DuckDBDemo.ipynb b/docs/examples/vector_stores/DuckDBDemo.ipynb new file mode 100644 index 0000000000000..4d0618c2f18c4 --- /dev/null +++ b/docs/examples/vector_stores/DuckDBDemo.ipynb @@ -0,0 +1,374 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# DuckDB\n", + "\n", + ">[DuckDB](https://duckdb.org/docs/api/python/overview) is a fast in-process analytical database. 
DuckDB is under an MIT license.\n", + "\n", + "In this notebook we are going to show how to use DuckDB as a vector store in LlamaIndex.\n", + "\n", + "Install DuckDB with:\n", + "\n", + "```sh\n", + "pip install duckdb\n", + "```\n", + "\n", + "Make sure to use the latest DuckDB version (>= 0.10.0).\n", + "\n", + "You can run DuckDB in different modes depending on persistence:\n", + "- `in-memory` is the default mode, where the database is created in memory; you can force this mode by setting `database_name = \":memory:\"` when initializing the vector store.\n", + "- `persistence` is enabled by giving the database a name, e.g. `database_name = \"my_vector_store.duckdb\"`; the database is then persisted in the default `persist_dir` or in the directory you set.\n", + "\n", + "With the vector store created, you can:\n", + "- `.add` \n", + "- `.get` \n", + "- `.update`\n", + "- `.upsert`\n", + "- `.delete`\n", + "- `.peek`\n", + "- `.query` to run a search. \n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Basic example\n", + "\n", + "In this basic example, we take the Paul Graham essay, split it into chunks, embed it using an embedding model, load it into `DuckDBVectorStore`, and then query it.\n", + "\n", + "For the embedding model we will use OpenAI. " + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "If you're opening this Notebook on Colab, you will probably need to install LlamaIndex 🦙." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "!pip install llama-index" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Creating a DuckDB Index" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "!pip install duckdb\n", + "!pip install llama-index-vector-stores-duckdb" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.core import VectorStoreIndex, SimpleDirectoryReader\n", + "from llama_index.vector_stores.duckdb import DuckDBVectorStore\n", + "from llama_index.core import StorageContext\n", + "\n", + "from IPython.display import Markdown, display" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Setup OpenAI API\n", + "import os\n", + "import openai\n", + "\n", + "openai.api_key = os.environ[\"OPENAI_API_KEY\"]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Download and prepare the sample dataset" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "--2024-02-16 19:38:34-- https://raw.githubusercontent.com/run-llama/llama_index/main/docs/examples/data/paul_graham/paul_graham_essay.txt\n", + "Resolving raw.githubusercontent.com (raw.githubusercontent.com)... 185.199.110.133, 185.199.111.133, 185.199.108.133, ...\n", + "Connecting to raw.githubusercontent.com (raw.githubusercontent.com)|185.199.110.133|:443... connected.\n", + "HTTP request sent, awaiting response... 
200 OK\n", + "Length: 75042 (73K) [text/plain]\n", + "Saving to: ‘data/paul_graham/paul_graham_essay.txt’\n", + "\n", + "data/paul_graham/pa 100%[===================>] 73.28K --.-KB/s in 0.06s \n", + "\n", + "2024-02-16 19:38:34 (1.24 MB/s) - ‘data/paul_graham/paul_graham_essay.txt’ saved [75042/75042]\n", + "\n" + ] + } + ], + "source": [ + "!mkdir -p 'data/paul_graham/'\n", + "!wget 'https://raw.githubusercontent.com/run-llama/llama_index/main/docs/examples/data/paul_graham/paul_graham_essay.txt' -O 'data/paul_graham/paul_graham_essay.txt'" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "documents = SimpleDirectoryReader(\"data/paul_graham/\").load_data()\n", + "\n", + "vector_store = DuckDBVectorStore()\n", + "storage_context = StorageContext.from_defaults(vector_store=vector_store)\n", + "\n", + "index = VectorStoreIndex.from_documents(\n", + " documents, storage_context=storage_context\n", + ")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/markdown": [ + "The author mentions that before college, they worked on two main things outside of school: writing and programming. They wrote short stories and also tried writing programs on an IBM 1401 computer. They later got a microcomputer and started programming more extensively." + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "query_engine = index.as_query_engine()\n", + "response = query_engine.query(\"What did the author do growing up?\")\n", + "display(Markdown(f\"{response}\"))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Persisting to disk example\n", + "\n", + "Extending the previous example, if you want to save to disk, simply initialize the DuckDBVectorStore by specifying a database name and persist directory." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Save to disk\n", + "documents = SimpleDirectoryReader(\"data/paul_graham/\").load_data()\n", + "\n", + "vector_store = DuckDBVectorStore(\"pg.duckdb\", persist_dir=\"./persist/\")\n", + "storage_context = StorageContext.from_defaults(vector_store=vector_store)\n", + "\n", + "index = VectorStoreIndex.from_documents(\n", + " documents, storage_context=storage_context\n", + ")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Load from disk\n", + "vector_store = DuckDBVectorStore.from_local(\"./persist/pg.duckdb\")\n", + "index = VectorStoreIndex.from_vector_store(vector_store)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/markdown": [ + "The author mentions that before college, they worked on two main things outside of school: writing and programming. They wrote short stories and also tried writing programs on an IBM 1401 computer. They later got a microcomputer and started programming more extensively." + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Query Data\n", + "query_engine = index.as_query_engine()\n", + "response = query_engine.query(\"What did the author do growing up?\")\n", + "display(Markdown(f\"{response}\"))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Metadata filter example" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "It is possible to narrow down the search space by filtering on metadata. Below is an example that shows this in practice. 
" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.core.schema import TextNode\n", + "\n", + "nodes = [\n", + " TextNode(\n", + " **{\n", + " \"text\": \"The Shawshank Redemption\",\n", + " \"metadata\": {\n", + " \"author\": \"Stephen King\",\n", + " \"theme\": \"Friendship\",\n", + " \"year\": 1994,\n", + " \"ref_doc_id\": \"doc_1\",\n", + " },\n", + " }\n", + " ),\n", + " TextNode(\n", + " **{\n", + " \"text\": \"The Godfather\",\n", + " \"metadata\": {\n", + " \"director\": \"Francis Ford Coppola\",\n", + " \"theme\": \"Mafia\",\n", + " \"year\": 1972,\n", + " \"ref_doc_id\": \"doc_1\",\n", + " },\n", + " }\n", + " ),\n", + " TextNode(\n", + " **{\n", + " \"text\": \"Inception\",\n", + " \"metadata\": {\n", + " \"director\": \"Christopher Nolan\",\n", + " \"theme\": \"Sci-fi\",\n", + " \"year\": 2010,\n", + " \"ref_doc_id\": \"doc_2\",\n", + " },\n", + " }\n", + " ),\n", + "]\n", + "\n", + "vector_store = DuckDBVectorStore()\n", + "storage_context = StorageContext.from_defaults(vector_store=vector_store)\n", + "index = VectorStoreIndex(nodes, storage_context=storage_context)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Define the metadata filters." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.core.vector_stores import ExactMatchFilter, MetadataFilters\n", + "\n", + "filters = MetadataFilters(\n", + " filters=[ExactMatchFilter(key=\"theme\", value=\"Mafia\")]\n", + ")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Use the index as a retriever with the metadata filter option. 
" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "[NodeWithScore(node=TextNode(id_='736a1279-4ebd-496e-87b5-925197646477', embedding=[-0.006784645840525627, -0.021635770797729492, -0.015731574967503548, -0.03265434503555298, -0.005616107489913702, 0.025351788848638535, -0.0057811918668448925, 0.0027044713497161865, -0.01623653806746006, -0.023759208619594574, 0.027164479717612267, 0.017932699993252754, 0.029028963297605515, 0.003991158679127693, -0.0009047273779287934, 0.010973258875310421, 0.027164479717612267, -0.012844215147197247, 0.006972389295697212, -0.011148054152727127, 0.003528274828568101, 0.007736308965831995, -0.031022923067212105, -0.013996569439768791, 0.0012567456578835845, 0.004988139029592276, 0.010571876540780067, -0.024290068075060844, 0.019123896956443787, -0.02119554579257965, 0.014022464863955975, -0.023098871111869812, -0.009050510823726654, 0.001241370104253292, 0.006881754379719496, -0.007186027709394693, -0.0036577528808265924, -0.012734158895909786, 0.0034473512787371874, 0.003987921867519617, 0.01084378082305193, 0.003936130553483963, -0.01015754695981741, -0.011970238760113716, 0.004363407846540213, 0.0013425247743725777, 0.03288740664720535, -0.009186462499201298, -0.009549001231789589, 0.01988781802356243, 0.00900519359856844, 0.03363838046789169, -0.012539941817522049, -0.031955163925886154, 0.02144155278801918, 0.013096697628498077, -0.0035088532604277134, -0.009050510823726654, 0.002782158087939024, -0.014760489575564861, 0.0010722394799813628, 0.003816363401710987, -0.028821798041462898, 0.011102736927568913, -0.011335796676576138, -0.012798897922039032, -0.001216283766552806, 0.018787255510687828, 3.707318683154881e-05, 0.00591390673071146, 0.03358658775687218, 0.027371644973754883, -0.017414787784218788, 0.012973693199455738, 0.007419087924063206, -0.010791989043354988, -0.024303017184138298, 0.001213856041431427, 0.004201560281217098, 
-0.0054024686105549335, 0.023085923865437508, -0.02022445946931839, -0.0027643549256026745, 0.022334951907396317, 0.007198975421488285, 0.02203715220093727, -0.013841195963323116, 0.02256801165640354, 0.0038454958703368902, 0.0022626277059316635, -0.018424715846776962, 0.006308814510703087, 0.017220571637153625, 0.00503345625475049, -0.0069464934058487415, 0.029313813894987106, -0.007665096316486597, 0.004486411809921265, 0.029158441349864006, -0.013193805702030659, 0.0007109150174073875, 0.0006736901123076677, 0.00758093548938632, -0.011445852927863598, -0.021739352494478226, -0.008085899986326694, 0.028614632785320282, -0.009128197096288204, 0.008506703190505505, -0.006392975337803364, -0.020366886630654335, 0.021091962233185768, 0.030582698062062263, -0.046482592821121216, 0.016819190233945847, -0.016806241124868393, 0.014799333177506924, -0.011957291513681412, 0.01698751002550125, -0.026102760806679726, -0.010623668320477009, 0.04780326783657074, 0.019020315259695053, -0.0176090057939291, 0.02243853360414505, -0.0009945527417585254, 0.007542092353105545, 0.0009281952516175807, -0.011776021681725979, -0.008830398321151733, 0.05432895943522453, 0.01621064357459545, 0.00039571707020513713, 0.00791757833212614, -0.013044905848801136, 0.03190337494015694, -0.01125163584947586, 0.028847694396972656, -0.0282003041356802, -0.02044457197189331, 0.02770828641951084, 0.0271126888692379, -0.018994418904185295, 0.011983186937868595, -0.009613740257918835, 0.00953605305403471, 0.013491605408489704, -0.00014161653234623373, 0.026154551655054092, -0.021700508892536163, 0.022697489708662033, -0.027967242524027824, -0.001959972782060504, 0.02586969919502735, 0.03231770172715187, 0.019085053354501724, 0.001658936613239348, -0.006674589589238167, -0.014436794444918633, 0.005684083327651024, 0.023163611069321632, 0.0244583897292614, 0.0008909703465178609, -0.007250766735523939, 0.0011402154341340065, 0.022891705855727196, 0.029650457203388214, 0.006758750416338444, 
0.00384873291477561, 0.004492885898798704, -0.0012939705047756433, 0.02680194191634655, -0.00532154506072402, 0.023396670818328857, -0.015653887763619423, 0.02957276999950409, 0.023293089121580124, 0.01736299693584442, -0.038196004927158356, -0.007444983813911676, -0.005366862285882235, 0.02031509391963482, 0.03356069326400757, 0.051221489906311035, -0.007716887630522251, -0.0014954706421121955, -0.006380027160048485, 0.005790902767330408, 0.01244930736720562, -0.0006445575854741037, 0.0018499166471883655, 0.021959464997053146, 0.01829523779451847, -0.013815300539135933, -0.6500830054283142, -0.008221851661801338, -0.01732415333390236, -0.012915428727865219, 0.0010447254171594977, 0.030997028574347496, 0.014216681942343712, 0.022697489708662033, -0.0171428844332695, -0.004389303270727396, -0.011387588456273079, 0.0074126143008470535, 0.0467415489256382, -0.003353479551151395, -0.05448433384299278, -0.03526980057358742, -0.013491605408489704, -0.021234387531876564, -0.023241296410560608, 0.0033761383965611458, -0.020392781123518944, 0.008267168886959553, -0.026465298607945442, -0.012022030539810658, 0.002188177779316902, -0.004007343202829361, 0.02667246386408806, -0.017311206087470055, 0.007192501798272133, 0.0038325481582432985, -0.005917143542319536, 0.013161436654627323, 0.013802352361381054, 0.006166388746351004, 0.04088914394378662, -0.007561514154076576, -0.021855883300304413, 0.028821798041462898, 0.0032385678496211767, 0.025170518085360527, -0.005162934307008982, -0.008636181242763996, 0.014915863052010536, -0.018994418904185295, -0.01266941986978054, -0.013400970958173275, 0.04000869393348694, -0.022270211949944496, 0.017816169187426567, 0.00038539929664693773, 0.00421450799331069, 0.016120009124279022, -0.0027659733314067125, 0.01747952774167061, 0.0074838269501924515, 0.004819817841053009, 0.032990988343954086, -0.003131748642772436, -0.0012308500008657575, 0.00835132971405983, 0.003641568124294281, -0.0026170737110078335, 0.0176090057939291, 
-0.0012494624825194478, 0.02072942443192005, -0.005936565343290567, -0.00503993034362793, 0.004994613118469715, 0.0225939080119133, -0.008435490541160107, -0.0035897770430892706, 0.016663815826177597, -0.019706549122929573, -0.02923612669110298, 0.025442423298954964, -0.0031560256611555815, 0.01698751002550125, 0.015822209417819977, 0.005907432641834021, 0.008655603043735027, -0.010565402917563915, 0.0022885233629494905, -0.029365604743361473, -0.01378940511494875, 0.009464840404689312, -0.00693354569375515, -0.05427716672420502, 0.016158850863575935, 0.00040603484376333654, 0.0036577528808265924, 0.03371606394648552, -0.009775587357580662, -0.004162717144936323, 0.026141604408621788, 0.010397081263363361, 0.010902046225965023, -0.007477353326976299, -0.007833417505025864, 0.017583109438419342, -0.023616783320903778, -0.011659491807222366, 0.0013117737835273147, -0.012041452340781689, 0.0014760489575564861, 0.02421238273382187, 0.002783776493743062, -0.0025571901351213455, 0.027319854125380516, 0.050030291080474854, -0.01894262805581093, 0.030453220009803772, 0.005295649170875549, -0.0030265478417277336, -0.013621083460748196, 0.00869444664567709, -0.02533883973956108, 0.02817440778017044, -0.004347223322838545, 0.0054024686105549335, -0.000619875849224627, -0.013116119429469109, -0.009322414174675941, -0.008759185671806335, -0.010306446813046932, 0.016430756077170372, 0.00438606645911932, -0.023474358022212982, -0.02312476746737957, -0.010332342237234116, 0.017893856391310692, 0.01829523779451847, -0.0025312944781035185, 0.01422963012009859, -0.0009710848098620772, 0.0136340307071805, -0.0002207194920629263, -0.002903543645516038, -0.0052438583225011826, 0.026348767802119255, -0.03016836941242218, 0.014074256643652916, -0.008778606541454792, 0.00034372357185930014, -0.0017592820804566145, 0.01346570998430252, -0.031307775527238846, -0.010125177912414074, -0.026063917204737663, -0.01676739752292633, -0.00585887860506773, -0.005726163741201162, 0.007762204855680466, 
-0.0018774307100102305, 0.013582239858806133, 0.011413483880460262, -0.02387573942542076, -0.01614590361714363, -0.005700267851352692, -0.02489861473441124, -0.017596056684851646, 0.016689712181687355, 0.0020263304468244314, -0.01804923079907894, -0.0006117834709584713, 0.006214942783117294, -0.0022011257242411375, 0.007710413541644812, 0.020548155531287193, 0.01118689775466919, -0.02682783640921116, 0.022088943049311638, 0.01149764470756054, 0.01259173359721899, 0.012429885566234589, -0.005528709851205349, 0.022231368348002434, 0.009432470425963402, -0.004965480417013168, -0.012132086791098118, -0.008286590687930584, 0.011737179011106491, -0.011653018184006214, 0.01716878078877926, -0.00195188052020967, 0.039413098245859146, -0.015213662758469582, 0.036978911608457565, 0.015071236528456211, -0.022075995802879333, 0.020638789981603622, -0.013070802204310894, 0.0008796410402283072, -0.005153223406523466, -0.019214531406760216, 0.0141001520678401, 0.027993138879537582, -0.00811826903373003, 0.01869661919772625, 0.0059883566573262215, 0.0386362299323082, 0.0336642749607563, -0.014656906947493553, 0.02662067301571369, -0.012235668487846851, -0.004415199160575867, -0.020496364682912827, 0.015874000266194344, -0.010973258875310421, 0.013659927062690258, 0.0005409751902334392, 0.004628837574273348, -0.02328014001250267, -0.008344856090843678, -0.007762204855680466, 0.02651708945631981, 0.02629697695374489, -0.020366886630654335, -0.0016095731407403946, -0.01922748051583767, -0.024290068075060844, 0.006758750416338444, 0.022956445813179016, -0.0028274753130972385, -0.006998284719884396, -0.0035703552421182394, -0.006745802704244852, 0.0014995168894529343, 0.020574050024151802, 0.010332342237234116, -0.027760079130530357, -0.013193805702030659, 0.03902466222643852, -0.0058685895055532455, 0.010779041796922684, -0.008849820122122765, -0.007166605908423662, -0.009380679577589035, -0.017816169187426567, 0.01794564723968506, -0.009348309598863125, 0.015563253313302994, 
0.03205874562263489, 0.029831726104021072, -0.01820460334420204, 0.013180858455598354, -0.01966770552098751, 0.0123910428956151, -0.00822832528501749, -0.020340990275144577, 0.020431624725461006, -0.00789815653115511, 0.006218180060386658, -0.011426431126892567, -0.00622465368360281, 0.034389350563287735, -0.017181728035211563, 0.0029682826716452837, 0.007218397222459316, 0.013375075533986092, 0.03306867554783821, 0.011788969859480858, 0.006156677845865488, 0.0050561148673295975, 0.02449723333120346, 0.009031089022755623, 0.0038875762838870287, 4.352179530542344e-05, -0.0010155929485335946, -0.01439795084297657, -0.024600815027952194, -0.009853274561464787, -0.0021541898604482412, 0.014643959701061249, -0.015576200559735298, 0.015407879836857319, 0.009069932624697685, 0.004318090621381998, 0.007665096316486597, 0.010371185839176178, -0.0017317679012194276, -0.030997028574347496, -0.0030653912108391523, 0.03594308719038963, -0.009173514321446419, 0.00014424655819311738, -0.008603811264038086, 0.013970674015581608, -0.006804067641496658, 0.007438509725034237, -0.005014034919440746, -0.014825228601694107, 0.010455346666276455, 0.00681701535359025, 0.005476918537169695, -0.0021104910410940647, -0.012222721241414547, 0.01916274055838585, -0.021493343636393547, -0.002458463190123439, -0.027682391926646233, -0.0064447661861777306, -0.001683213748037815, -0.006836437154561281, -0.02053520642220974, 0.029987100511789322, 0.006606613751500845, 0.00537657318636775, -0.010164021514356136, 0.0072378190234303474, 0.01517481915652752, 0.01248167734593153, 0.009639635682106018, -0.020625842735171318, -0.022399690002202988, 0.0026850495487451553, -0.016845084726810455, -0.015757469460368156, -0.005415416322648525, 0.0188519936054945, -0.004806870128959417, 0.003722491906955838, -0.026374664157629013, -0.0345965139567852, -0.0015901514561846852, 0.0869574099779129, 0.010526559315621853, 0.030815759673714638, 0.026154551655054092, 0.01125163584947586, -0.010338816791772842, 
-0.03205874562263489, -0.022930549457669258, 0.003819600446149707, -0.024769136682152748, -0.016573181375861168, -0.03172210603952408, 0.011277532204985619, 0.01508418470621109, 0.03842906281352043, -0.012876585125923157, -0.010688407346606255, -0.00038357850280590355, -7.556253694929183e-05, -0.013892986811697483, -0.009322414174675941, 0.008085899986326694, 0.017116988077759743, 0.00822832528501749, -0.016430756077170372, -0.04959006607532501, 0.017065197229385376, -0.0019356957636773586, 0.003796941600739956, -0.02256801165640354, -0.0033372947946190834, -0.0015772036276757717, -0.008409595116972923, 0.005661424715071917, -0.0016476073069497943, -0.0026737202424556017, 0.03918003663420677, 0.013944778591394424, 0.017596056684851646, -0.006609850563108921, 0.009782060980796814, -0.022775176912546158, -0.015110080130398273, -0.014022464863955975, 0.028977170586586, -0.014190786518156528, -0.028718216344714165, 0.011050945147871971, 0.018877889961004257, -0.02022445946931839, 0.029650457203388214, 0.015187766402959824, -0.0006619561463594437, 0.0015861052088439465, 0.019486436620354652, 0.011232214979827404, 0.0028938327450305223, 0.015420827083289623, -0.0027934873942285776, 0.019395800307393074, -0.02028919942677021, -0.037626300007104874, 0.007509722840040922, -0.010170495137572289, 0.009128197096288204, -0.01586105301976204, -0.01935695856809616, -0.008603811264038086, -0.007406140211969614, -0.01595168747007847, 0.002808053744956851, -0.008105321787297726, -0.013362127356231213, 0.0021460975985974073, 0.018217552453279495, -0.0031819213181734085, 0.006745802704244852, 0.0015755851054564118, 0.030893445014953613, 0.009594318456947803, -0.02219252474606037, -0.030271951109170914, -0.002346788300201297, -0.0392577238380909, -0.0025976519100368023, 0.007988790981471539, -0.019085053354501724, -0.014359108172357082, -0.02000434696674347, -0.0018580090254545212, 0.006231127772480249, -0.007211923599243164, 0.022671593353152275, -0.015809260308742523, 
-0.00040987873217090964, -0.0020554629154503345, 0.005285938270390034, 0.0022561538498848677, -0.0026138366665691137, -0.00391023512929678, 0.02091069333255291, -0.02471734583377838, -0.017932699993252754, 0.008344856090843678, -0.004473464097827673, -0.0037645723205059767, -0.0007355967536568642, 0.00716013228520751, -0.0007975033950060606, -0.005629055202007294, 0.01747952774167061, -0.031307775527238846, 0.002071647671982646, -0.02359088696539402, 0.0002816146006807685, 0.01960296556353569, 0.005635528825223446, 0.0005057733505964279, 0.0063703167252242565, -0.022231368348002434, -0.0036253833677619696, -0.011814865283668041, 0.012235668487846851, 0.03938720002770424, -0.01235867291688919, -0.011542961932718754, 0.021493343636393547, -0.011860182508826256, 0.02175229974091053, -0.0019955793395638466, -0.039931006729602814, 0.009717321954667568, 0.011834287084639072, -0.008545546792447567, -0.004878082778304815, -0.019344009459018707, 0.007444983813911676, -0.000181370327482, -0.02299528941512108, -0.0012025267351418734, -0.025546004995703697, -0.008454912342131138, -0.0036448051687330008, -0.0171428844332695, 0.00028485155780799687, -0.02296939305961132, -0.004657970275729895, -0.009930960834026337, -0.012416938319802284, 0.015744522213935852, -0.021234387531876564, -0.021791143342852592, -0.0044799381867051125, 0.0029731381218880415, 0.003018455347046256, -0.03249897435307503, -0.038506750017404556, -0.013239122927188873, 0.004169190768152475, 0.01567978225648403, 0.03418218716979027, -0.0008974442607723176, 0.011012102477252483, 0.00018056108092423528, -0.005820035003125668, 0.026089811697602272, 0.000589934061281383, 0.01794564723968506, -0.0021428605541586876, 0.04360818490386009, 0.037445031106472015, 0.0029731381218880415, 0.018722515553236008, 0.0025005433708429337, 0.022166630253195763, 0.01645665057003498, 0.009458365850150585, 0.019408749416470528, 0.014967653900384903, -0.018101021647453308, -0.008940454572439194, 0.03154083713889122, 
-0.025066936388611794, -0.01645665057003498, -0.011737179011106491, -0.017842065542936325, 0.0005810324219055474, -0.029987100511789322, -0.02724216692149639, 0.012837741523981094, 0.02693141996860504, -0.01745363138616085, -0.00455762492492795, -0.014967653900384903, 0.007315505761653185, -0.03542517498135567, -0.001539978664368391, 0.0010107374982908368, 0.01835997775197029, 0.013148488476872444, 0.013569291681051254, 0.030556803569197655, -0.00402029138058424, -0.029495082795619965, 0.0038454958703368902, 0.0520501472055912, -0.008888662792742252, 0.009840326383709908, 0.01463101152330637, -0.013737613335251808, 0.00866207666695118, -0.02923612669110298, -0.012352199293673038, -0.04513602331280708, 0.014954706653952599, 0.003521800972521305, 0.0026219291612505913, 0.0035897770430892706, 0.004907215479761362, -0.023047080263495445, 0.03962026163935661, -0.012125612236559391, 0.03586539998650551, 0.006305577699095011, 0.0193181149661541, 0.015498514287173748, 0.00633470993489027, -0.009943909011781216, 0.030220160260796547, 0.005703505128622055, -0.0017689928645268083, 0.022542115300893784, 0.01257231179624796, 0.011847235262393951, -0.0072442926466465, -0.0020020531956106424, -0.01617179997265339, -0.022826967760920525, -0.01957707107067108, 0.019046209752559662, 0.033172257244586945, 0.016754450276494026, -0.012183877639472485, -0.0023435514885932207, 0.012643524445593357, 0.002867937320843339, -0.0037775200325995684, -0.004780974239110947, -0.003266081912443042, -0.0467415489256382, -0.012598207220435143, -0.019615912809967995, -0.01117394957691431, -0.01683213748037815, -0.006661641877144575, -0.03889518603682518, 0.012403990142047405, -0.011665965430438519, 0.006078991107642651, -0.01736299693584442, -0.026167498901486397, 0.04521371051669121, 0.011659491807222366, -0.009056984446942806, 0.026193395256996155, -0.0013781312154605985, -0.019486436620354652, -0.011471749283373356, -0.003118800697848201, 0.02786366082727909, 0.005379809997975826, 
-0.0032709373626857996, 0.003230475587770343, 0.009827378205955029, -0.008577915839850903, 0.0021153464913368225, -0.013621083460748196, -0.015420827083289623, -0.010306446813046932, -0.031178297474980354, -0.011957291513681412, 0.011523540131747723, -0.00889513734728098, 0.01355634443461895, -0.008435490541160107, -0.016741503030061722, 0.012242143042385578, -0.0033631904516369104, 0.019551174715161324, -0.026542985811829567, -0.029210232198238373, -0.023176558315753937, 0.011057419702410698, 0.0012502716854214668, -0.017557213082909584, -0.00044184361468069255, 0.0015027538174763322, 0.03754861280322075, -0.015886947512626648, 0.01801038719713688, -0.02168756164610386, 0.005826509092003107, -0.008862767368555069, 0.019085053354501724, -0.001272930414415896, -0.009529579430818558, 0.010558929294347763, -0.018282290548086166, 0.0035444595851004124, 0.013491605408489704, 0.010202865116298199, 0.024354808032512665, 0.013983621262013912, -0.017906803637742996, 0.002309563336893916, 0.02299528941512108, -0.008027634583413601, -0.005648477002978325, 0.0002723083598539233, 0.035917192697525024, -0.01621064357459545, 0.006425344850867987, 0.01779027469456196, -0.008927506394684315, 0.0011426431592553854, 0.004457279574126005, -0.0035120900720357895, 0.01126458402723074, -0.03703070059418678, -0.003347005695104599, -0.01916274055838585, 0.039931006729602814, -0.004376355558633804, 0.011640070006251335, -0.014074256643652916, -0.009652582928538322, -0.007198975421488285, 0.024393651634454727, -0.009743218310177326, -0.02290465496480465, 0.02318950556218624, 0.023383723571896553, -0.0031754474621266127, 0.010008648037910461, -0.0030653912108391523, -0.02496335469186306, 0.0024681738577783108, -0.038662124425172806, -0.035140324383974075, -0.03218822553753853, -0.026905523613095284, 0.04536908492445946, 0.007645674515515566, -0.0019486435921862721, -0.004836002364754677, 0.009665531106293201, -0.03125598281621933, -0.02877000719308853, -9.533827324048616e-06, 
0.019279271364212036, 0.02549421414732933, 0.005114380270242691, -0.006399448961019516, 0.00869444664567709, 0.005457496736198664, 0.0132455974817276, -0.019654756411910057, 0.0216616652905941, -0.009031089022755623, -0.01157533098012209, 0.016845084726810455, 0.005237384233623743, -0.0005272181588225067, -0.004233929794281721, -0.007943473756313324, 0.01736299693584442, -0.011089788749814034, 0.02356499247252941, -0.02414764277637005, -0.011394062079489231, -0.027785973623394966, -0.016094112768769264, -0.014721645973622799, 0.002252916805446148, -0.0026219291612505913, -0.02069058082997799, 0.0057811918668448925, -0.008448437787592411, 0.0053992317989468575, -0.023137714713811874, -0.01007986068725586, 0.01876135915517807, -0.008921032771468163, -0.01007986068725586, -0.008921032771468163, -0.012365146540105343, 0.024536076933145523, -0.011743652634322643, 0.010112229734659195, 0.019214531406760216, -0.00967847928404808, 0.0019939609337598085, 0.014592167921364307, -0.0014622919261455536, -0.004460516385734081, 0.008027634583413601, -0.03293919935822487, -0.03604666888713837, -0.025817908346652985, -0.0032822666689753532, 0.012637050822377205, -0.003010363085195422, 0.03964615613222122, -0.015666835010051727, -0.007567987777292728, -0.005496340338140726, -0.0076197790913283825, -0.004959006793797016, -0.007024180144071579, 0.02449723333120346, -0.027164479717612267, -0.001715583261102438, -0.020276252180337906, 0.0036027247551828623, -0.02135091833770275, -0.0026154550723731518, -0.0107531463727355, -0.0038066525012254715, -0.017583109438419342, -0.00842901598662138, -0.012423411943018436, -0.013478657230734825, -0.017647847533226013, -0.03309457004070282, -0.011924921534955502, 0.03902466222643852, 0.20778626203536987, 0.006422107573598623, -0.012080295011401176, 0.016650868579745293, -0.017660796642303467, 0.018088074401021004, 0.022645698860287666, -0.0006623608060181141, -0.012863636948168278, 0.012009082362055779, -0.013193805702030659, 0.00944541860371828, 
0.033301737159490585, 0.008396646939218044, 0.009438944980502129, -0.017997438088059425, -0.021700508892536163, -0.02113080583512783, -0.026284029707312584, -0.019188636913895607, -0.004114162642508745, 0.005713215563446283, -0.005680846516042948, -0.002369446912780404, 0.029779935255646706, 0.008545546792447567, -0.0165213905274868, 0.004288957919925451, 0.017751431092619896, 0.025002198293805122, -0.004230692982673645, -0.028070826083421707, 0.0031803029123693705, -0.005535183474421501, -0.031929269433021545, 0.016404859721660614, -0.0244583897292614, -0.00933536235243082, -0.010791989043354988, 0.006043384782969952, -0.004068845417350531, 0.014385003596544266, -0.005175882019102573, -0.00130287220235914, 0.008195956237614155, 0.014255525544285774, -0.021894726902246475, 0.011646544560790062, -0.014605116099119186, 0.010837307199835777, -0.04153653606772423, -0.013944778591394424, 0.029210232198238373, 0.02851105108857155, -0.015524409711360931, -0.021609874442219734, 0.01190549973398447, 0.02421238273382187, -0.004797159228473902, -0.027345748618245125, 0.022516220808029175, 0.02611570805311203, -0.020250355824828148, -0.017647847533226013, -0.003842259058728814, 0.0244583897292614, -0.026452351361513138, -0.02788955718278885, 0.04182138666510582, -0.035632338374853134, 0.021791143342852592, -0.003974974155426025, -0.00591390673071146, 0.013219701126217842, 0.02396637387573719, -0.02359088696539402, -0.02682783640921116, 0.01953822746872902, 0.0043116165325045586, 0.03534748777747154, -0.024937458336353302, 0.010902046225965023, -0.016404859721660614, -0.00794994831085205, -0.00455762492492795, -0.01785501278936863, 0.0032968330197036266, 0.011206318624317646, 0.0022027441300451756, -0.00800821278244257, -0.013905934989452362, -0.028744110837578773, -0.016754450276494026, 0.005917143542319536, 0.010545981116592884, 0.011076840572059155, 0.009141145274043083, 0.012831267900764942, -0.010053965263068676, -0.0020360411144793034, -0.03019426390528679, 
0.028381573036313057, 0.028277991339564323, -0.019279271364212036, -0.03029784746468067, -0.01835997775197029, 0.011801918037235737, 0.044980648905038834, 0.002332222182303667, -0.029313813894987106, 0.003440877189859748, -0.012119138613343239, -0.013116119429469109, -0.012675894424319267, 0.021363865584135056, 0.006739328615367413, -0.013621083460748196, -0.037004806101322174, 0.002421238226816058, -0.004285721108317375, -0.008293064311146736, -0.00384873291477561, 0.0015067999484017491, 0.013362127356231213, -0.006483609788119793, 0.0032498971559107304, -0.007969369180500507, -0.0028663186822086573, 0.03262845054268837, -0.02739753946661949, 0.01547261793166399, -0.02480798028409481, 0.004334275145083666, -0.0052632796578109264, -0.0036027247551828623, 0.008480807766318321, 0.017958596348762512, 0.015278401784598827, -0.002523201983422041, -0.018748411908745766, 0.0011329322587698698, -0.01583515666425228, 0.010384134016931057, 0.007937000133097172, -0.009710848331451416, -0.008163586258888245, 0.010584824718534946, -0.005726163741201162, -0.020017296075820923, -0.018813150003552437, -0.013724666088819504, -0.02640056051313877, -0.0022836679127067327, -0.008966349996626377, 0.027268061414361, -0.022451480850577354, -0.010358238592743874, 0.010856728069484234, -0.012488150969147682, -0.012565838173031807, -0.03949078172445297, 0.012436360120773315, 0.013931830413639545, 0.00546073354780674, -0.015148923732340336, -0.010681932792067528, -0.1639709174633026, 0.023293089121580124, 0.015964634716510773, -0.006894702557474375, 0.026879629120230675, -0.02465260773897171, 0.03288740664720535, 0.002220547292381525, -0.022399690002202988, 0.0008723578648641706, -0.012598207220435143, -0.00705007603392005, -0.017414787784218788, -0.014902914874255657, -0.004399014171212912, 0.015019445680081844, -0.042805418372154236, 0.02006908692419529, 0.022399690002202988, -0.0007533999742008746, 0.006153441034257412, -0.016819190233945847, -0.022477377206087112, -0.019188636913895607, 
0.002359736245125532, 0.02215368114411831, -0.0029456240590661764, 0.006862333044409752, -0.009561948478221893, -0.002031185897067189, -0.01191844791173935, 0.00922530610114336, -0.002044133609160781, 0.011996135115623474, 0.01623653806746006, 0.0047777374275028706, -0.009918013587594032, 0.0023273667320609093, -0.007283136248588562, -0.004780974239110947, 0.02662067301571369, 0.017777325585484505, 0.018994418904185295, 0.005470444448292255, -0.007147184573113918, 0.02372036501765251, 0.03278382495045662, -0.007406140211969614, 0.023539096117019653, -0.03063448891043663, -0.006409159861505032, -0.024639658629894257, -0.0026397323235869408, -0.006101649720221758, 0.02044457197189331, 0.018593037500977516, -0.001836968818679452, 0.011814865283668041, -0.004415199160575867, 0.0019227479351684451, -0.03659047558903694, -0.007477353326976299, 0.020871849730610847, 0.00444109458476305, -0.015537356957793236, -0.01791975274682045, -0.001009118976071477, 0.0006902794702909887, -0.023383723571896553, 0.006247312296181917, -0.015874000266194344, 0.009199410676956177, 0.0015237939078360796, -0.027811869978904724, 0.000155980495037511, 0.013724666088819504, -0.02306002750992775, -0.004350460134446621, 0.002518346766009927, -0.0019713023211807013, -0.021428605541586876, 0.025377683341503143, 0.014825228601694107, -0.02443249523639679, 0.03835137560963631, 0.027216270565986633, -0.024691451340913773, -0.02137681469321251, -0.010850254446268082, -0.03723786771297455, 0.0017835590988397598, -0.025079883635044098, -0.02028919942677021, -0.0032223830930888653, 0.02436775527894497, 0.0033033068757504225, 0.025753170251846313, -0.007749257143586874, 0.010209338739514351, -0.028407467529177666, -0.013880039565265179, -0.009820904582738876, -0.01264999806880951, 0.001183914253488183, 0.03288740664720535, 0.0349072627723217, 0.01061072014272213, 0.01701340638101101, 0.006331473123282194, 0.007315505761653185, -0.02015972137451172, 0.03599487617611885, 0.025610744953155518, 
0.0059883566573262215, -0.005285938270390034, 0.02115670219063759, 0.01966770552098751, -0.04365997388958931, 0.009963330812752247, 0.014708698727190495, 0.0467415489256382, -0.0010212576016783714, 0.014035413041710854, 0.006862333044409752, -0.009037562645971775, 0.0030281662475317717, -0.08436784893274307, 0.001717201666906476, 0.0035088532604277134, 0.011769548058509827, 0.0007809140370227396, 0.027449332177639008, -0.020366886630654335, 0.03690122440457344, -0.01663791947066784, 0.006648694165050983, -0.003926419652998447, -0.04640490561723709, -0.032240018248558044, -0.020056139677762985, 0.02206304669380188, 0.005065825767815113, -0.008377225138247013, -0.009626687504351139, -0.03413039445877075, 0.005175882019102573, -0.0216616652905941, -0.008344856090843678, -0.0001375703577650711, -0.01191844791173935, 0.0022367320489138365, 0.003696596249938011, -0.02015972137451172, 0.006205231882631779, 0.0016508442349731922, 0.014126047492027283, -0.006486846599727869, -0.020677633583545685, 0.023098871111869812, -0.018618933856487274, -0.0019065631786361337, -0.00967847928404808, 0.006438292562961578, -0.005250331945717335, 0.024549024179577827, -0.03260255604982376, -0.003118800697848201, -0.0031527888495475054, 0.0032968330197036266, -0.04946058616042137, 0.0014040268724784255, -0.007011232431977987, -0.014436794444918633, 0.00016700636479072273, 0.03371606394648552, -0.01244930736720562, -0.014164891093969345, -0.008098847232758999, -0.009464840404689312, -0.009503684006631374, 0.013400970958173275, -0.015524409711360931, 0.025442423298954964, -0.030090682208538055, -0.022412637248635292, 0.024924511089920998, 0.021247336640954018, -0.015938738361001015, -0.012585259042680264, 0.021713456138968468, 0.0062699709087610245, -0.01299311500042677, 0.004165953956544399, -0.027268061414361, 0.019654756411910057, -0.0031592627055943012, -0.008901610970497131, 0.0072378190234303474, -0.03374196216464043, -0.005175882019102573, -0.03016836941242218, 0.0022399690933525562, 
-0.034233976155519485, -0.00769746582955122, 0.02502809278666973, -0.02303413301706314, -0.015692731365561485, -0.008933980949223042, 0.005201777908951044, -0.02788955718278885, 0.021635770797729492, 0.04254646226763725, 0.022024204954504967, 0.014022464863955975, -0.009205884300172329, -0.0282003041356802, -0.0005603968747891486, 0.012293933890759945, -0.0023856316693127155, -0.01149764470756054, 0.0048133437521755695, 0.00857144221663475, 0.0009629924898035824, 0.007341401185840368, 0.005124091170728207, 0.006952967494726181, -0.03001299500465393, 0.004399014171212912, -0.07949947565793991, 0.007334927562624216, -0.023862792178988457, -0.01041002944111824, 0.02119554579257965, 0.007341401185840368, 0.008383698761463165, -0.021648718044161797, 0.006072517018765211, 0.007509722840040922, -0.01148469652980566, 0.02131207473576069, 0.010274077765643597, -1.5641040590708144e-05, -0.011840760707855225, -0.0025895596481859684, 0.02059994637966156, -0.008487281389534473, 0.011950816959142685, 0.025571901351213455, -0.012086769565939903, 0.003906997852027416, -0.006137256044894457, -0.014372055418789387, -0.007982317358255386, -0.020988380536437035, 0.0025102542713284492, 0.018968524411320686, -0.011976713314652443, -0.0035023794043809175, 0.0033696643076837063, -0.02203715220093727, 0.02529999613761902, 0.017971543595194817, 0.004227456171065569, -0.025442423298954964, -0.008577915839850903, -0.01233925111591816, 0.03003889136016369, 0.010028069838881493, -0.02474324218928814, -0.01463101152330637, 0.01561504416167736, -0.022801071405410767, -0.022075995802879333, 0.009244727902114391, -0.021700508892536163, 0.004246877506375313, 0.01636601611971855, 0.008946928195655346, 0.021829986944794655, 0.014915863052010536, -0.021804092451930046, -0.016262434422969818, 0.003347005695104599, -0.02022445946931839, 0.01798449084162712, -0.0009095827699638903, -0.0011062275152653456, -0.006642220076173544, 0.0182304996997118, -0.0008051911718212068, -0.01683213748037815, 
-0.009134671650826931, -0.005752059165388346, 0.01061072014272213, -0.014566272497177124, 0.022114839404821396, -0.0032223830930888653, -0.01539493165910244, -0.021739352494478226, -0.005347440484911203, 0.0029342947527766228, 0.02084595523774624, 0.0006077372818253934, -0.00716013228520751, 0.022710436955094337, 0.013142014853656292, 0.00942599680274725, 0.005234147422015667, 0.033457107841968536, 0.004172428045421839, -0.02529999613761902, 0.026698358356952667, 0.03508853167295456, 0.03765219449996948, -0.014889967627823353, 0.025908542796969414, -2.9916493076598272e-05, -0.007723361253738403, -0.006590429227799177, 0.01960296556353569, 0.008629707619547844, 0.014877019450068474, -0.011860182508826256, -0.005651713814586401, -0.01621064357459545, -0.019188636913895607, 0.0077427830547094345, 0.02954687550663948, -0.010118704289197922, 0.006965915206819773, -0.002694760449230671, -0.01807512529194355, -0.02509283274412155, 0.028821798041462898, -0.024976301938295364, -0.022632749751210213, -0.015187766402959824, 0.008823923766613007, 0.02724216692149639, 0.010584824718534946, -0.022736333310604095, 0.006842911243438721, -0.03493315726518631, -0.013491605408489704, -0.013388022780418396, -0.03446703776717186, -0.0019486435921862721, -0.0015772036276757717, 0.008901610970497131, 0.023979321122169495, 0.038196004927158356, -0.01248167734593153, 0.007736308965831995, 0.00325313420034945, 0.023396670818328857, -0.018178708851337433, -0.0001203740612254478, -0.015511461533606052, 0.023111818358302116, -0.012222721241414547, -0.01115452777594328, -0.009167040698230267, -0.01385414320975542, -0.0031738290563225746, -0.0038357852026820183, 0.02159692719578743, -0.01966770552098751, 0.03905055671930313, -0.004787448327988386, -0.0009314321796409786, 0.0033599536400288343, -0.026776045560836792, -0.01017696876078844, -0.013841195963323116, 0.0006340374820865691, -0.030686281621456146, -0.021247336640954018, 0.02724216692149639, 0.015744522213935852, 0.027811869978904724, 
-0.012837741523981094, -0.021713456138968468, 0.0017398602794855833, 0.0021202019415795803, -0.0071536581963300705, 0.010902046225965023, -0.012099716812372208, 0.011219266802072525, 0.015187766402959824, 0.014605116099119186, -0.0069076502695679665, 0.014190786518156528, -0.0002251702971989289, 0.025261154398322105, -0.002346788300201297, -0.01991371251642704, -0.05026335269212723, 0.004470227286219597, -0.019680652767419815, -0.023539096117019653, -0.009807956404983997, 0.020483415573835373, -0.009069932624697685, 0.013737613335251808, 0.0006384882726706564, 0.011465274728834629, 0.0271126888692379, -0.03508853167295456, 0.02817440778017044, -0.028096720576286316, -0.009943909011781216, 0.03091934137046337, 0.005344203673303127, -0.005862115416675806, -0.013362127356231213, -0.02596033550798893], metadata={'director': 'Francis Ford Coppola', 'theme': 'Mafia', 'year': 1972, 'ref_doc_id': 'None', '_node_content': '{\"id_\": \"736a1279-4ebd-496e-87b5-925197646477\", \"embedding\": null, \"metadata\": {\"director\": \"Francis Ford Coppola\", \"theme\": \"Mafia\", \"year\": 1972, \"ref_doc_id\": \"doc_1\"}, \"excluded_embed_metadata_keys\": [], \"excluded_llm_metadata_keys\": [], \"relationships\": {}, \"text\": \"\", \"start_char_idx\": null, \"end_char_idx\": null, \"text_template\": \"{metadata_str}\\\\n\\\\n{content}\", \"metadata_template\": \"{key}: {value}\", \"metadata_seperator\": \"\\\\n\", \"class_name\": \"TextNode\"}', '_node_type': 'TextNode', 'document_id': 'None', 'doc_id': 'None'}, excluded_embed_metadata_keys=[], excluded_llm_metadata_keys=[], relationships={}, text='The Godfather', start_char_idx=None, end_char_idx=None, text_template='{metadata_str}\\n\\n{content}', metadata_template='{key}: {value}', metadata_seperator='\\n'), score=0.7543986421543848)]" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "retriever = index.as_retriever(filters=filters)\n", + "retriever.retrieve(\"What 
is inception about?\")" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "llama-index-dev", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/docs/examples/vector_stores/MongoDBAtlasVectorSearchRAGFireworks.ipynb b/docs/examples/vector_stores/MongoDBAtlasVectorSearchRAGFireworks.ipynb index f1c0db04e7472..50f96101eeba3 100644 --- a/docs/examples/vector_stores/MongoDBAtlasVectorSearchRAGFireworks.ipynb +++ b/docs/examples/vector_stores/MongoDBAtlasVectorSearchRAGFireworks.ipynb @@ -4,347 +4,7 @@ "cell_type": "code", "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Requirement already satisfied: llama-index in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (0.10.12)\n", - "Requirement already satisfied: llama-index-agent-openai<0.2.0,>=0.1.4 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index) (0.1.5)\n", - "Requirement already satisfied: llama-index-cli<0.2.0,>=0.1.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index) (0.1.5)\n", - "Requirement already satisfied: llama-index-core<0.11.0,>=0.10.12 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index) (0.10.12)\n", - "Requirement already satisfied: llama-index-embeddings-openai<0.2.0,>=0.1.5 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index) (0.1.6)\n", - "Requirement already satisfied: llama-index-indices-managed-llama-cloud<0.2.0,>=0.1.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index) (0.1.3)\n", - "Requirement already satisfied: llama-index-legacy<0.10.0,>=0.9.48 
in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index) (0.9.48)\n", - "Requirement already satisfied: llama-index-llms-openai<0.2.0,>=0.1.5 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index) (0.1.6)\n", - "Requirement already satisfied: llama-index-multi-modal-llms-openai<0.2.0,>=0.1.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index) (0.1.4)\n", - "Requirement already satisfied: llama-index-program-openai<0.2.0,>=0.1.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index) (0.1.4)\n", - "Requirement already satisfied: llama-index-question-gen-openai<0.2.0,>=0.1.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index) (0.1.3)\n", - "Requirement already satisfied: llama-index-readers-file<0.2.0,>=0.1.4 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index) (0.1.5)\n", - "Requirement already satisfied: llama-index-readers-llama-parse<0.2.0,>=0.1.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index) (0.1.3)\n", - "Requirement already satisfied: llama-index-vector-stores-chroma<0.2.0,>=0.1.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.1.3)\n", - "Requirement already satisfied: PyYAML>=6.0.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (6.0.1)\n", - "Requirement already satisfied: SQLAlchemy>=1.4.49 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from SQLAlchemy[asyncio]>=1.4.49->llama-index-core<0.11.0,>=0.10.12->llama-index) (2.0.27)\n", - "Requirement already satisfied: aiohttp<4.0.0,>=3.8.6 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (3.9.3)\n", - "Requirement already satisfied: dataclasses-json in 
/mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (0.6.4)\n", - "Requirement already satisfied: deprecated>=1.2.9.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (1.2.14)\n", - "Requirement already satisfied: dirtyjson<2.0.0,>=1.0.8 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (1.0.8)\n", - "Requirement already satisfied: fsspec>=2023.5.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (2023.10.0)\n", - "Requirement already satisfied: httpx in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (0.27.0)\n", - "Requirement already satisfied: llamaindex-py-client<0.2.0,>=0.1.13 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (0.1.13)\n", - "Requirement already satisfied: nest-asyncio<2.0.0,>=1.5.8 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (1.6.0)\n", - "Requirement already satisfied: networkx>=3.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (3.1)\n", - "Requirement already satisfied: nltk<4.0.0,>=3.8.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (3.8.1)\n", - "Requirement already satisfied: numpy in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (1.24.4)\n", - "Requirement already satisfied: openai>=1.1.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (1.12.0)\n", - "Requirement 
already satisfied: pandas in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (2.0.3)\n", - "Requirement already satisfied: pillow>=9.0.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (10.2.0)\n", - "Requirement already satisfied: requests>=2.31.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (2.31.0)\n", - "Requirement already satisfied: tenacity<9.0.0,>=8.2.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (8.2.3)\n", - "Requirement already satisfied: tiktoken>=0.3.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (0.6.0)\n", - "Requirement already satisfied: tqdm<5.0.0,>=4.66.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (4.66.2)\n", - "Requirement already satisfied: typing-extensions>=4.5.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (4.9.0)\n", - "Requirement already satisfied: typing-inspect>=0.8.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.12->llama-index) (0.9.0)\n", - "Requirement already satisfied: beautifulsoup4<5.0.0,>=4.12.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-readers-file<0.2.0,>=0.1.4->llama-index) (4.12.3)\n", - "Requirement already satisfied: bs4<0.0.3,>=0.0.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-readers-file<0.2.0,>=0.1.4->llama-index) (0.0.2)\n", - "Requirement already satisfied: pymupdf<2.0.0,>=1.23.21 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from 
llama-index-readers-file<0.2.0,>=0.1.4->llama-index) (1.23.25)\n", - "Requirement already satisfied: pypdf<5.0.0,>=4.0.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-readers-file<0.2.0,>=0.1.4->llama-index) (4.0.2)\n", - "Requirement already satisfied: llama-parse<0.4.0,>=0.3.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-readers-llama-parse<0.2.0,>=0.1.2->llama-index) (0.3.4)\n", - "Requirement already satisfied: aiosignal>=1.1.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.12->llama-index) (1.3.1)\n", - "Requirement already satisfied: attrs>=17.3.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.12->llama-index) (23.2.0)\n", - "Requirement already satisfied: frozenlist>=1.1.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.12->llama-index) (1.4.1)\n", - "Requirement already satisfied: multidict<7.0,>=4.5 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.12->llama-index) (6.0.5)\n", - "Requirement already satisfied: yarl<2.0,>=1.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.12->llama-index) (1.9.4)\n", - "Requirement already satisfied: async-timeout<5.0,>=4.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.12->llama-index) (4.0.3)\n", - "Requirement already satisfied: soupsieve>1.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from beautifulsoup4<5.0.0,>=4.12.3->llama-index-readers-file<0.2.0,>=0.1.4->llama-index) (2.5)\n", - "Requirement already satisfied: wrapt<2,>=1.10 in 
/mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from deprecated>=1.2.9.3->llama-index-core<0.11.0,>=0.10.12->llama-index) (1.16.0)\n", - "Requirement already satisfied: chromadb<0.5.0,>=0.4.22 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.4.23)\n", - "Requirement already satisfied: onnxruntime<2.0.0,>=1.17.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (1.17.0)\n", - "Requirement already satisfied: tokenizers<0.16.0,>=0.15.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.15.2)\n", - "Requirement already satisfied: pydantic>=1.10 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llamaindex-py-client<0.2.0,>=0.1.13->llama-index-core<0.11.0,>=0.10.12->llama-index) (1.10.11)\n", - "Requirement already satisfied: anyio in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.12->llama-index) (4.3.0)\n", - "Requirement already satisfied: certifi in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.12->llama-index) (2024.2.2)\n", - "Requirement already satisfied: httpcore==1.* in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.12->llama-index) (1.0.4)\n", - "Requirement already satisfied: idna in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.12->llama-index) (3.6)\n", - "Requirement already satisfied: sniffio in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.12->llama-index) (1.3.0)\n", - 
"Requirement already satisfied: h11<0.15,>=0.13 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpcore==1.*->httpx->llama-index-core<0.11.0,>=0.10.12->llama-index) (0.14.0)\n", - "Requirement already satisfied: click in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from nltk<4.0.0,>=3.8.1->llama-index-core<0.11.0,>=0.10.12->llama-index) (8.1.7)\n", - "Requirement already satisfied: joblib in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from nltk<4.0.0,>=3.8.1->llama-index-core<0.11.0,>=0.10.12->llama-index) (1.3.2)\n", - "Requirement already satisfied: regex>=2021.8.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from nltk<4.0.0,>=3.8.1->llama-index-core<0.11.0,>=0.10.12->llama-index) (2023.12.25)\n", - "Requirement already satisfied: distro<2,>=1.7.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from openai>=1.1.0->llama-index-core<0.11.0,>=0.10.12->llama-index) (1.9.0)\n", - "Requirement already satisfied: PyMuPDFb==1.23.22 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pymupdf<2.0.0,>=1.23.21->llama-index-readers-file<0.2.0,>=0.1.4->llama-index) (1.23.22)\n", - "Requirement already satisfied: charset-normalizer<4,>=2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from requests>=2.31.0->llama-index-core<0.11.0,>=0.10.12->llama-index) (3.3.2)\n", - "Requirement already satisfied: urllib3<3,>=1.21.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from requests>=2.31.0->llama-index-core<0.11.0,>=0.10.12->llama-index) (2.2.1)\n", - "Requirement already satisfied: greenlet!=0.4.17 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from SQLAlchemy>=1.4.49->SQLAlchemy[asyncio]>=1.4.49->llama-index-core<0.11.0,>=0.10.12->llama-index) (3.0.3)\n", - "Requirement already satisfied: mypy-extensions>=0.3.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from 
typing-inspect>=0.8.0->llama-index-core<0.11.0,>=0.10.12->llama-index) (1.0.0)\n", - "Requirement already satisfied: marshmallow<4.0.0,>=3.18.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from dataclasses-json->llama-index-core<0.11.0,>=0.10.12->llama-index) (3.20.2)\n", - "Requirement already satisfied: python-dateutil>=2.8.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pandas->llama-index-core<0.11.0,>=0.10.12->llama-index) (2.8.2)\n", - "Requirement already satisfied: pytz>=2020.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pandas->llama-index-core<0.11.0,>=0.10.12->llama-index) (2024.1)\n", - "Requirement already satisfied: tzdata>=2022.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pandas->llama-index-core<0.11.0,>=0.10.12->llama-index) (2024.1)\n", - "Requirement already satisfied: exceptiongroup>=1.0.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from anyio->httpx->llama-index-core<0.11.0,>=0.10.12->llama-index) (1.2.0)\n", - "Requirement already satisfied: build>=1.0.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (1.0.3)\n", - "Requirement already satisfied: chroma-hnswlib==0.7.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.7.3)\n", - "Requirement already satisfied: fastapi>=0.95.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.109.2)\n", - "Requirement already satisfied: uvicorn>=0.18.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from 
uvicorn[standard]>=0.18.3->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.27.1)\n", - "Requirement already satisfied: posthog>=2.4.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (3.4.2)\n", - "Requirement already satisfied: pulsar-client>=3.1.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (3.4.0)\n", - "Requirement already satisfied: opentelemetry-api>=1.2.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (1.22.0)\n", - "Requirement already satisfied: opentelemetry-exporter-otlp-proto-grpc>=1.2.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (1.22.0)\n", - "Requirement already satisfied: opentelemetry-instrumentation-fastapi>=0.41b0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.43b0)\n", - "Requirement already satisfied: opentelemetry-sdk>=1.2.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (1.22.0)\n", - "Requirement already satisfied: pypika>=0.48.9 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.48.9)\n", 
- "Requirement already satisfied: overrides>=7.3.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (7.7.0)\n", - "Requirement already satisfied: importlib-resources in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (6.1.1)\n", - "Requirement already satisfied: grpcio>=1.58.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (1.62.0)\n", - "Requirement already satisfied: bcrypt>=4.0.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (4.1.2)\n", - "Requirement already satisfied: typer>=0.9.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.9.0)\n", - "Requirement already satisfied: kubernetes>=28.1.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (29.0.0)\n", - "Requirement already satisfied: mmh3>=4.0.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (4.1.0)\n", - "Requirement already satisfied: orjson>=3.9.12 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) 
(3.9.14)\n", - "Requirement already satisfied: packaging>=17.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from marshmallow<4.0.0,>=3.18.0->dataclasses-json->llama-index-core<0.11.0,>=0.10.12->llama-index) (23.2)\n", - "Requirement already satisfied: coloredlogs in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from onnxruntime<2.0.0,>=1.17.0->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (15.0.1)\n", - "Requirement already satisfied: flatbuffers in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from onnxruntime<2.0.0,>=1.17.0->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (23.5.26)\n", - "Requirement already satisfied: protobuf in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from onnxruntime<2.0.0,>=1.17.0->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (4.25.3)\n", - "Requirement already satisfied: sympy in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from onnxruntime<2.0.0,>=1.17.0->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (1.12)\n", - "Requirement already satisfied: six>=1.5 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from python-dateutil>=2.8.2->pandas->llama-index-core<0.11.0,>=0.10.12->llama-index) (1.16.0)\n", - "Requirement already satisfied: huggingface_hub<1.0,>=0.16.4 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from tokenizers<0.16.0,>=0.15.1->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.20.3)\n", - "Requirement already satisfied: pyproject_hooks in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from build>=1.0.3->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (1.0.0)\n", - "Requirement already 
satisfied: tomli>=1.1.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from build>=1.0.3->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (2.0.1)\n", - "Requirement already satisfied: starlette<0.37.0,>=0.36.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from fastapi>=0.95.2->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.36.3)\n", - "Requirement already satisfied: filelock in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from huggingface_hub<1.0,>=0.16.4->tokenizers<0.16.0,>=0.15.1->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (3.13.1)\n", - "Requirement already satisfied: google-auth>=1.0.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from kubernetes>=28.1.0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (2.28.1)\n", - "Requirement already satisfied: websocket-client!=0.40.0,!=0.41.*,!=0.42.*,>=0.32.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from kubernetes>=28.1.0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (1.7.0)\n", - "Requirement already satisfied: requests-oauthlib in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from kubernetes>=28.1.0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (1.3.1)\n", - "Requirement already satisfied: oauthlib>=3.2.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from kubernetes>=28.1.0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (3.2.2)\n", - "Requirement already satisfied: importlib-metadata<7.0,>=6.0 in 
/mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from opentelemetry-api>=1.2.0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (6.11.0)\n", - "Requirement already satisfied: backoff<3.0.0,>=1.10.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from opentelemetry-exporter-otlp-proto-grpc>=1.2.0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (2.2.1)\n", - "Requirement already satisfied: googleapis-common-protos~=1.52 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from opentelemetry-exporter-otlp-proto-grpc>=1.2.0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (1.62.0)\n", - "Requirement already satisfied: opentelemetry-exporter-otlp-proto-common==1.22.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from opentelemetry-exporter-otlp-proto-grpc>=1.2.0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (1.22.0)\n", - "Requirement already satisfied: opentelemetry-proto==1.22.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from opentelemetry-exporter-otlp-proto-grpc>=1.2.0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (1.22.0)\n", - "Requirement already satisfied: opentelemetry-instrumentation-asgi==0.43b0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from opentelemetry-instrumentation-fastapi>=0.41b0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.43b0)\n", - "Requirement already satisfied: opentelemetry-instrumentation==0.43b0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from 
opentelemetry-instrumentation-fastapi>=0.41b0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.43b0)\n", - "Requirement already satisfied: opentelemetry-semantic-conventions==0.43b0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from opentelemetry-instrumentation-fastapi>=0.41b0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.43b0)\n", - "Requirement already satisfied: opentelemetry-util-http==0.43b0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from opentelemetry-instrumentation-fastapi>=0.41b0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.43b0)\n", - "Requirement already satisfied: setuptools>=16.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from opentelemetry-instrumentation==0.43b0->opentelemetry-instrumentation-fastapi>=0.41b0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (69.1.0)\n", - "Requirement already satisfied: asgiref~=3.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from opentelemetry-instrumentation-asgi==0.43b0->opentelemetry-instrumentation-fastapi>=0.41b0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (3.7.2)\n", - "Requirement already satisfied: monotonic>=1.5 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from posthog>=2.4.0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (1.6)\n", - "Requirement already satisfied: httptools>=0.5.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from 
uvicorn[standard]>=0.18.3->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.6.1)\n", - "Requirement already satisfied: python-dotenv>=0.13 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from uvicorn[standard]>=0.18.3->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (1.0.1)\n", - "Requirement already satisfied: uvloop!=0.15.0,!=0.15.1,>=0.14.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from uvicorn[standard]>=0.18.3->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.19.0)\n", - "Requirement already satisfied: watchfiles>=0.13 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from uvicorn[standard]>=0.18.3->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.21.0)\n", - "Requirement already satisfied: websockets>=10.4 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from uvicorn[standard]>=0.18.3->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (12.0)\n", - "Requirement already satisfied: humanfriendly>=9.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from coloredlogs->onnxruntime<2.0.0,>=1.17.0->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (10.0)\n", - "Requirement already satisfied: mpmath>=0.19 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from sympy->onnxruntime<2.0.0,>=1.17.0->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (1.3.0)\n", - "Requirement already satisfied: cachetools<6.0,>=2.0.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from 
google-auth>=1.0.1->kubernetes>=28.1.0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (5.3.2)\n", - "Requirement already satisfied: pyasn1-modules>=0.2.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from google-auth>=1.0.1->kubernetes>=28.1.0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.3.0)\n", - "Requirement already satisfied: rsa<5,>=3.1.4 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from google-auth>=1.0.1->kubernetes>=28.1.0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (4.9)\n", - "Requirement already satisfied: zipp>=0.5 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from importlib-metadata<7.0,>=6.0->opentelemetry-api>=1.2.0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (3.17.0)\n", - "Requirement already satisfied: pyasn1<0.6.0,>=0.4.6 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pyasn1-modules>=0.2.1->google-auth>=1.0.1->kubernetes>=28.1.0->chromadb<0.5.0,>=0.4.22->llama-index-vector-stores-chroma<0.2.0,>=0.1.1->llama-index-cli<0.2.0,>=0.1.2->llama-index) (0.5.1)\n", - "Requirement already satisfied: llama-index-vector-stores-mongodb in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (0.1.4)\n", - "Requirement already satisfied: llama-index-core<0.11.0,>=0.10.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-vector-stores-mongodb) (0.10.12)\n", - "Requirement already satisfied: pymongo<5.0.0,>=4.6.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-vector-stores-mongodb) (4.6.2)\n", - "Requirement already satisfied: PyYAML>=6.0.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages 
(from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (6.0.1)\n", - "Requirement already satisfied: SQLAlchemy>=1.4.49 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from SQLAlchemy[asyncio]>=1.4.49->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (2.0.27)\n", - "Requirement already satisfied: aiohttp<4.0.0,>=3.8.6 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (3.9.3)\n", - "Requirement already satisfied: dataclasses-json in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (0.6.4)\n", - "Requirement already satisfied: deprecated>=1.2.9.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (1.2.14)\n", - "Requirement already satisfied: dirtyjson<2.0.0,>=1.0.8 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (1.0.8)\n", - "Requirement already satisfied: fsspec>=2023.5.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (2023.10.0)\n", - "Requirement already satisfied: httpx in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (0.27.0)\n", - "Requirement already satisfied: llamaindex-py-client<0.2.0,>=0.1.13 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (0.1.13)\n", - "Requirement already satisfied: nest-asyncio<2.0.0,>=1.5.8 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (1.6.0)\n", - 
"Requirement already satisfied: networkx>=3.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (3.1)\n", - "Requirement already satisfied: nltk<4.0.0,>=3.8.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (3.8.1)\n", - "Requirement already satisfied: numpy in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (1.24.4)\n", - "Requirement already satisfied: openai>=1.1.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (1.12.0)\n", - "Requirement already satisfied: pandas in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (2.0.3)\n", - "Requirement already satisfied: pillow>=9.0.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (10.2.0)\n", - "Requirement already satisfied: requests>=2.31.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (2.31.0)\n", - "Requirement already satisfied: tenacity<9.0.0,>=8.2.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (8.2.3)\n", - "Requirement already satisfied: tiktoken>=0.3.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (0.6.0)\n", - "Requirement already satisfied: tqdm<5.0.0,>=4.66.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from 
llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (4.66.2)\n", - "Requirement already satisfied: typing-extensions>=4.5.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (4.9.0)\n", - "Requirement already satisfied: typing-inspect>=0.8.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (0.9.0)\n", - "Requirement already satisfied: dnspython<3.0.0,>=1.16.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pymongo<5.0.0,>=4.6.1->llama-index-vector-stores-mongodb) (2.6.1)\n", - "Requirement already satisfied: aiosignal>=1.1.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (1.3.1)\n", - "Requirement already satisfied: attrs>=17.3.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (23.2.0)\n", - "Requirement already satisfied: frozenlist>=1.1.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (1.4.1)\n", - "Requirement already satisfied: multidict<7.0,>=4.5 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (6.0.5)\n", - "Requirement already satisfied: yarl<2.0,>=1.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (1.9.4)\n", - "Requirement already satisfied: async-timeout<5.0,>=4.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from 
aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (4.0.3)\n", - "Requirement already satisfied: wrapt<2,>=1.10 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from deprecated>=1.2.9.3->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (1.16.0)\n", - "Requirement already satisfied: pydantic>=1.10 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llamaindex-py-client<0.2.0,>=0.1.13->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (1.10.11)\n", - "Requirement already satisfied: anyio in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (4.3.0)\n", - "Requirement already satisfied: certifi in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (2024.2.2)\n", - "Requirement already satisfied: httpcore==1.* in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (1.0.4)\n", - "Requirement already satisfied: idna in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (3.6)\n", - "Requirement already satisfied: sniffio in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (1.3.0)\n", - "Requirement already satisfied: h11<0.15,>=0.13 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpcore==1.*->httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (0.14.0)\n", - "Requirement already satisfied: click in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from 
nltk<4.0.0,>=3.8.1->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (8.1.7)\n", - "Requirement already satisfied: joblib in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from nltk<4.0.0,>=3.8.1->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (1.3.2)\n", - "Requirement already satisfied: regex>=2021.8.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from nltk<4.0.0,>=3.8.1->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (2023.12.25)\n", - "Requirement already satisfied: distro<2,>=1.7.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from openai>=1.1.0->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (1.9.0)\n", - "Requirement already satisfied: charset-normalizer<4,>=2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from requests>=2.31.0->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (3.3.2)\n", - "Requirement already satisfied: urllib3<3,>=1.21.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from requests>=2.31.0->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (2.2.1)\n", - "Requirement already satisfied: greenlet!=0.4.17 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from SQLAlchemy>=1.4.49->SQLAlchemy[asyncio]>=1.4.49->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (3.0.3)\n", - "Requirement already satisfied: mypy-extensions>=0.3.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from typing-inspect>=0.8.0->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (1.0.0)\n", - "Requirement already satisfied: marshmallow<4.0.0,>=3.18.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from dataclasses-json->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (3.20.2)\n", - "Requirement already satisfied: python-dateutil>=2.8.2 in 
/mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pandas->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (2.8.2)\n", - "Requirement already satisfied: pytz>=2020.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pandas->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (2024.1)\n", - "Requirement already satisfied: tzdata>=2022.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pandas->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (2024.1)\n", - "Requirement already satisfied: exceptiongroup>=1.0.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from anyio->httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (1.2.0)\n", - "Requirement already satisfied: packaging>=17.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from marshmallow<4.0.0,>=3.18.0->dataclasses-json->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (23.2)\n", - "Requirement already satisfied: six>=1.5 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from python-dateutil>=2.8.2->pandas->llama-index-core<0.11.0,>=0.10.1->llama-index-vector-stores-mongodb) (1.16.0)\n", - "Requirement already satisfied: llama-index-embeddings-fireworks==0.1.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (0.1.2)\n", - "Requirement already satisfied: llama-index-core<0.11.0,>=0.10.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-embeddings-fireworks==0.1.2) (0.10.12)\n", - "Requirement already satisfied: llama-index-llms-openai<0.2.0,>=0.1.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-embeddings-fireworks==0.1.2) (0.1.6)\n", - "Requirement already satisfied: PyYAML>=6.0.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from 
llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (6.0.1)\n", - "Requirement already satisfied: SQLAlchemy>=1.4.49 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from SQLAlchemy[asyncio]>=1.4.49->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (2.0.27)\n", - "Requirement already satisfied: aiohttp<4.0.0,>=3.8.6 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (3.9.3)\n", - "Requirement already satisfied: dataclasses-json in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (0.6.4)\n", - "Requirement already satisfied: deprecated>=1.2.9.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (1.2.14)\n", - "Requirement already satisfied: dirtyjson<2.0.0,>=1.0.8 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (1.0.8)\n", - "Requirement already satisfied: fsspec>=2023.5.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (2023.10.0)\n", - "Requirement already satisfied: httpx in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (0.27.0)\n", - "Requirement already satisfied: llamaindex-py-client<0.2.0,>=0.1.13 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (0.1.13)\n", - "Requirement already satisfied: nest-asyncio<2.0.0,>=1.5.8 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from 
llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (1.6.0)\n", - "Requirement already satisfied: networkx>=3.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (3.1)\n", - "Requirement already satisfied: nltk<4.0.0,>=3.8.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (3.8.1)\n", - "Requirement already satisfied: numpy in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (1.24.4)\n", - "Requirement already satisfied: openai>=1.1.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (1.12.0)\n", - "Requirement already satisfied: pandas in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (2.0.3)\n", - "Requirement already satisfied: pillow>=9.0.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (10.2.0)\n", - "Requirement already satisfied: requests>=2.31.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (2.31.0)\n", - "Requirement already satisfied: tenacity<9.0.0,>=8.2.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (8.2.3)\n", - "Requirement already satisfied: tiktoken>=0.3.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (0.6.0)\n", - "Requirement already satisfied: 
tqdm<5.0.0,>=4.66.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (4.66.2)\n", - "Requirement already satisfied: typing-extensions>=4.5.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (4.9.0)\n", - "Requirement already satisfied: typing-inspect>=0.8.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (0.9.0)\n", - "Requirement already satisfied: aiosignal>=1.1.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (1.3.1)\n", - "Requirement already satisfied: attrs>=17.3.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (23.2.0)\n", - "Requirement already satisfied: frozenlist>=1.1.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (1.4.1)\n", - "Requirement already satisfied: multidict<7.0,>=4.5 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (6.0.5)\n", - "Requirement already satisfied: yarl<2.0,>=1.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (1.9.4)\n", - "Requirement already satisfied: async-timeout<5.0,>=4.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from 
aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (4.0.3)\n", - "Requirement already satisfied: wrapt<2,>=1.10 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from deprecated>=1.2.9.3->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (1.16.0)\n", - "Requirement already satisfied: pydantic>=1.10 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llamaindex-py-client<0.2.0,>=0.1.13->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (1.10.11)\n", - "Requirement already satisfied: anyio in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (4.3.0)\n", - "Requirement already satisfied: certifi in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (2024.2.2)\n", - "Requirement already satisfied: httpcore==1.* in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (1.0.4)\n", - "Requirement already satisfied: idna in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (3.6)\n", - "Requirement already satisfied: sniffio in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (1.3.0)\n", - "Requirement already satisfied: h11<0.15,>=0.13 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpcore==1.*->httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (0.14.0)\n", - "Requirement already satisfied: click in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from 
nltk<4.0.0,>=3.8.1->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (8.1.7)\n", - "Requirement already satisfied: joblib in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from nltk<4.0.0,>=3.8.1->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (1.3.2)\n", - "Requirement already satisfied: regex>=2021.8.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from nltk<4.0.0,>=3.8.1->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (2023.12.25)\n", - "Requirement already satisfied: distro<2,>=1.7.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from openai>=1.1.0->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (1.9.0)\n", - "Requirement already satisfied: charset-normalizer<4,>=2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from requests>=2.31.0->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (3.3.2)\n", - "Requirement already satisfied: urllib3<3,>=1.21.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from requests>=2.31.0->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (2.2.1)\n", - "Requirement already satisfied: greenlet!=0.4.17 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from SQLAlchemy>=1.4.49->SQLAlchemy[asyncio]>=1.4.49->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (3.0.3)\n", - "Requirement already satisfied: mypy-extensions>=0.3.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from typing-inspect>=0.8.0->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (1.0.0)\n", - "Requirement already satisfied: marshmallow<4.0.0,>=3.18.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from dataclasses-json->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (3.20.2)\n", - 
"Requirement already satisfied: python-dateutil>=2.8.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pandas->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (2.8.2)\n", - "Requirement already satisfied: pytz>=2020.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pandas->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (2024.1)\n", - "Requirement already satisfied: tzdata>=2022.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pandas->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (2024.1)\n", - "Requirement already satisfied: exceptiongroup>=1.0.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from anyio->httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (1.2.0)\n", - "Requirement already satisfied: packaging>=17.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from marshmallow<4.0.0,>=3.18.0->dataclasses-json->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (23.2)\n", - "Requirement already satisfied: six>=1.5 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from python-dateutil>=2.8.2->pandas->llama-index-core<0.11.0,>=0.10.1->llama-index-embeddings-fireworks==0.1.2) (1.16.0)\n", - "Requirement already satisfied: llama-index-llms-fireworks in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (0.1.1)\n", - "Requirement already satisfied: llama-index-core<0.11.0,>=0.10.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-llms-fireworks) (0.10.12)\n", - "Requirement already satisfied: llama-index-llms-openai<0.2.0,>=0.1.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-llms-fireworks) (0.1.6)\n", - "Requirement already satisfied: PyYAML>=6.0.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from 
llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (6.0.1)\n", - "Requirement already satisfied: SQLAlchemy>=1.4.49 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from SQLAlchemy[asyncio]>=1.4.49->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (2.0.27)\n", - "Requirement already satisfied: aiohttp<4.0.0,>=3.8.6 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (3.9.3)\n", - "Requirement already satisfied: dataclasses-json in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (0.6.4)\n", - "Requirement already satisfied: deprecated>=1.2.9.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (1.2.14)\n", - "Requirement already satisfied: dirtyjson<2.0.0,>=1.0.8 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (1.0.8)\n", - "Requirement already satisfied: fsspec>=2023.5.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (2023.10.0)\n", - "Requirement already satisfied: httpx in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (0.27.0)\n", - "Requirement already satisfied: llamaindex-py-client<0.2.0,>=0.1.13 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (0.1.13)\n", - "Requirement already satisfied: nest-asyncio<2.0.0,>=1.5.8 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (1.6.0)\n", - "Requirement already satisfied: networkx>=3.0 in 
/mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (3.1)\n", - "Requirement already satisfied: nltk<4.0.0,>=3.8.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (3.8.1)\n", - "Requirement already satisfied: numpy in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (1.24.4)\n", - "Requirement already satisfied: openai>=1.1.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (1.12.0)\n", - "Requirement already satisfied: pandas in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (2.0.3)\n", - "Requirement already satisfied: pillow>=9.0.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (10.2.0)\n", - "Requirement already satisfied: requests>=2.31.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (2.31.0)\n", - "Requirement already satisfied: tenacity<9.0.0,>=8.2.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (8.2.3)\n", - "Requirement already satisfied: tiktoken>=0.3.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (0.6.0)\n", - "Requirement already satisfied: tqdm<5.0.0,>=4.66.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (4.66.2)\n", - "Requirement already satisfied: typing-extensions>=4.5.0 in 
/mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (4.9.0)\n", - "Requirement already satisfied: typing-inspect>=0.8.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (0.9.0)\n", - "Requirement already satisfied: aiosignal>=1.1.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (1.3.1)\n", - "Requirement already satisfied: attrs>=17.3.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (23.2.0)\n", - "Requirement already satisfied: frozenlist>=1.1.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (1.4.1)\n", - "Requirement already satisfied: multidict<7.0,>=4.5 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (6.0.5)\n", - "Requirement already satisfied: yarl<2.0,>=1.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (1.9.4)\n", - "Requirement already satisfied: async-timeout<5.0,>=4.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp<4.0.0,>=3.8.6->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (4.0.3)\n", - "Requirement already satisfied: wrapt<2,>=1.10 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from deprecated>=1.2.9.3->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (1.16.0)\n", - "Requirement already satisfied: pydantic>=1.10 in 
/mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from llamaindex-py-client<0.2.0,>=0.1.13->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (1.10.11)\n", - "Requirement already satisfied: anyio in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (4.3.0)\n", - "Requirement already satisfied: certifi in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (2024.2.2)\n", - "Requirement already satisfied: httpcore==1.* in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (1.0.4)\n", - "Requirement already satisfied: idna in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (3.6)\n", - "Requirement already satisfied: sniffio in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (1.3.0)\n", - "Requirement already satisfied: h11<0.15,>=0.13 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from httpcore==1.*->httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (0.14.0)\n", - "Requirement already satisfied: click in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from nltk<4.0.0,>=3.8.1->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (8.1.7)\n", - "Requirement already satisfied: joblib in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from nltk<4.0.0,>=3.8.1->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (1.3.2)\n", - "Requirement already satisfied: regex>=2021.8.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from nltk<4.0.0,>=3.8.1->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) 
(2023.12.25)\n", - "Requirement already satisfied: distro<2,>=1.7.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from openai>=1.1.0->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (1.9.0)\n", - "Requirement already satisfied: charset-normalizer<4,>=2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from requests>=2.31.0->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (3.3.2)\n", - "Requirement already satisfied: urllib3<3,>=1.21.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from requests>=2.31.0->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (2.2.1)\n", - "Requirement already satisfied: greenlet!=0.4.17 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from SQLAlchemy>=1.4.49->SQLAlchemy[asyncio]>=1.4.49->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (3.0.3)\n", - "Requirement already satisfied: mypy-extensions>=0.3.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from typing-inspect>=0.8.0->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (1.0.0)\n", - "Requirement already satisfied: marshmallow<4.0.0,>=3.18.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from dataclasses-json->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (3.20.2)\n", - "Requirement already satisfied: python-dateutil>=2.8.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pandas->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (2.8.2)\n", - "Requirement already satisfied: pytz>=2020.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pandas->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (2024.1)\n", - "Requirement already satisfied: tzdata>=2022.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pandas->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (2024.1)\n", - "Requirement 
already satisfied: exceptiongroup>=1.0.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from anyio->httpx->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (1.2.0)\n", - "Requirement already satisfied: packaging>=17.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from marshmallow<4.0.0,>=3.18.0->dataclasses-json->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (23.2)\n", - "Requirement already satisfied: six>=1.5 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from python-dateutil>=2.8.2->pandas->llama-index-core<0.11.0,>=0.10.1->llama-index-llms-fireworks) (1.16.0)\n", - "Requirement already satisfied: pymongo in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (4.6.2)\n", - "Requirement already satisfied: dnspython<3.0.0,>=1.16.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pymongo) (2.6.1)\n", - "Requirement already satisfied: datasets in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (2.17.1)\n", - "Requirement already satisfied: filelock in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from datasets) (3.13.1)\n", - "Requirement already satisfied: numpy>=1.17 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from datasets) (1.24.4)\n", - "Requirement already satisfied: pyarrow>=12.0.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from datasets) (15.0.0)\n", - "Requirement already satisfied: pyarrow-hotfix in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from datasets) (0.6)\n", - "Requirement already satisfied: dill<0.3.9,>=0.3.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from datasets) (0.3.8)\n", - "Requirement already satisfied: pandas in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from datasets) (2.0.3)\n", - "Requirement already satisfied: requests>=2.19.0 in 
/mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from datasets) (2.31.0)\n", - "Requirement already satisfied: tqdm>=4.62.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from datasets) (4.66.2)\n", - "Requirement already satisfied: xxhash in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from datasets) (3.4.1)\n", - "Requirement already satisfied: multiprocess in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from datasets) (0.70.16)\n", - "Requirement already satisfied: fsspec<=2023.10.0,>=2023.1.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from fsspec[http]<=2023.10.0,>=2023.1.0->datasets) (2023.10.0)\n", - "Requirement already satisfied: aiohttp in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from datasets) (3.9.3)\n", - "Requirement already satisfied: huggingface-hub>=0.19.4 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from datasets) (0.20.3)\n", - "Requirement already satisfied: packaging in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from datasets) (23.2)\n", - "Requirement already satisfied: pyyaml>=5.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from datasets) (6.0.1)\n", - "Requirement already satisfied: aiosignal>=1.1.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp->datasets) (1.3.1)\n", - "Requirement already satisfied: attrs>=17.3.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp->datasets) (23.2.0)\n", - "Requirement already satisfied: frozenlist>=1.1.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp->datasets) (1.4.1)\n", - "Requirement already satisfied: multidict<7.0,>=4.5 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp->datasets) (6.0.5)\n", - "Requirement already satisfied: yarl<2.0,>=1.0 in 
/mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp->datasets) (1.9.4)\n", - "Requirement already satisfied: async-timeout<5.0,>=4.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from aiohttp->datasets) (4.0.3)\n", - "Requirement already satisfied: typing-extensions>=3.7.4.3 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from huggingface-hub>=0.19.4->datasets) (4.9.0)\n", - "Requirement already satisfied: charset-normalizer<4,>=2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from requests>=2.19.0->datasets) (3.3.2)\n", - "Requirement already satisfied: idna<4,>=2.5 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from requests>=2.19.0->datasets) (3.6)\n", - "Requirement already satisfied: urllib3<3,>=1.21.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from requests>=2.19.0->datasets) (2.2.1)\n", - "Requirement already satisfied: certifi>=2017.4.17 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from requests>=2.19.0->datasets) (2024.2.2)\n", - "Requirement already satisfied: python-dateutil>=2.8.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pandas->datasets) (2.8.2)\n", - "Requirement already satisfied: pytz>=2020.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pandas->datasets) (2024.1)\n", - "Requirement already satisfied: tzdata>=2022.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pandas->datasets) (2024.1)\n", - "Requirement already satisfied: six>=1.5 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from python-dateutil>=2.8.2->pandas->datasets) (1.16.0)\n", - "Requirement already satisfied: pandas in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (2.0.3)\n", - "Requirement already satisfied: python-dateutil>=2.8.2 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pandas) 
(2.8.2)\n", - "Requirement already satisfied: pytz>=2020.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pandas) (2024.1)\n", - "Requirement already satisfied: tzdata>=2022.1 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pandas) (2024.1)\n", - "Requirement already satisfied: numpy>=1.21.0 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from pandas) (1.24.4)\n", - "Requirement already satisfied: six>=1.5 in /mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages (from python-dateutil>=2.8.2->pandas) (1.16.0)\n" - ] - } - ], + "outputs": [], "source": [ "!pip install -q llama-index llama-index-vector-stores-mongodb llama-index-embeddings-fireworks==0.1.2 llama-index-llms-fireworks\n", "!pip install -q pymongo datasets pandas" @@ -369,6 +29,14 @@ "execution_count": null, "metadata": {}, "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/mnt/disks/data/llama_index/.venv/lib/python3.10/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. 
See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n", + " from .autonotebook import tqdm as notebook_tqdm\n" + ] + }, { "data": { "text/html": [ @@ -596,23 +264,6 @@ "dataset_df.head(5)" ] }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "# Remove data point where fullplot coloumn is missing\n", - "# dataset_df = dataset_df.dropna(subset=[\"fullplot\"])\n", - "# print(\"\\nNumber of missing values in each column after removal:\")\n", - "# print(dataset_df.isnull().sum())\n", - "\n", - "# # Remove the plot_embedding from each data point in the dataset as we are going to create new embeddings with the new OpenAI emebedding Model \"text-embedding-3-small\"\n", - "# dataset_df = dataset_df.drop(columns=[\"plot_embedding\"])\n", - "\n", - "# dataset_df.head(5)" - ] - }, { "cell_type": "code", "execution_count": null, @@ -624,7 +275,7 @@ "from llama_index.embeddings.fireworks import FireworksEmbedding\n", "\n", "embed_model = FireworksEmbedding(\n", - " embed_batch_size=1024,\n", + " embed_batch_size=512,\n", " model_name=\"nomic-ai/nomic-embed-text-v1.5\",\n", " api_key=fw_api_key,\n", ")\n", @@ -659,15 +310,14 @@ "_id=>{'$oid': '6095a34a7c34416a90d3206b'}\n", "name=>\"Baby Bo'S Burritos\"\n", "menu=>null\n", - "TakeOut=>True\n", - "location=>{'coordinates': [-73.975981, 40.745132], 'type': 'Point'}\n", + "TakeOut=>true\n", "PriceRange=>1.0\n", "HappyHour=>null\n", "review_count=>10\n", "sponsored=>None\n", "stars=>2.5\n", "-----\n", - "Content: {\"restaurant_id\": \"40366661\", \"attributes\": \"{\\\"Alcohol\\\": \\\"'none'\\\", \\\"Ambience\\\": \\\"{'romantic': False, 'intimate': False, 'classy': False, 'hipster': False, 'divey': False, 'touristy': False, 'trendy': False, 'upscale': False, 'casual': False}\\\", \\\"BYOB\\\": null, \\\"BestNights\\\": null, \\\"BikeParking\\\": null, \\\"BusinessAcceptsBitcoin\\\": null, \\\"BusinessAcceptsCreditCards\\\": null, \\\"BusinessParking\\\": 
\\\"None\\\", \\\"Caters\\\": \\\"True\\\", \\\"DriveThru\\\": null, \\\"GoodForDancing\\\": null, \\\"GoodForKids\\\": \\\"True\\\", \\\"GoodForMeal\\\": null, \\\"HasTV\\\": \\\"True\\\", \\\"Music\\\": null, \\\"NoiseLevel\\\": \\\"'average'\\\", \\\"RestaurantsAttire\\\": \\\"'casual'\\\", \\\"RestaurantsDelivery\\\": \\\"True\\\", \\\"RestaurantsGoodForGroups\\\": \\\"True\\\", \\\"RestaurantsReservations\\\": \\\"True\\\", \\\"RestaurantsTableService\\\": \\\"False\\\", \\\"WheelchairAccessible\\\": \\\"True\\\", \\\"WiFi\\\": \\\"'free'\\\"}\", \"cuisine\": \"\\\"Tex-Mex\\\"\", \"DogsAllowed\": null, \"OutdoorSeating\": true, \"borough\": \"\\\"Manhattan\\\"\", \"address\": \"{\\\"building\\\": \\\"627\\\", \\\"coord\\\": [-73.975981, 40.745132], \\\"street\\\": \\\"2 Avenue\\\", \\\"zipcode\\\": \\\"10016\\\"}\", \"_id\": {\"$oid\": \"6095a34a7c34416a90d3206b\"}, \"name\": \"\\\"Baby Bo'S Burritos\\\"\", \"menu\": \"null\", \"TakeOut\": true, \"location\": {\"coordinates\": [-73.975981, 40.745132], \"type\": \"Point\"}, \"PriceRange\": \"1.0\", \"HappyHour\": \"null\", \"review_count\": \"10\", \"sponsored\": null, \"stars\": 2.5}\n", + "Content: {\"restaurant_id\": \"40366661\", \"attributes\": \"{\\\"Alcohol\\\": \\\"'none'\\\", \\\"Ambience\\\": \\\"{'romantic': False, 'intimate': False, 'classy': False, 'hipster': False, 'divey': False, 'touristy': False, 'trendy': False, 'upscale': False, 'casual': False}\\\", \\\"BYOB\\\": null, \\\"BestNights\\\": null, \\\"BikeParking\\\": null, \\\"BusinessAcceptsBitcoin\\\": null, \\\"BusinessAcceptsCreditCards\\\": null, \\\"BusinessParking\\\": \\\"None\\\", \\\"Caters\\\": \\\"True\\\", \\\"DriveThru\\\": null, \\\"GoodForDancing\\\": null, \\\"GoodForKids\\\": \\\"True\\\", \\\"GoodForMeal\\\": null, \\\"HasTV\\\": \\\"True\\\", \\\"Music\\\": null, \\\"NoiseLevel\\\": \\\"'average'\\\", \\\"RestaurantsAttire\\\": \\\"'casual'\\\", \\\"RestaurantsDelivery\\\": \\\"True\\\", \\\"RestaurantsGoodForGroups\\\": 
\\\"True\\\", \\\"RestaurantsReservations\\\": \\\"True\\\", \\\"RestaurantsTableService\\\": \\\"False\\\", \\\"WheelchairAccessible\\\": \\\"True\\\", \\\"WiFi\\\": \\\"'free'\\\"}\", \"cuisine\": \"\\\"Tex-Mex\\\"\", \"DogsAllowed\": null, \"OutdoorSeating\": true, \"borough\": \"\\\"Manhattan\\\"\", \"address\": \"{\\\"building\\\": \\\"627\\\", \\\"coord\\\": [-73.975981, 40.745132], \\\"street\\\": \\\"2 Avenue\\\", \\\"zipcode\\\": \\\"10016\\\"}\", \"_id\": {\"$oid\": \"6095a34a7c34416a90d3206b\"}, \"name\": \"\\\"Baby Bo'S Burritos\\\"\", \"menu\": \"null\", \"TakeOut\": \"true\", \"PriceRange\": \"1.0\", \"HappyHour\": \"null\", \"review_count\": \"10\", \"sponsored\": null, \"stars\": 2.5}\n", "\n", "The Embedding model sees this: \n", " Metadata: restaurant_id=>40366661\n", @@ -680,15 +330,14 @@ "_id=>{'$oid': '6095a34a7c34416a90d3206b'}\n", "name=>\"Baby Bo'S Burritos\"\n", "menu=>null\n", - "TakeOut=>True\n", - "location=>{'coordinates': [-73.975981, 40.745132], 'type': 'Point'}\n", + "TakeOut=>true\n", "PriceRange=>1.0\n", "HappyHour=>null\n", "review_count=>10\n", "sponsored=>None\n", "stars=>2.5\n", "-----\n", - "Content: {\"restaurant_id\": \"40366661\", \"attributes\": \"{\\\"Alcohol\\\": \\\"'none'\\\", \\\"Ambience\\\": \\\"{'romantic': False, 'intimate': False, 'classy': False, 'hipster': False, 'divey': False, 'touristy': False, 'trendy': False, 'upscale': False, 'casual': False}\\\", \\\"BYOB\\\": null, \\\"BestNights\\\": null, \\\"BikeParking\\\": null, \\\"BusinessAcceptsBitcoin\\\": null, \\\"BusinessAcceptsCreditCards\\\": null, \\\"BusinessParking\\\": \\\"None\\\", \\\"Caters\\\": \\\"True\\\", \\\"DriveThru\\\": null, \\\"GoodForDancing\\\": null, \\\"GoodForKids\\\": \\\"True\\\", \\\"GoodForMeal\\\": null, \\\"HasTV\\\": \\\"True\\\", \\\"Music\\\": null, \\\"NoiseLevel\\\": \\\"'average'\\\", \\\"RestaurantsAttire\\\": \\\"'casual'\\\", \\\"RestaurantsDelivery\\\": \\\"True\\\", \\\"RestaurantsGoodForGroups\\\": \\\"True\\\", 
\\\"RestaurantsReservations\\\": \\\"True\\\", \\\"RestaurantsTableService\\\": \\\"False\\\", \\\"WheelchairAccessible\\\": \\\"True\\\", \\\"WiFi\\\": \\\"'free'\\\"}\", \"cuisine\": \"\\\"Tex-Mex\\\"\", \"DogsAllowed\": null, \"OutdoorSeating\": true, \"borough\": \"\\\"Manhattan\\\"\", \"address\": \"{\\\"building\\\": \\\"627\\\", \\\"coord\\\": [-73.975981, 40.745132], \\\"street\\\": \\\"2 Avenue\\\", \\\"zipcode\\\": \\\"10016\\\"}\", \"_id\": {\"$oid\": \"6095a34a7c34416a90d3206b\"}, \"name\": \"\\\"Baby Bo'S Burritos\\\"\", \"menu\": \"null\", \"TakeOut\": true, \"location\": {\"coordinates\": [-73.975981, 40.745132], \"type\": \"Point\"}, \"PriceRange\": \"1.0\", \"HappyHour\": \"null\", \"review_count\": \"10\", \"sponsored\": null, \"stars\": 2.5}\n" + "Content: {\"restaurant_id\": \"40366661\", \"attributes\": \"{\\\"Alcohol\\\": \\\"'none'\\\", \\\"Ambience\\\": \\\"{'romantic': False, 'intimate': False, 'classy': False, 'hipster': False, 'divey': False, 'touristy': False, 'trendy': False, 'upscale': False, 'casual': False}\\\", \\\"BYOB\\\": null, \\\"BestNights\\\": null, \\\"BikeParking\\\": null, \\\"BusinessAcceptsBitcoin\\\": null, \\\"BusinessAcceptsCreditCards\\\": null, \\\"BusinessParking\\\": \\\"None\\\", \\\"Caters\\\": \\\"True\\\", \\\"DriveThru\\\": null, \\\"GoodForDancing\\\": null, \\\"GoodForKids\\\": \\\"True\\\", \\\"GoodForMeal\\\": null, \\\"HasTV\\\": \\\"True\\\", \\\"Music\\\": null, \\\"NoiseLevel\\\": \\\"'average'\\\", \\\"RestaurantsAttire\\\": \\\"'casual'\\\", \\\"RestaurantsDelivery\\\": \\\"True\\\", \\\"RestaurantsGoodForGroups\\\": \\\"True\\\", \\\"RestaurantsReservations\\\": \\\"True\\\", \\\"RestaurantsTableService\\\": \\\"False\\\", \\\"WheelchairAccessible\\\": \\\"True\\\", \\\"WiFi\\\": \\\"'free'\\\"}\", \"cuisine\": \"\\\"Tex-Mex\\\"\", \"DogsAllowed\": null, \"OutdoorSeating\": true, \"borough\": \"\\\"Manhattan\\\"\", \"address\": \"{\\\"building\\\": \\\"627\\\", \\\"coord\\\": [-73.975981, 
40.745132], \\\"street\\\": \\\"2 Avenue\\\", \\\"zipcode\\\": \\\"10016\\\"}\", \"_id\": {\"$oid\": \"6095a34a7c34416a90d3206b\"}, \"name\": \"\\\"Baby Bo'S Burritos\\\"\", \"menu\": \"null\", \"TakeOut\": \"true\", \"PriceRange\": \"1.0\", \"HappyHour\": \"null\", \"review_count\": \"10\", \"sponsored\": null, \"stars\": 2.5}\n" ] } ], @@ -715,21 +364,16 @@ " document[\"PriceRange\"] = json.dumps(document[\"PriceRange\"])\n", " document[\"HappyHour\"] = json.dumps(document[\"HappyHour\"])\n", " document[\"review_count\"] = json.dumps(document[\"review_count\"])\n", + " document[\"TakeOut\"] = json.dumps(document[\"TakeOut\"])\n", + " # these two fields are not relevant to the question we want to answer,\n", + " # so I will skip it for now\n", " del document[\"embedding\"]\n", + " del document[\"location\"]\n", "\n", " # Create a Document object with the text and excluded metadata for llm and embedding models\n", " llama_document = Document(\n", " text=json.dumps(document),\n", " metadata=document,\n", - " # excluded_llm_metadata_keys=[\"embedding\"],\n", - " # excluded_embed_metadata_keys=[\n", - " # \"fullplot\",\n", - " # \"metacritic\",\n", - " # \"poster\",\n", - " # \"num_mflix_comments\",\n", - " # \"runtime\",\n", - " # \"rated\",\n", - " # ],\n", " metadata_template=\"{key}=>{value}\",\n", " text_template=\"Metadata: {metadata_str}\\n-----\\nContent: {content}\",\n", " )\n", @@ -755,7 +399,7 @@ { "data": { "text/plain": [ - "Document(id_='a4e02dc9-3370-4bbd-8207-b7cb84f802ea', embedding=None, metadata={'restaurant_id': '40366661', 'attributes': '{\"Alcohol\": \"\\'none\\'\", \"Ambience\": \"{\\'romantic\\': False, \\'intimate\\': False, \\'classy\\': False, \\'hipster\\': False, \\'divey\\': False, \\'touristy\\': False, \\'trendy\\': False, \\'upscale\\': False, \\'casual\\': False}\", \"BYOB\": null, \"BestNights\": null, \"BikeParking\": null, \"BusinessAcceptsBitcoin\": null, \"BusinessAcceptsCreditCards\": null, \"BusinessParking\": \"None\", 
\"Caters\": \"True\", \"DriveThru\": null, \"GoodForDancing\": null, \"GoodForKids\": \"True\", \"GoodForMeal\": null, \"HasTV\": \"True\", \"Music\": null, \"NoiseLevel\": \"\\'average\\'\", \"RestaurantsAttire\": \"\\'casual\\'\", \"RestaurantsDelivery\": \"True\", \"RestaurantsGoodForGroups\": \"True\", \"RestaurantsReservations\": \"True\", \"RestaurantsTableService\": \"False\", \"WheelchairAccessible\": \"True\", \"WiFi\": \"\\'free\\'\"}', 'cuisine': '\"Tex-Mex\"', 'DogsAllowed': None, 'OutdoorSeating': True, 'borough': '\"Manhattan\"', 'address': '{\"building\": \"627\", \"coord\": [-73.975981, 40.745132], \"street\": \"2 Avenue\", \"zipcode\": \"10016\"}', '_id': {'$oid': '6095a34a7c34416a90d3206b'}, 'name': '\"Baby Bo\\'S Burritos\"', 'menu': 'null', 'TakeOut': True, 'location': {'coordinates': [-73.975981, 40.745132], 'type': 'Point'}, 'PriceRange': '1.0', 'HappyHour': 'null', 'review_count': '10', 'sponsored': None, 'stars': 2.5}, excluded_embed_metadata_keys=[], excluded_llm_metadata_keys=[], relationships={}, text='{\"restaurant_id\": \"40366661\", \"attributes\": \"{\\\\\"Alcohol\\\\\": \\\\\"\\'none\\'\\\\\", \\\\\"Ambience\\\\\": \\\\\"{\\'romantic\\': False, \\'intimate\\': False, \\'classy\\': False, \\'hipster\\': False, \\'divey\\': False, \\'touristy\\': False, \\'trendy\\': False, \\'upscale\\': False, \\'casual\\': False}\\\\\", \\\\\"BYOB\\\\\": null, \\\\\"BestNights\\\\\": null, \\\\\"BikeParking\\\\\": null, \\\\\"BusinessAcceptsBitcoin\\\\\": null, \\\\\"BusinessAcceptsCreditCards\\\\\": null, \\\\\"BusinessParking\\\\\": \\\\\"None\\\\\", \\\\\"Caters\\\\\": \\\\\"True\\\\\", \\\\\"DriveThru\\\\\": null, \\\\\"GoodForDancing\\\\\": null, \\\\\"GoodForKids\\\\\": \\\\\"True\\\\\", \\\\\"GoodForMeal\\\\\": null, \\\\\"HasTV\\\\\": \\\\\"True\\\\\", \\\\\"Music\\\\\": null, \\\\\"NoiseLevel\\\\\": \\\\\"\\'average\\'\\\\\", \\\\\"RestaurantsAttire\\\\\": \\\\\"\\'casual\\'\\\\\", \\\\\"RestaurantsDelivery\\\\\": \\\\\"True\\\\\", 
\\\\\"RestaurantsGoodForGroups\\\\\": \\\\\"True\\\\\", \\\\\"RestaurantsReservations\\\\\": \\\\\"True\\\\\", \\\\\"RestaurantsTableService\\\\\": \\\\\"False\\\\\", \\\\\"WheelchairAccessible\\\\\": \\\\\"True\\\\\", \\\\\"WiFi\\\\\": \\\\\"\\'free\\'\\\\\"}\", \"cuisine\": \"\\\\\"Tex-Mex\\\\\"\", \"DogsAllowed\": null, \"OutdoorSeating\": true, \"borough\": \"\\\\\"Manhattan\\\\\"\", \"address\": \"{\\\\\"building\\\\\": \\\\\"627\\\\\", \\\\\"coord\\\\\": [-73.975981, 40.745132], \\\\\"street\\\\\": \\\\\"2 Avenue\\\\\", \\\\\"zipcode\\\\\": \\\\\"10016\\\\\"}\", \"_id\": {\"$oid\": \"6095a34a7c34416a90d3206b\"}, \"name\": \"\\\\\"Baby Bo\\'S Burritos\\\\\"\", \"menu\": \"null\", \"TakeOut\": true, \"location\": {\"coordinates\": [-73.975981, 40.745132], \"type\": \"Point\"}, \"PriceRange\": \"1.0\", \"HappyHour\": \"null\", \"review_count\": \"10\", \"sponsored\": null, \"stars\": 2.5}', start_char_idx=None, end_char_idx=None, text_template='Metadata: {metadata_str}\\n-----\\nContent: {content}', metadata_template='{key}=>{value}', metadata_seperator='\\n')" + "Document(id_='93d3f08d-85f3-494d-a057-19bc834abc29', embedding=None, metadata={'restaurant_id': '40366661', 'attributes': '{\"Alcohol\": \"\\'none\\'\", \"Ambience\": \"{\\'romantic\\': False, \\'intimate\\': False, \\'classy\\': False, \\'hipster\\': False, \\'divey\\': False, \\'touristy\\': False, \\'trendy\\': False, \\'upscale\\': False, \\'casual\\': False}\", \"BYOB\": null, \"BestNights\": null, \"BikeParking\": null, \"BusinessAcceptsBitcoin\": null, \"BusinessAcceptsCreditCards\": null, \"BusinessParking\": \"None\", \"Caters\": \"True\", \"DriveThru\": null, \"GoodForDancing\": null, \"GoodForKids\": \"True\", \"GoodForMeal\": null, \"HasTV\": \"True\", \"Music\": null, \"NoiseLevel\": \"\\'average\\'\", \"RestaurantsAttire\": \"\\'casual\\'\", \"RestaurantsDelivery\": \"True\", \"RestaurantsGoodForGroups\": \"True\", \"RestaurantsReservations\": \"True\", \"RestaurantsTableService\": 
\"False\", \"WheelchairAccessible\": \"True\", \"WiFi\": \"\\'free\\'\"}', 'cuisine': '\"Tex-Mex\"', 'DogsAllowed': None, 'OutdoorSeating': True, 'borough': '\"Manhattan\"', 'address': '{\"building\": \"627\", \"coord\": [-73.975981, 40.745132], \"street\": \"2 Avenue\", \"zipcode\": \"10016\"}', '_id': {'$oid': '6095a34a7c34416a90d3206b'}, 'name': '\"Baby Bo\\'S Burritos\"', 'menu': 'null', 'TakeOut': 'true', 'PriceRange': '1.0', 'HappyHour': 'null', 'review_count': '10', 'sponsored': None, 'stars': 2.5}, excluded_embed_metadata_keys=[], excluded_llm_metadata_keys=[], relationships={}, text='{\"restaurant_id\": \"40366661\", \"attributes\": \"{\\\\\"Alcohol\\\\\": \\\\\"\\'none\\'\\\\\", \\\\\"Ambience\\\\\": \\\\\"{\\'romantic\\': False, \\'intimate\\': False, \\'classy\\': False, \\'hipster\\': False, \\'divey\\': False, \\'touristy\\': False, \\'trendy\\': False, \\'upscale\\': False, \\'casual\\': False}\\\\\", \\\\\"BYOB\\\\\": null, \\\\\"BestNights\\\\\": null, \\\\\"BikeParking\\\\\": null, \\\\\"BusinessAcceptsBitcoin\\\\\": null, \\\\\"BusinessAcceptsCreditCards\\\\\": null, \\\\\"BusinessParking\\\\\": \\\\\"None\\\\\", \\\\\"Caters\\\\\": \\\\\"True\\\\\", \\\\\"DriveThru\\\\\": null, \\\\\"GoodForDancing\\\\\": null, \\\\\"GoodForKids\\\\\": \\\\\"True\\\\\", \\\\\"GoodForMeal\\\\\": null, \\\\\"HasTV\\\\\": \\\\\"True\\\\\", \\\\\"Music\\\\\": null, \\\\\"NoiseLevel\\\\\": \\\\\"\\'average\\'\\\\\", \\\\\"RestaurantsAttire\\\\\": \\\\\"\\'casual\\'\\\\\", \\\\\"RestaurantsDelivery\\\\\": \\\\\"True\\\\\", \\\\\"RestaurantsGoodForGroups\\\\\": \\\\\"True\\\\\", \\\\\"RestaurantsReservations\\\\\": \\\\\"True\\\\\", \\\\\"RestaurantsTableService\\\\\": \\\\\"False\\\\\", \\\\\"WheelchairAccessible\\\\\": \\\\\"True\\\\\", \\\\\"WiFi\\\\\": \\\\\"\\'free\\'\\\\\"}\", \"cuisine\": \"\\\\\"Tex-Mex\\\\\"\", \"DogsAllowed\": null, \"OutdoorSeating\": true, \"borough\": \"\\\\\"Manhattan\\\\\"\", \"address\": \"{\\\\\"building\\\\\": \\\\\"627\\\\\", 
\\\\\"coord\\\\\": [-73.975981, 40.745132], \\\\\"street\\\\\": \\\\\"2 Avenue\\\\\", \\\\\"zipcode\\\\\": \\\\\"10016\\\\\"}\", \"_id\": {\"$oid\": \"6095a34a7c34416a90d3206b\"}, \"name\": \"\\\\\"Baby Bo\\'S Burritos\\\\\"\", \"menu\": \"null\", \"TakeOut\": \"true\", \"PriceRange\": \"1.0\", \"HappyHour\": \"null\", \"review_count\": \"10\", \"sponsored\": null, \"stars\": 2.5}', start_char_idx=None, end_char_idx=None, text_template='Metadata: {metadata_str}\\n-----\\nContent: {content}', metadata_template='{key}=>{value}', metadata_seperator='\\n')" ] }, "execution_count": null, @@ -777,10 +421,24 @@ "\n", "parser = SentenceSplitter()\n", "nodes = parser.get_nodes_from_documents(llama_documents)\n", + "# 25k nodes takes about 10 minutes, will trim it down to 2.5k\n", + "new_nodes = nodes[:2500]\n", "\n", "# There are 25k documents, so we need to do batching. Fortunately LlamaIndex provides good batching\n", "# for embedding models, and we are going to rely on the __call__ method for the model to handle this\n", - "node_embeddings = embed_model(nodes)" + "node_embeddings = embed_model(new_nodes)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "for idx, n in enumerate(new_nodes):\n", + " n.embedding = node_embeddings[idx].embedding\n", + " if \"_id\" in n.metadata:\n", + " del n.metadata[\"_id\"]" ] }, { @@ -813,7 +471,6 @@ ], "source": [ "import pymongo\n", - "from google.colab import userdata\n", "\n", "\n", "def get_mongo_client(mongo_uri):\n", @@ -827,14 +484,18 @@ " return None\n", "\n", "\n", - "mongo_uri = userdata.get(\"MONGO_URI\")\n", + "# set up Fireworks.ai Key\n", + "import os\n", + "import getpass\n", + "\n", + "mongo_uri = getpass.getpass(\"MONGO_URI:\")\n", "if not mongo_uri:\n", - " print(\"MONGO_URI not set in environment variables\")\n", + " print(\"MONGO_URI not set\")\n", "\n", "mongo_client = get_mongo_client(mongo_uri)\n", "\n", - "DB_NAME = \"movies\"\n", - "COLLECTION_NAME 
= \"movies_records\"\n", + "DB_NAME = \"whatscooking\"\n", + "COLLECTION_NAME = \"restaurants\"\n", "\n", "db = mongo_client[DB_NAME]\n", "collection = db[COLLECTION_NAME]" @@ -848,7 +509,7 @@ { "data": { "text/plain": [ - "DeleteResult({'n': 0, 'electionId': ObjectId('7fffffff000000000000000a'), 'opTime': {'ts': Timestamp(1708000722, 1), 't': 10}, 'ok': 1.0, '$clusterTime': {'clusterTime': Timestamp(1708000722, 1), 'signature': {'hash': b'\\xd8\\x1a\\xaci\\xf5EN+\\xe2\\xd1\\xb3y8.${u5P\\xf3', 'keyId': 7320226449804230661}}, 'operationTime': Timestamp(1708000722, 1)}, acknowledged=True)" + "DeleteResult({'n': 0, 'electionId': ObjectId('7fffffff00000000000001ce'), 'opTime': {'ts': Timestamp(1708970193, 3), 't': 462}, 'ok': 1.0, '$clusterTime': {'clusterTime': Timestamp(1708970193, 3), 'signature': {'hash': b'\\x9a3H8\\xa1\\x1b\\xb6\\xbb\\xa9\\xc3x\\x17\\x1c\\xeb\\xe9\\x03\\xaa\\xf8\\xf17', 'keyId': 7294687148333072386}}, 'operationTime': Timestamp(1708970193, 3)}, acknowledged=True)" ] }, "execution_count": null, @@ -876,7 +537,14 @@ " collection_name=COLLECTION_NAME,\n", " index_name=\"vector_index\",\n", ")\n", - "vector_store.add(nodes)" + "vector_store.add(new_nodes)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# now make sure you create the search index with the right name here" ] }, { @@ -890,6 +558,23 @@ "index = VectorStoreIndex.from_vector_store(vector_store)" ] }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Note: you may need to restart the kernel to use updated packages.\n" + ] + } + ], + "source": [ + "%pip install -q matplotlib" + ] + }, { "cell_type": "code", "execution_count": null, @@ -898,7 +583,13 @@ { "data": { "text/markdown": [ - "**`Final Response:`** The movie \"Romancing the Stone\" would be a suitable romantic movie for the Christmas season. 
It is a romantic adventure film that follows a romance writer who sets off on a dangerous adventure to rescue her kidnapped sister. The movie has elements of romance, adventure, and comedy, making it an entertaining choice for the holiday season. Additionally, the movie has received positive reviews and has been nominated for awards, indicating its quality." + "**`Final Response:`** Based on the context provided, two restaurant options that don't serve alcohol are:\n", + "\n", + "1. \"Academy Restauraunt\" in Brooklyn, which serves American cuisine and has a variety of dishes such as Mozzarella sticks, Cheeseburger, Baked potato, Breadsticks, Caesar salad, Chicken parmesan, Pigs in a blanket, Chicken soup, Mac & cheese, Mushroom swiss burger, Spaghetti with meatballs, and Mashed potatoes.\n", + "\n", + "2. \"Gabriel'S Bar & Grill\" in Manhattan, which specializes in Italian cuisine and offers dishes like Cheese Ravioli, Neapolitan Pizza, assorted gelato, Vegetarian Baked Ziti, Vegetarian Broccoli Pizza, Lasagna, Buca Trio Platter, Spinach Ravioli, Pasta with ricotta cheese, Spaghetti, Fried calamari, and Alfredo Pizza.\n", + "\n", + "Both restaurants offer outdoor seating, are kid-friendly, and have a casual dress code. They also provide take-out service and have happy hour promotions." ], "text/plain": [ "" @@ -911,9 +602,8 @@ "name": "stdout", "output_type": "stream", "text": [ - "[NodeWithScore(node=TextNode(id_='c6bbc236-e21d-49ab-b43d-db920b4946e6', embedding=None, metadata={'awards': '{\"nominations\": 2, \"text\": \"Nominated for 1 Oscar. Another 6 wins & 2 nominations.\", \"wins\": 7}', 'metacritic': None, 'rated': 'PG', 'fullplot': \"Joan Wilder, a mousy romance novelist, receives a treasure map in the mail from her recently murdered brother-in-law. Meanwhile, her sister Elaine is kidnapped in Colombia and the two criminals responsible demand that she travel to Colombia to exchange the map for her sister. 
Joan does, and quickly becomes lost in the jungle after being waylayed by Zolo, a vicious and corrupt Colombian cop who will stop at nothing to obtain the map. There, she meets an irreverent soldier-of-fortune named Jack Colton who agrees to bring her back to civilization. Together, they embark upon an adventure that could be straight out of Joan's novels.\", 'title': 'Romancing the Stone', 'writers': '[\"Diane Thomas\"]', 'languages': '[\"English\", \"Spanish\", \"French\"]', 'plot': 'A romance writer sets off to Colombia to ransom her kidnapped sister, and soon finds herself in the middle of a dangerous adventure.', 'runtime': 106.0, 'countries': '[\"USA\", \"Mexico\"]', 'genres': '[\"Action\", \"Adventure\", \"Comedy\"]', 'directors': '[\"Robert Zemeckis\"]', 'cast': '[\"Michael Douglas\", \"Kathleen Turner\", \"Danny DeVito\", \"Zack Norman\"]', 'type': 'movie', 'imdb': '{\"id\": 88011, \"rating\": 6.9, \"votes\": 59403}', 'poster': 'https://m.media-amazon.com/images/M/MV5BMDAwNjljMzEtMTc3Yy00NDg2LThjNDAtNjc0NGYyYjM2M2I1XkEyXkFqcGdeQXVyNDE5MTU2MDE@._V1_SY1000_SX677_AL_.jpg', 'num_mflix_comments': 0}, excluded_embed_metadata_keys=['fullplot', 'metacritic', 'poster', 'num_mflix_comments', 'runtime', 'rated'], excluded_llm_metadata_keys=['fullplot', 'metacritic'], relationships={: RelatedNodeInfo(node_id='e50144b0-96ba-4a5a-b90a-3a2419f5b380', node_type=, metadata={'awards': '{\"nominations\": 2, \"text\": \"Nominated for 1 Oscar. Another 6 wins & 2 nominations.\", \"wins\": 7}', 'metacritic': None, 'rated': 'PG', 'fullplot': \"Joan Wilder, a mousy romance novelist, receives a treasure map in the mail from her recently murdered brother-in-law. Meanwhile, her sister Elaine is kidnapped in Colombia and the two criminals responsible demand that she travel to Colombia to exchange the map for her sister. Joan does, and quickly becomes lost in the jungle after being waylayed by Zolo, a vicious and corrupt Colombian cop who will stop at nothing to obtain the map. 
There, she meets an irreverent soldier-of-fortune named Jack Colton who agrees to bring her back to civilization. Together, they embark upon an adventure that could be straight out of Joan's novels.\", 'title': 'Romancing the Stone', 'writers': '[\"Diane Thomas\"]', 'languages': '[\"English\", \"Spanish\", \"French\"]', 'plot': 'A romance writer sets off to Colombia to ransom her kidnapped sister, and soon finds herself in the middle of a dangerous adventure.', 'runtime': 106.0, 'countries': '[\"USA\", \"Mexico\"]', 'genres': '[\"Action\", \"Adventure\", \"Comedy\"]', 'directors': '[\"Robert Zemeckis\"]', 'cast': '[\"Michael Douglas\", \"Kathleen Turner\", \"Danny DeVito\", \"Zack Norman\"]', 'type': 'movie', 'imdb': '{\"id\": 88011, \"rating\": 6.9, \"votes\": 59403}', 'poster': 'https://m.media-amazon.com/images/M/MV5BMDAwNjljMzEtMTc3Yy00NDg2LThjNDAtNjc0NGYyYjM2M2I1XkEyXkFqcGdeQXVyNDE5MTU2MDE@._V1_SY1000_SX677_AL_.jpg', 'num_mflix_comments': 0}, hash='b984e4f203b7b67eae14afa890718adb800a5816661ac2edf412aa96fd7dc10b'), : RelatedNodeInfo(node_id='f895e43a-038a-4a1c-8a82-0e22868e35d7', node_type=, metadata={'awards': '{\"nominations\": 1, \"text\": \"1 nomination.\", \"wins\": 0}', 'metacritic': None, 'rated': 'R', 'fullplot': \"Chicago psychiatrist Judd Stevens (Roger Moore) is suspected of murdering one of his patients when the man turns up stabbed to death in the middle of the city. After repeated attempts to convince cops Rod Steiger and Elliott Gould of his innocence, Dr.Stevens is forced to go after the real villains himself, and he finds himself up against one of the city's most notorious Mafia kingpins.\", 'title': 'The Naked Face', 'writers': '[\"Bryan Forbes\", \"Sidney Sheldon (novel)\"]', 'languages': '[\"English\"]', 'plot': 'Chicago psychiatrist Judd Stevens (Roger Moore) is suspected of murdering one of his patients when the man turns up stabbed to death in the middle of the city. 
After repeated attempts to ...', 'runtime': 103.0, 'countries': '[\"USA\"]', 'genres': '[\"Action\", \"Mystery\", \"Thriller\"]', 'directors': '[\"Bryan Forbes\"]', 'cast': '[\"Roger Moore\", \"Rod Steiger\", \"Elliott Gould\", \"Art Carney\"]', 'type': 'movie', 'imdb': '{\"id\": 87777, \"rating\": 5.3, \"votes\": 654}', 'poster': 'https://m.media-amazon.com/images/M/MV5BMTg0NDM4MTY0NV5BMl5BanBnXkFtZTcwNTcwOTc2NA@@._V1_SY1000_SX677_AL_.jpg', 'num_mflix_comments': 1}, hash='066e2b3d12c5fab61175f52dd625ec41fb1fce1fe6fe4c892774227c576fdbbd'), : RelatedNodeInfo(node_id='e31f1142-c6b6-4183-b14b-1634166b9d1f', node_type=, metadata={}, hash='9b9127e21d18792749a7a35321e04d29b8d77f7b454b0133205f9de1090038b4')}, text=\"Joan Wilder, a mousy romance novelist, receives a treasure map in the mail from her recently murdered brother-in-law. Meanwhile, her sister Elaine is kidnapped in Colombia and the two criminals responsible demand that she travel to Colombia to exchange the map for her sister. Joan does, and quickly becomes lost in the jungle after being waylayed by Zolo, a vicious and corrupt Colombian cop who will stop at nothing to obtain the map. There, she meets an irreverent soldier-of-fortune named Jack Colton who agrees to bring her back to civilization. Together, they embark upon an adventure that could be straight out of Joan's novels.\", start_char_idx=0, end_char_idx=635, text_template='Metadata: {metadata_str}\\n-----\\nContent: {content}', metadata_template='{key}=>{value}', metadata_seperator='\\n'), score=0.7502920627593994),\n", - " NodeWithScore(node=TextNode(id_='5c7cef95-79e3-4c96-a009-4154ea125240', embedding=None, metadata={'awards': '{\"nominations\": 2, \"text\": \"Nominated for 2 Oscars. Another 1 win & 2 nominations.\", \"wins\": 3}', 'metacritic': 64.0, 'rated': 'PG-13', 'fullplot': 'In 1880, four men travel together to the city of Silverado. 
They come across with many dangers before they finally engage the \"bad guys\" and bring peace and equality back to the city.', 'title': 'Silverado', 'writers': '[\"Lawrence Kasdan\", \"Mark Kasdan\"]', 'languages': '[\"English\"]', 'plot': 'A misfit bunch of friends come together to right the injustices which exist in a small town.', 'runtime': 133.0, 'countries': '[\"USA\"]', 'genres': '[\"Action\", \"Crime\", \"Drama\"]', 'directors': '[\"Lawrence Kasdan\"]', 'cast': '[\"Kevin Kline\", \"Scott Glenn\", \"Kevin Costner\", \"Danny Glover\"]', 'type': 'movie', 'imdb': '{\"id\": 90022, \"rating\": 7.2, \"votes\": 26415}', 'poster': 'https://m.media-amazon.com/images/M/MV5BYTljNTE5YmUtMGEyZi00ZjI4LWEzYjUtZDY2YWEwNzVmZjRkXkEyXkFqcGdeQXVyNTI4MjkwNjA@._V1_SY1000_SX677_AL_.jpg', 'num_mflix_comments': 1}, excluded_embed_metadata_keys=['fullplot', 'metacritic', 'poster', 'num_mflix_comments', 'runtime', 'rated'], excluded_llm_metadata_keys=['fullplot', 'metacritic'], relationships={: RelatedNodeInfo(node_id='decbc30c-c17e-4ba4-bd1e-72dce4ce383a', node_type=, metadata={'awards': '{\"nominations\": 2, \"text\": \"Nominated for 2 Oscars. Another 1 win & 2 nominations.\", \"wins\": 3}', 'metacritic': 64.0, 'rated': 'PG-13', 'fullplot': 'In 1880, four men travel together to the city of Silverado. 
They come across with many dangers before they finally engage the \"bad guys\" and bring peace and equality back to the city.', 'title': 'Silverado', 'writers': '[\"Lawrence Kasdan\", \"Mark Kasdan\"]', 'languages': '[\"English\"]', 'plot': 'A misfit bunch of friends come together to right the injustices which exist in a small town.', 'runtime': 133.0, 'countries': '[\"USA\"]', 'genres': '[\"Action\", \"Crime\", \"Drama\"]', 'directors': '[\"Lawrence Kasdan\"]', 'cast': '[\"Kevin Kline\", \"Scott Glenn\", \"Kevin Costner\", \"Danny Glover\"]', 'type': 'movie', 'imdb': '{\"id\": 90022, \"rating\": 7.2, \"votes\": 26415}', 'poster': 'https://m.media-amazon.com/images/M/MV5BYTljNTE5YmUtMGEyZi00ZjI4LWEzYjUtZDY2YWEwNzVmZjRkXkEyXkFqcGdeQXVyNTI4MjkwNjA@._V1_SY1000_SX677_AL_.jpg', 'num_mflix_comments': 1}, hash='80b77d835c7dfad9d57d300cf69ba388704e6f282f49dc23106489db03b8b441'), : RelatedNodeInfo(node_id='1c04fb7f-ff8f-4e8c-84f6-74c57251446a', node_type=, metadata={'awards': '{\"nominations\": 5, \"text\": \"Nominated for 3 Oscars. Another 2 wins & 5 nominations.\", \"wins\": 5}', 'metacritic': None, 'rated': 'R', 'fullplot': 'A hardened convict and a younger prisoner escape from a brutal prison in the middle of winter only to find themselves on an out-of-control train with a female railway worker while being pursued by the vengeful head of security.', 'title': 'Runaway Train', 'writers': '[\"Djordje Milicevic (screenplay)\", \"Paul Zindel (screenplay)\", \"Edward Bunker (screenplay)\", \"Akira Kurosawa (based on a screenplay by)\"]', 'languages': '[\"English\"]', 'plot': 'Two escaped convicts and a female railway worker find themselves trapped on a train with no brakes and nobody driving.', 'runtime': 111.0, 'countries': '[\"USA\"]', 'genres': '[\"Action\", \"Adventure\", \"Drama\"]', 'directors': '[\"Andrey Konchalovskiy\"]', 'cast': '[\"Jon Voight\", \"Eric Roberts\", \"Rebecca De Mornay\", \"Kyle T. 
Heffner\"]', 'type': 'movie', 'imdb': '{\"id\": 89941, \"rating\": 7.3, \"votes\": 19652}', 'poster': 'https://m.media-amazon.com/images/M/MV5BODQyYWU1NGUtNjEzYS00YmNhLTk1YWEtZDdlZGQzMTI4MTI1XkEyXkFqcGdeQXVyMTQxNzMzNDI@._V1_SY1000_SX677_AL_.jpg', 'num_mflix_comments': 0}, hash='378c16de972df97080db94775cd46e57f6a0dd5a7472b357e0285eed2e3b7775'), : RelatedNodeInfo(node_id='5df9410b-6597-45f4-95d5-fee1db8737b1', node_type=, metadata={}, hash='77e93faace9b0e102635d3ca997ff27bc03dbba66eaa2d830f0634289d16d927')}, text='In 1880, four men travel together to the city of Silverado. They come across with many dangers before they finally engage the \"bad guys\" and bring peace and equality back to the city.', start_char_idx=0, end_char_idx=183, text_template='Metadata: {metadata_str}\\n-----\\nContent: {content}', metadata_template='{key}=>{value}', metadata_seperator='\\n'), score=0.7419796586036682),\n", - " NodeWithScore(node=TextNode(id_='ff28e815-5db5-4963-a9b8-99c64716eb00', embedding=None, metadata={'awards': '{\"nominations\": 1, \"text\": \"1 nomination.\", \"wins\": 0}', 'metacritic': None, 'rated': 'PASSED', 'fullplot': \"Dick Powell stars as Haven, a government private investigator assigned to investigate the murders of two cavalrymen. Travelling incognito, Haven arrives in a small frontier outpost, where saloon singer Charlie controls all illegal activities. 
After making short work of Charlie's burly henchman, Haven gets a job at her gambling emporium, biding his time and gathering evidence against the gorgeous crime chieftain Cast as a philosophical bartender, Burl Ives is afforded at least one opportunity to sing.\", 'title': 'Station West', 'writers': '[\"Frank Fenton (screenplay)\", \"Winston Miller (screenplay)\", \"Luke Short (novel)\"]', 'languages': '[\"English\"]', 'plot': 'When two US cavalrymen transporting a gold shipment get killed, US Army Intelligence investigator John Haven goes undercover to a mining and logging town to find the killers.', 'runtime': 87.0, 'countries': '[\"USA\"]', 'genres': '[\"Action\", \"Mystery\", \"Romance\"]', 'directors': '[\"Sidney Lanfield\"]', 'cast': '[\"Dick Powell\", \"Jane Greer\", \"Agnes Moorehead\", \"Burl Ives\"]', 'type': 'movie', 'imdb': '{\"id\": 40835, \"rating\": 6.8, \"votes\": 578}', 'poster': 'https://m.media-amazon.com/images/M/MV5BN2U3YWJjOWItOWY3Yy00NTMxLTkxMGUtOTQ1MzEzODM2MjRjXkEyXkFqcGdeQXVyNTk1MTk0MDI@._V1_SY1000_SX677_AL_.jpg', 'num_mflix_comments': 1}, excluded_embed_metadata_keys=['fullplot', 'metacritic', 'poster', 'num_mflix_comments', 'runtime', 'rated'], excluded_llm_metadata_keys=['fullplot', 'metacritic'], relationships={: RelatedNodeInfo(node_id='b04254ab-2edb-47c1-9412-646575747ca8', node_type=, metadata={'awards': '{\"nominations\": 1, \"text\": \"1 nomination.\", \"wins\": 0}', 'metacritic': None, 'rated': 'PASSED', 'fullplot': \"Dick Powell stars as Haven, a government private investigator assigned to investigate the murders of two cavalrymen. Travelling incognito, Haven arrives in a small frontier outpost, where saloon singer Charlie controls all illegal activities. 
After making short work of Charlie's burly henchman, Haven gets a job at her gambling emporium, biding his time and gathering evidence against the gorgeous crime chieftain Cast as a philosophical bartender, Burl Ives is afforded at least one opportunity to sing.\", 'title': 'Station West', 'writers': '[\"Frank Fenton (screenplay)\", \"Winston Miller (screenplay)\", \"Luke Short (novel)\"]', 'languages': '[\"English\"]', 'plot': 'When two US cavalrymen transporting a gold shipment get killed, US Army Intelligence investigator John Haven goes undercover to a mining and logging town to find the killers.', 'runtime': 87.0, 'countries': '[\"USA\"]', 'genres': '[\"Action\", \"Mystery\", \"Romance\"]', 'directors': '[\"Sidney Lanfield\"]', 'cast': '[\"Dick Powell\", \"Jane Greer\", \"Agnes Moorehead\", \"Burl Ives\"]', 'type': 'movie', 'imdb': '{\"id\": 40835, \"rating\": 6.8, \"votes\": 578}', 'poster': 'https://m.media-amazon.com/images/M/MV5BN2U3YWJjOWItOWY3Yy00NTMxLTkxMGUtOTQ1MzEzODM2MjRjXkEyXkFqcGdeQXVyNTk1MTk0MDI@._V1_SY1000_SX677_AL_.jpg', 'num_mflix_comments': 1}, hash='90f541ac96dcffa4ac639e6ac25da415471164bf8d7930a29b6aed406d631ede'), : RelatedNodeInfo(node_id='a48d8737-8615-48c1-9d4a-1ee127e34fb9', node_type=, metadata={'awards': '{\"nominations\": 1, \"text\": \"1 nomination.\", \"wins\": 0}', 'metacritic': None, 'rated': 'PASSED', 'fullplot': 'Jefty, owner of a roadhouse in a backwoods town, hires sultry, tough-talking torch singer Lily Stevens against the advice of his manager Pete Morgan. Jefty is smitten with Lily, who in turn exerts her charms on the more resistant Pete. 
When Pete finally falls for her and she turns down Jefty\\'s marriage proposal, they must face Jefty\\'s murderous jealousy and his twisted plots to \"punish\" the two.', 'title': 'Road House', 'writers': '[\"Edward Chodorov (screen play)\", \"Margaret Gruen (story)\", \"Oscar Saul (story)\"]', 'languages': '[\"English\"]', 'plot': 'A night club owner becomes infatuated with a torch singer and frames his best friend/manager for embezzlement when the chanteuse falls in love with him.', 'runtime': 95.0, 'countries': '[\"USA\"]', 'genres': '[\"Action\", \"Drama\", \"Film-Noir\"]', 'directors': '[\"Jean Negulesco\"]', 'cast': '[\"Ida Lupino\", \"Cornel Wilde\", \"Celeste Holm\", \"Richard Widmark\"]', 'type': 'movie', 'imdb': '{\"id\": 40740, \"rating\": 7.3, \"votes\": 1353}', 'poster': 'https://m.media-amazon.com/images/M/MV5BMjc1ZTNkM2UtYzY3Yi00ZWZmLTljYmEtNjYxZDNmYzk2ZjkzXkEyXkFqcGdeQXVyMjUxODE0MDY@._V1_SY1000_SX677_AL_.jpg', 'num_mflix_comments': 2}, hash='040b4a77fcc8fbb5347620e99a217d67b85dcdbd370d91bd23877722a499079f'), : RelatedNodeInfo(node_id='75f37fbc-d75e-4a76-b86f-f15d9260afd1', node_type=, metadata={}, hash='9941706d03783561f3fc3200c26527493a62307f8532dcda60b20948c886b330')}, text=\"Dick Powell stars as Haven, a government private investigator assigned to investigate the murders of two cavalrymen. Travelling incognito, Haven arrives in a small frontier outpost, where saloon singer Charlie controls all illegal activities. 
After making short work of Charlie's burly henchman, Haven gets a job at her gambling emporium, biding his time and gathering evidence against the gorgeous crime chieftain Cast as a philosophical bartender, Burl Ives is afforded at least one opportunity to sing.\", start_char_idx=0, end_char_idx=505, text_template='Metadata: {metadata_str}\\n-----\\nContent: {content}', metadata_template='{key}=>{value}', metadata_seperator='\\n'), score=0.7337073087692261)]\n" + "[NodeWithScore(node=TextNode(id_='5405e68c-19f2-4a65-95d7-f880fa6a8deb', embedding=None, metadata={'restaurant_id': '40385767', 'attributes': '{\"Alcohol\": \"u\\'beer_and_wine\\'\", \"Ambience\": \"{\\'touristy\\': False, \\'hipster\\': False, \\'romantic\\': False, \\'divey\\': False, \\'intimate\\': None, \\'trendy\\': None, \\'upscale\\': False, \\'classy\\': False, \\'casual\\': True}\", \"BYOB\": null, \"BestNights\": \"{\\'monday\\': False, \\'tuesday\\': False, \\'friday\\': True, \\'wednesday\\': False, \\'thursday\\': False, \\'sunday\\': False, \\'saturday\\': True}\", \"BikeParking\": \"True\", \"BusinessAcceptsBitcoin\": \"False\", \"BusinessAcceptsCreditCards\": \"True\", \"BusinessParking\": \"{\\'garage\\': False, \\'street\\': False, \\'validated\\': False, \\'lot\\': True, \\'valet\\': False}\", \"Caters\": \"True\", \"DriveThru\": null, \"GoodForDancing\": \"False\", \"GoodForKids\": \"True\", \"GoodForMeal\": \"{\\'dessert\\': False, \\'latenight\\': False, \\'lunch\\': True, \\'dinner\\': True, \\'brunch\\': False, \\'breakfast\\': False}\", \"HasTV\": \"True\", \"Music\": \"{\\'dj\\': False, \\'background_music\\': False, \\'no_music\\': False, \\'jukebox\\': False, \\'live\\': False, \\'video\\': False, \\'karaoke\\': False}\", \"NoiseLevel\": \"u\\'average\\'\", \"RestaurantsAttire\": \"u\\'casual\\'\", \"RestaurantsDelivery\": \"None\", \"RestaurantsGoodForGroups\": \"True\", \"RestaurantsReservations\": \"True\", \"RestaurantsTableService\": \"True\", \"WheelchairAccessible\": 
\"True\", \"WiFi\": \"u\\'free\\'\"}', 'cuisine': '\"American\"', 'DogsAllowed': True, 'OutdoorSeating': True, 'borough': '\"Brooklyn\"', 'address': '{\"building\": \"69\", \"coord\": [-73.9757464, 40.687295], \"street\": \"Lafayette Avenue\", \"zipcode\": \"11217\"}', 'name': '\"Academy Restauraunt\"', 'menu': '[\"Mozzarella sticks\", \"Cheeseburger\", \"Baked potato\", \"Breadsticks\", \"Caesar salad\", \"Chicken parmesan\", \"Pigs in a blanket\", \"Chicken soup\", \"Mac & cheese\", \"Mushroom swiss burger\", \"Spaghetti with meatballs\", \"Mashed potatoes\"]', 'TakeOut': 'true', 'PriceRange': '2.0', 'HappyHour': 'true', 'review_count': '173', 'sponsored': None, 'stars': 4.5}, excluded_embed_metadata_keys=[], excluded_llm_metadata_keys=[], relationships={: RelatedNodeInfo(node_id='bbfc4bf5-d9c3-4f3b-8c1f-ddcf94f3b5df', node_type=, metadata={'restaurant_id': '40385767', 'attributes': '{\"Alcohol\": \"u\\'beer_and_wine\\'\", \"Ambience\": \"{\\'touristy\\': False, \\'hipster\\': False, \\'romantic\\': False, \\'divey\\': False, \\'intimate\\': None, \\'trendy\\': None, \\'upscale\\': False, \\'classy\\': False, \\'casual\\': True}\", \"BYOB\": null, \"BestNights\": \"{\\'monday\\': False, \\'tuesday\\': False, \\'friday\\': True, \\'wednesday\\': False, \\'thursday\\': False, \\'sunday\\': False, \\'saturday\\': True}\", \"BikeParking\": \"True\", \"BusinessAcceptsBitcoin\": \"False\", \"BusinessAcceptsCreditCards\": \"True\", \"BusinessParking\": \"{\\'garage\\': False, \\'street\\': False, \\'validated\\': False, \\'lot\\': True, \\'valet\\': False}\", \"Caters\": \"True\", \"DriveThru\": null, \"GoodForDancing\": \"False\", \"GoodForKids\": \"True\", \"GoodForMeal\": \"{\\'dessert\\': False, \\'latenight\\': False, \\'lunch\\': True, \\'dinner\\': True, \\'brunch\\': False, \\'breakfast\\': False}\", \"HasTV\": \"True\", \"Music\": \"{\\'dj\\': False, \\'background_music\\': False, \\'no_music\\': False, \\'jukebox\\': False, \\'live\\': False, \\'video\\': 
False, \\'karaoke\\': False}\", \"NoiseLevel\": \"u\\'average\\'\", \"RestaurantsAttire\": \"u\\'casual\\'\", \"RestaurantsDelivery\": \"None\", \"RestaurantsGoodForGroups\": \"True\", \"RestaurantsReservations\": \"True\", \"RestaurantsTableService\": \"True\", \"WheelchairAccessible\": \"True\", \"WiFi\": \"u\\'free\\'\"}', 'cuisine': '\"American\"', 'DogsAllowed': True, 'OutdoorSeating': True, 'borough': '\"Brooklyn\"', 'address': '{\"building\": \"69\", \"coord\": [-73.9757464, 40.687295], \"street\": \"Lafayette Avenue\", \"zipcode\": \"11217\"}', '_id': {'$oid': '6095a34a7c34416a90d322d1'}, 'name': '\"Academy Restauraunt\"', 'menu': '[\"Mozzarella sticks\", \"Cheeseburger\", \"Baked potato\", \"Breadsticks\", \"Caesar salad\", \"Chicken parmesan\", \"Pigs in a blanket\", \"Chicken soup\", \"Mac & cheese\", \"Mushroom swiss burger\", \"Spaghetti with meatballs\", \"Mashed potatoes\"]', 'TakeOut': 'true', 'PriceRange': '2.0', 'HappyHour': 'true', 'review_count': '173', 'sponsored': None, 'stars': 4.5}, hash='df7870b3103572b05e98091e4d4b52b238175eb08558831b621b6832c0472c2e'), : RelatedNodeInfo(node_id='5fbb14fe-c8a8-4c4c-930d-2e07e4f77b47', node_type=, metadata={'restaurant_id': '40377111', 'attributes': '{\"Alcohol\": null, \"Ambience\": null, \"BYOB\": null, \"BestNights\": null, \"BikeParking\": \"True\", \"BusinessAcceptsBitcoin\": null, \"BusinessAcceptsCreditCards\": \"False\", \"BusinessParking\": \"{\\'garage\\': False, \\'street\\': True, \\'validated\\': False, \\'lot\\': False, \\'valet\\': False}\", \"Caters\": null, \"DriveThru\": \"True\", \"GoodForDancing\": null, \"GoodForKids\": null, \"GoodForMeal\": null, \"HasTV\": null, \"Music\": null, \"NoiseLevel\": null, \"RestaurantsAttire\": null, \"RestaurantsDelivery\": \"True\", \"RestaurantsGoodForGroups\": null, \"RestaurantsReservations\": null, \"RestaurantsTableService\": null, \"WheelchairAccessible\": null, \"WiFi\": null}', 'cuisine': '\"American\"', 'DogsAllowed': None, 'OutdoorSeating': 
None, 'borough': '\"Manhattan\"', 'address': '{\"building\": \"1207\", \"coord\": [-73.9592644, 40.8088612], \"street\": \"Amsterdam Avenue\", \"zipcode\": \"10027\"}', '_id': {'$oid': '6095a34a7c34416a90d321d6'}, 'name': '\"Amsterdam Restaurant & Tapas Lounge\"', 'menu': '[\"Green salad\", \"Cheddar Biscuits\", \"Lasagna\", \"Chicken parmesan\", \"Chicken soup\", \"Pigs in a blanket\", \"Caesar salad\", \"French fries\", \"Baked potato\", \"Mushroom swiss burger\", \"Grilled cheese sandwich\", \"Fried chicken\"]', 'TakeOut': 'true', 'PriceRange': '1.0', 'HappyHour': 'null', 'review_count': '6', 'sponsored': None, 'stars': 5.0}, hash='1261332dd67be495d0639f41b5f6462f87a41aabe20367502ef28074bf13e561'), : RelatedNodeInfo(node_id='10ad1a23-3237-4b68-808d-58fd7b7e5cb6', node_type=, metadata={}, hash='bc64dca2f9210693c3d5174aec305f25b68d080be65a0ae52f9a560f99992bb0')}, text='{\"restaurant_id\": \"40385767\", \"attributes\": \"{\\\\\"Alcohol\\\\\": \\\\\"u\\'beer_and_wine\\'\\\\\", \\\\\"Ambience\\\\\": \\\\\"{\\'touristy\\': False, \\'hipster\\': False, \\'romantic\\': False, \\'divey\\': False, \\'intimate\\': None, \\'trendy\\': None, \\'upscale\\': False, \\'classy\\': False, \\'casual\\': True}\\\\\", \\\\\"BYOB\\\\\": null, \\\\\"BestNights\\\\\": \\\\\"{\\'monday\\': False, \\'tuesday\\': False, \\'friday\\': True, \\'wednesday\\': False, \\'thursday\\': False, \\'sunday\\': False, \\'saturday\\': True}\\\\\", \\\\\"BikeParking\\\\\": \\\\\"True\\\\\", \\\\\"BusinessAcceptsBitcoin\\\\\": \\\\\"False\\\\\", \\\\\"BusinessAcceptsCreditCards\\\\\": \\\\\"True\\\\\", \\\\\"BusinessParking\\\\\": \\\\\"{\\'garage\\': False, \\'street\\': False, \\'validated\\': False, \\'lot\\': True, \\'valet\\': False}\\\\\", \\\\\"Caters\\\\\": \\\\\"True\\\\\", \\\\\"DriveThru\\\\\": null, \\\\\"GoodForDancing\\\\\": \\\\\"False\\\\\", \\\\\"GoodForKids\\\\\": \\\\\"True\\\\\", \\\\\"GoodForMeal\\\\\": \\\\\"{\\'dessert\\': False, \\'latenight\\': False, \\'lunch\\': True, 
\\'dinner\\': True, \\'brunch\\': False, \\'breakfast\\': False}\\\\\", \\\\\"HasTV\\\\\": \\\\\"True\\\\\", \\\\\"Music\\\\\": \\\\\"{\\'dj\\': False, \\'background_music\\': False, \\'no_music\\': False, \\'jukebox\\': False, \\'live\\': False, \\'video\\': False, \\'karaoke\\': False}\\\\\", \\\\\"NoiseLevel\\\\\": \\\\\"u\\'average\\'\\\\\", \\\\\"RestaurantsAttire\\\\\": \\\\\"u\\'casual\\'\\\\\", \\\\\"RestaurantsDelivery\\\\\": \\\\\"None\\\\\", \\\\\"RestaurantsGoodForGroups\\\\\": \\\\\"True\\\\\", \\\\\"RestaurantsReservations\\\\\": \\\\\"True\\\\\", \\\\\"RestaurantsTableService\\\\\": \\\\\"True\\\\\", \\\\\"WheelchairAccessible\\\\\": \\\\\"True\\\\\", \\\\\"WiFi\\\\\": \\\\\"u\\'free\\'\\\\\"}\", \"cuisine\": \"\\\\\"American\\\\\"\", \"DogsAllowed\": true, \"OutdoorSeating\": true, \"borough\": \"\\\\\"Brooklyn\\\\\"\",', start_char_idx=0, end_char_idx=1415, text_template='Metadata: {metadata_str}\\n-----\\nContent: {content}', metadata_template='{key}=>{value}', metadata_seperator='\\n'), score=0.7296431064605713),\n", + " NodeWithScore(node=TextNode(id_='9cd153ba-2ab8-40aa-90f0-9da5ae24c632', embedding=None, metadata={'restaurant_id': '40392690', 'attributes': '{\"Alcohol\": \"u\\'full_bar\\'\", \"Ambience\": \"{\\'touristy\\': None, \\'hipster\\': True, \\'romantic\\': False, \\'divey\\': False, \\'intimate\\': None, \\'trendy\\': True, \\'upscale\\': None, \\'classy\\': True, \\'casual\\': True}\", \"BYOB\": \"False\", \"BestNights\": \"{\\'monday\\': False, \\'tuesday\\': False, \\'friday\\': True, \\'wednesday\\': False, \\'thursday\\': False, \\'sunday\\': False, \\'saturday\\': False}\", \"BikeParking\": \"True\", \"BusinessAcceptsBitcoin\": null, \"BusinessAcceptsCreditCards\": \"True\", \"BusinessParking\": \"{\\'garage\\': False, \\'street\\': True, \\'validated\\': False, \\'lot\\': False, \\'valet\\': False}\", \"Caters\": \"True\", \"DriveThru\": \"False\", \"GoodForDancing\": \"False\", \"GoodForKids\": \"True\", \"GoodForMeal\": 
\"{\\'dessert\\': None, \\'latenight\\': None, \\'lunch\\': True, \\'dinner\\': True, \\'brunch\\': False, \\'breakfast\\': False}\", \"HasTV\": \"False\", \"Music\": \"{\\'dj\\': False, \\'background_music\\': False, \\'no_music\\': False, \\'jukebox\\': False, \\'live\\': False, \\'video\\': False, \\'karaoke\\': False}\", \"NoiseLevel\": \"u\\'average\\'\", \"RestaurantsAttire\": \"\\'casual\\'\", \"RestaurantsDelivery\": \"True\", \"RestaurantsGoodForGroups\": \"True\", \"RestaurantsReservations\": \"False\", \"RestaurantsTableService\": \"True\", \"WheelchairAccessible\": \"True\", \"WiFi\": \"\\'free\\'\"}', 'cuisine': '\"Italian\"', 'DogsAllowed': True, 'OutdoorSeating': True, 'borough': '\"Manhattan\"', 'address': '{\"building\": \"11\", \"coord\": [-73.9828696, 40.7693649], \"street\": \"West 60 Street\", \"zipcode\": \"10023\"}', 'name': '\"Gabriel\\'S Bar & Grill\"', 'menu': '[\"Cheese Ravioli\", \"Neapolitan Pizza\", \"assorted gelato\", \"Vegetarian Baked Ziti\", \"Vegetarian Broccoli Pizza\", \"Lasagna\", \"Buca Trio Platter\", \"Spinach Ravioli\", \"Pasta with ricotta cheese\", \"Spaghetti\", \"Fried calimari\", \"Alfredo Pizza\"]', 'TakeOut': 'true', 'PriceRange': '2.0', 'HappyHour': 'true', 'review_count': '333', 'sponsored': None, 'stars': 4.0}, excluded_embed_metadata_keys=[], excluded_llm_metadata_keys=[], relationships={: RelatedNodeInfo(node_id='77584933-8286-4277-bc56-bed76adcfd37', node_type=, metadata={'restaurant_id': '40392690', 'attributes': '{\"Alcohol\": \"u\\'full_bar\\'\", \"Ambience\": \"{\\'touristy\\': None, \\'hipster\\': True, \\'romantic\\': False, \\'divey\\': False, \\'intimate\\': None, \\'trendy\\': True, \\'upscale\\': None, \\'classy\\': True, \\'casual\\': True}\", \"BYOB\": \"False\", \"BestNights\": \"{\\'monday\\': False, \\'tuesday\\': False, \\'friday\\': True, \\'wednesday\\': False, \\'thursday\\': False, \\'sunday\\': False, \\'saturday\\': False}\", \"BikeParking\": \"True\", \"BusinessAcceptsBitcoin\": null, 
\"BusinessAcceptsCreditCards\": \"True\", \"BusinessParking\": \"{\\'garage\\': False, \\'street\\': True, \\'validated\\': False, \\'lot\\': False, \\'valet\\': False}\", \"Caters\": \"True\", \"DriveThru\": \"False\", \"GoodForDancing\": \"False\", \"GoodForKids\": \"True\", \"GoodForMeal\": \"{\\'dessert\\': None, \\'latenight\\': None, \\'lunch\\': True, \\'dinner\\': True, \\'brunch\\': False, \\'breakfast\\': False}\", \"HasTV\": \"False\", \"Music\": \"{\\'dj\\': False, \\'background_music\\': False, \\'no_music\\': False, \\'jukebox\\': False, \\'live\\': False, \\'video\\': False, \\'karaoke\\': False}\", \"NoiseLevel\": \"u\\'average\\'\", \"RestaurantsAttire\": \"\\'casual\\'\", \"RestaurantsDelivery\": \"True\", \"RestaurantsGoodForGroups\": \"True\", \"RestaurantsReservations\": \"False\", \"RestaurantsTableService\": \"True\", \"WheelchairAccessible\": \"True\", \"WiFi\": \"\\'free\\'\"}', 'cuisine': '\"Italian\"', 'DogsAllowed': True, 'OutdoorSeating': True, 'borough': '\"Manhattan\"', 'address': '{\"building\": \"11\", \"coord\": [-73.9828696, 40.7693649], \"street\": \"West 60 Street\", \"zipcode\": \"10023\"}', '_id': {'$oid': '6095a34b7c34416a90d3243a'}, 'name': '\"Gabriel\\'S Bar & Grill\"', 'menu': '[\"Cheese Ravioli\", \"Neapolitan Pizza\", \"assorted gelato\", \"Vegetarian Baked Ziti\", \"Vegetarian Broccoli Pizza\", \"Lasagna\", \"Buca Trio Platter\", \"Spinach Ravioli\", \"Pasta with ricotta cheese\", \"Spaghetti\", \"Fried calimari\", \"Alfredo Pizza\"]', 'TakeOut': 'true', 'PriceRange': '2.0', 'HappyHour': 'true', 'review_count': '333', 'sponsored': None, 'stars': 4.0}, hash='c4dcc57a697cd2fe3047a280573c0f54bc5236e1d5af2228737af77613c9dbf7'), : RelatedNodeInfo(node_id='6e1ead27-3679-48fb-b160-b47db523a3ce', node_type=, metadata={'restaurant_id': '40392496', 'attributes': '{\"Alcohol\": \"u\\'none\\'\", \"Ambience\": \"{\\'touristy\\': False, \\'hipster\\': False, \\'romantic\\': False, \\'intimate\\': None, \\'trendy\\': False, 
\\'upscale\\': False, \\'classy\\': False, \\'casual\\': True}\", \"BYOB\": null, \"BestNights\": null, \"BikeParking\": \"True\", \"BusinessAcceptsBitcoin\": null, \"BusinessAcceptsCreditCards\": null, \"BusinessParking\": \"{\\'garage\\': False, \\'street\\': True, \\'validated\\': False, \\'lot\\': False, \\'valet\\': False}\", \"Caters\": \"False\", \"DriveThru\": null, \"GoodForDancing\": null, \"GoodForKids\": \"True\", \"GoodForMeal\": \"{\\'dessert\\': False, \\'latenight\\': False, \\'lunch\\': True, \\'dinner\\': True, \\'brunch\\': None, \\'breakfast\\': False}\", \"HasTV\": \"True\", \"Music\": null, \"NoiseLevel\": \"u\\'average\\'\", \"RestaurantsAttire\": \"u\\'casual\\'\", \"RestaurantsDelivery\": \"True\", \"RestaurantsGoodForGroups\": \"False\", \"RestaurantsReservations\": \"False\", \"RestaurantsTableService\": \"True\", \"WheelchairAccessible\": null, \"WiFi\": \"\\'free\\'\"}', 'cuisine': '\"English\"', 'DogsAllowed': True, 'OutdoorSeating': True, 'borough': '\"Manhattan\"', 'address': '{\"building\": \"253\", \"coord\": [-74.0034571, 40.736351], \"street\": \"West 11 Street\", \"zipcode\": \"10014\"}', '_id': {'$oid': '6095a34b7c34416a90d32435'}, 'name': '\"Tartine\"', 'menu': 'null', 'TakeOut': 'true', 'PriceRange': '2.0', 'HappyHour': 'true', 'review_count': '436', 'sponsored': None, 'stars': 4.5}, hash='146bffad5c816926ec1008d966caab7c0df675251ccca5de860f8a2160bb7a34'), : RelatedNodeInfo(node_id='6640911b-3d8e-4bad-a016-4c3d91444b0c', node_type=, metadata={}, hash='39984a7534d6755344f0887e0d6a200eaab562a7dc492afe292040c0022282bd')}, text='{\"restaurant_id\": \"40392690\", \"attributes\": \"{\\\\\"Alcohol\\\\\": \\\\\"u\\'full_bar\\'\\\\\", \\\\\"Ambience\\\\\": \\\\\"{\\'touristy\\': None, \\'hipster\\': True, \\'romantic\\': False, \\'divey\\': False, \\'intimate\\': None, \\'trendy\\': True, \\'upscale\\': None, \\'classy\\': True, \\'casual\\': True}\\\\\", \\\\\"BYOB\\\\\": \\\\\"False\\\\\", \\\\\"BestNights\\\\\": 
\\\\\"{\\'monday\\': False, \\'tuesday\\': False, \\'friday\\': True, \\'wednesday\\': False, \\'thursday\\': False, \\'sunday\\': False, \\'saturday\\': False}\\\\\", \\\\\"BikeParking\\\\\": \\\\\"True\\\\\", \\\\\"BusinessAcceptsBitcoin\\\\\": null, \\\\\"BusinessAcceptsCreditCards\\\\\": \\\\\"True\\\\\", \\\\\"BusinessParking\\\\\": \\\\\"{\\'garage\\': False, \\'street\\': True, \\'validated\\': False, \\'lot\\': False, \\'valet\\': False}\\\\\", \\\\\"Caters\\\\\": \\\\\"True\\\\\", \\\\\"DriveThru\\\\\": \\\\\"False\\\\\", \\\\\"GoodForDancing\\\\\": \\\\\"False\\\\\", \\\\\"GoodForKids\\\\\": \\\\\"True\\\\\", \\\\\"GoodForMeal\\\\\": \\\\\"{\\'dessert\\': None, \\'latenight\\': None, \\'lunch\\': True, \\'dinner\\': True, \\'brunch\\': False, \\'breakfast\\': False}\\\\\", \\\\\"HasTV\\\\\": \\\\\"False\\\\\", \\\\\"Music\\\\\": \\\\\"{\\'dj\\': False, \\'background_music\\': False, \\'no_music\\': False, \\'jukebox\\': False, \\'live\\': False, \\'video\\': False, \\'karaoke\\': False}\\\\\", \\\\\"NoiseLevel\\\\\": \\\\\"u\\'average\\'\\\\\", \\\\\"RestaurantsAttire\\\\\": \\\\\"\\'casual\\'\\\\\", \\\\\"RestaurantsDelivery\\\\\": \\\\\"True\\\\\", \\\\\"RestaurantsGoodForGroups\\\\\": \\\\\"True\\\\\", \\\\\"RestaurantsReservations\\\\\": \\\\\"False\\\\\", \\\\\"RestaurantsTableService\\\\\": \\\\\"True\\\\\", \\\\\"WheelchairAccessible\\\\\": \\\\\"True\\\\\", \\\\\"WiFi\\\\\": \\\\\"\\'free\\'\\\\\"}\", \"cuisine\": \"\\\\\"Italian\\\\\"\", \"DogsAllowed\": true, \"OutdoorSeating\": true,', start_char_idx=0, end_char_idx=1382, text_template='Metadata: {metadata_str}\\n-----\\nContent: {content}', metadata_template='{key}=>{value}', metadata_seperator='\\n'), score=0.7284677028656006)]\n" ] } ], @@ -921,9 +611,9 @@ "import pprint\n", "from llama_index.core.response.notebook_utils import display_response\n", "\n", - "query_engine = index.as_query_engine(similarity_top_k=3)\n", + "query_engine = index.as_query_engine()\n", "\n", - "query = \"Recommend 
a restaurants suitable for the christmas season and justify your selecton\"\n", + "query = \"search query: Anything that doesn't have alcohol in it\"\n", "\n", "response = query_engine.query(query)\n", "display_response(response)\n", diff --git a/docs/getting_started/v0_10_0_migration.md b/docs/getting_started/v0_10_0_migration.md index b25cfb29022e2..27d5bc6390134 100644 --- a/docs/getting_started/v0_10_0_migration.md +++ b/docs/getting_started/v0_10_0_migration.md @@ -2,9 +2,9 @@ With the introduction of LlamaIndex v0.10.0, there were several changes -- integrations have separate `pip installs (See the [full registry](https://pretty-sodium-5e0.notion.site/ce81b247649a44e4b6b35dfb24af28a6?v=53b3c2ced7bb4c9996b81b83c9f01139)) +- integrations have separate `pip install`s (See the [full registry](https://pretty-sodium-5e0.notion.site/ce81b247649a44e4b6b35dfb24af28a6?v=53b3c2ced7bb4c9996b81b83c9f01139)) - many imports changed -- the service context was deprecated +- the `ServiceContext` was deprecated Thankfully, we've tried to make these changes as easy as possible! @@ -72,7 +72,7 @@ from llama_index.core import Settings Settings.llm = llm Settings.embed_model = embed_model -Setting.chunk_size = 512 +Settings.chunk_size = 512 ``` You can see the `ServiceContext` -> `Settings` migration guide for [more details](/module_guides/supporting_modules/service_context_migration.md). diff --git a/docs/index.rst b/docs/index.rst index 7799e24493afb..ea8fe43e671c5 100644 --- a/docs/index.rst +++ b/docs/index.rst @@ -19,7 +19,7 @@ You may choose to **fine-tune** a LLM with your data, but: - Due to the cost to train, it's **hard to update** a LLM with latest information. - **Observability** is lacking. When you ask a LLM a question, it's not obvious how the LLM arrived at its answer. 
-Instead of fine-tuning, one can a context augmentation pattern called `Retrieval-Augmented Generation (RAG) <./getting_started/concepts.html>`_ to obtain more accurate text generation relevant to your specific data. RAG involves the following high level steps: +Instead of fine-tuning, one can use a context augmentation pattern called `Retrieval-Augmented Generation (RAG) <./getting_started/concepts.html>`_ to obtain more accurate text generation relevant to your specific data. RAG involves the following high-level steps: 1. Retrieve information from your data sources first, 2. Add it to your question as context, and @@ -36,7 +36,7 @@ In doing so, RAG overcomes all three weaknesses of the fine-tuning approach: Firstly, LlamaIndex imposes no restriction on how you use LLMs. You can still use LLMs as auto-complete, chatbots, semi-autonomous agents, and more (see Use Cases on the left). It only makes LLMs more relevant to you. -LlamaIndex provides the following tools to help you quickly standup production-ready RAG systems: +LlamaIndex provides the following tools to help you quickly stand up production-ready RAG systems: - **Data connectors** ingest your existing data from their native source and format. These could be APIs, PDFs, SQL, and (much) more. - **Data indexes** structure your data in intermediate representations that are easy and performant for LLMs to consume. @@ -70,7 +70,7 @@ We recommend starting at `how to read these docs <./getting_started/reading.html To download or contribute, find LlamaIndex on: -- Github: https://github.com/jerryjliu/llama_index +- GitHub: https://github.com/run-llama/llama_index - PyPi: - LlamaIndex: https://pypi.org/project/llama-index/. 
diff --git a/docs/module_guides/models/llms.md b/docs/module_guides/models/llms.md index 7e999730e07e5..366584f8e0cba 100644 --- a/docs/module_guides/models/llms.md +++ b/docs/module_guides/models/llms.md @@ -91,11 +91,11 @@ If you have ways to improve the setup for existing notebooks, contributions to c | Model Name | Basic Query Engines | Router Query Engine | Sub Question Query Engine | Text2SQL | Pydantic Programs | Data Agents |
Notes
| | ------------------------------------------------------------------------------------------------------------------------ | ------------------- | ------------------- | ------------------------- | -------- | ----------------- | ----------- | --------------------------------------- | -| [gpt-3.5-turbo](https://colab.research.google.com/drive/1oVqUAkn0GCBG5OCs3oMUPlNQDdpDTH_c?usp=sharing) (openai) | ✅ | ✅ | ✅ | ✅ | ✅ | ✅ | | -| [gpt-3.5-turbo-instruct](https://colab.research.google.com/drive/1DrVdx-VZ3dXwkwUVZQpacJRgX7sOa4ow?usp=sharing) (openai) | ✅ | ✅ | ✅ | ✅ | ✅ | ⚠️ | Tool usage in data-agents seems flakey. | -| [gpt-4](https://colab.research.google.com/drive/1RsBoT96esj1uDID-QE8xLrOboyHKp65L?usp=sharing) (openai) | ✅ | ✅ | ✅ | ✅ | ✅ | ✅ | | -| [claude-2](https://colab.research.google.com/drive/1os4BuDS3KcI8FCcUM_2cJma7oI2PGN7N?usp=sharing) (anthropic) | ✅ | ✅ | ✅ | ✅ | ✅ | ⚠️ | Prone to hallucinating tool inputs. | -| [claude-instant-1.2](https://colab.research.google.com/drive/1wt3Rt2OWBbqyeRYdiLfmB0_OIUOGit_D?usp=sharing) (anthropic) | ✅ | ✅ | ✅ | ✅ | ✅ | ⚠️ | Prone to hallucinating tool inputs. | +| [gpt-3.5-turbo](https://colab.research.google.com/drive/1vvdcf7VYNQA67NOxBHCyQvgb2Pu7iY_5?usp=sharing) (openai) | ✅ | ✅ | ✅ | ✅ | ✅ | ✅ | | +| [gpt-3.5-turbo-instruct](https://colab.research.google.com/drive/1Ne-VmMNYGOKUeECvkjurdKqMDpfqJQHE?usp=sharing) (openai) | ✅ | ✅ | ✅ | ✅ | ✅ | ⚠️ | Tool usage in data-agents seems flakey. | +| [gpt-4](https://colab.research.google.com/drive/1QUNyCVt8q5G32XHNztGw4YJ2EmEkeUe8?usp=sharing) (openai) | ✅ | ✅ | ✅ | ✅ | ✅ | ✅ | | +| [claude-2](https://colab.research.google.com/drive/1IuHRN67MYOaLx2_AgJ9gWVtlK7bIvS1f?usp=sharing) (anthropic) | ✅ | ✅ | ✅ | ✅ | ✅ | ⚠️ | Prone to hallucinating tool inputs. | +| [claude-instant-1.2](https://colab.research.google.com/drive/1ahq-2kXwCVCA_3xyC5UMWHyfAcjoG8Gp?usp=sharing) (anthropic) | ✅ | ✅ | ✅ | ✅ | ✅ | ⚠️ | Prone to hallucinating tool inputs. 
| ### Open Source LLMs @@ -103,14 +103,14 @@ Since open source LLMs require large amounts of resources, the quantization is r | Model Name | Basic Query Engines | Router Query Engine | SubQuestion Query Engine | Text2SQL | Pydantic Programs | Data Agents |
Notes
| | ------------------------------------------------------------------------------------------------------------------------------------ | ------------------- | ------------------- | ------------------------ | -------- | ----------------- | ----------- | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- | -| [llama2-chat-7b 4bit](https://colab.research.google.com/drive/14N-hmJ87wZsFqHktrw40OU6sVcsiSzlQ?usp=sharing) (huggingface) | ✅ | 🛑 | 🛑 | 🛑 | 🛑 | ⚠️ | Llama2 seems to be quite chatty, which makes parsing structured outputs difficult. Fine-tuning and prompt engineering likely required for better performance on structured outputs. | -| [llama2-13b-chat](https://colab.research.google.com/drive/1S3eCZ8goKjFktF9hIakzcHqDE72g0Ggb?usp=sharing) (replicate) | ✅ | ✅ | 🛑 | ✅ | 🛑 | 🛑 | Our ReAct prompt expects structured outputs, which llama-13b struggles at | -| [llama2-70b-chat](https://colab.research.google.com/drive/1BeOuVI8StygKFTLSpZ0vGCouxar2V5UW?usp=sharing) (replicate) | ✅ | ✅ | ✅ | ✅ | 🛑 | ⚠️ | There are still some issues with parsing structured outputs, especially with pydantic programs. | -| [Mistral-7B-instruct-v0.1 4bit](https://colab.research.google.com/drive/1ZAdrabTJmZ_etDp10rjij_zME2Q3umAQ?usp=sharing) (huggingface) | ✅ | 🛑 | 🛑 | ⚠️ | ⚠️ | ⚠️ | Mistral seems slightly more reliable for structured outputs compared to Llama2. Likely with some prompt engineering, it may do better. | -| [zephyr-7b-alpha](https://colab.research.google.com/drive/16Ygf2IyGNkb725ZqtRmFQjwWBuzFX_kl?usp=sharing) (huggingface) | ✅ | ✅ | ✅ | ✅ | ✅ | ⚠️ | Overall, `zyphyr-7b-alpha` is appears to be more reliable than other open-source models of this size. Although it still hallucinates a bit, especially as an agent. 
| -| [zephyr-7b-beta](https://colab.research.google.com/drive/1UoPcoiA5EOBghxWKWduQhChliMHxla7U?usp=sharing) (huggingface) | ✅ | ✅ | ✅ | ✅ | 🛑 | ✅ | Compared to `zyphyr-7b-alpha`, `zyphyr-7b-beta` appears to perform well as an agent however it fails for Pydantic Programs | -| [stablelm-zephyr-3b](https://colab.research.google.com/drive/1USBIOs4yUkjOcxTKBr7onjlzATE-974T?usp=sharing) (huggingface) | ✅ | ⚠️ | ✅ | 🛑 | ✅ | 🛑 | stablelm-zephyr-3b does surprisingly well, especially for structured outputs (surpassing much larger models). It struggles a bit with text-to-SQL and tool use. | -| [starling-lm-7b-alpha](https://colab.research.google.com/drive/1Juk073EWt2utxHZY84q_NfVT9xFwppf8?usp=sharing) (huggingface) | ✅ | 🛑 | ✅ | ⚠️ | ✅ | ✅ | starling-lm-7b-alpha does surprisingly well on agent tasks. It struggles a bit with routing, and is inconsistent with text-to-SQL. | +| [llama2-chat-7b 4bit](https://colab.research.google.com/drive/1ByiIaBqCwbH9QXJOQWqOfUdsq4LEFq-g?usp=sharing) (huggingface) | ✅ | 🛑 | 🛑 | 🛑 | 🛑 | ⚠️ | Llama2 seems to be quite chatty, which makes parsing structured outputs difficult. Fine-tuning and prompt engineering likely required for better performance on structured outputs. | +| [llama2-13b-chat](https://colab.research.google.com/drive/1dpIv3iYQCV4OBB8z2ZRS7y4wUfsfNlO3?usp=sharing) (replicate) | ✅ | ✅ | 🛑 | ✅ | 🛑 | 🛑 | Our ReAct prompt expects structured outputs, which llama-13b struggles at | +| [llama2-70b-chat](https://colab.research.google.com/drive/11h_Av5RG3tGjuOrZ-VKifd9UzcRPeN1J?usp=sharing) (replicate) | ✅ | ✅ | ✅ | ✅ | 🛑 | ⚠️ | There are still some issues with parsing structured outputs, especially with pydantic programs. | +| [Mistral-7B-instruct-v0.1 4bit](https://colab.research.google.com/drive/1-f5v48TnX5rGdaMdWTr8XsjTGrWZ6Q7Y?usp=sharing) (huggingface) | ✅ | 🛑 | 🛑 | ⚠️ | ⚠️ | ⚠️ | Mistral seems slightly more reliable for structured outputs compared to Llama2. Likely with some prompt engineering, it may do better. 
| +| [zephyr-7b-alpha](https://colab.research.google.com/drive/1asitB49g9LMGrlODgY2J-g_xRExRM_ud?usp=sharing) (huggingface) | ✅ | ✅ | ✅ | ✅ | ✅ | ⚠️ | Overall, `zephyr-7b-alpha` appears to be more reliable than other open-source models of this size. Although it still hallucinates a bit, especially as an agent. | +| [zephyr-7b-beta](https://colab.research.google.com/drive/1C55IGyJNDe14DsHkAIIpIjn76NvK5pc1?usp=sharing) (huggingface) | ✅ | ✅ | ✅ | ✅ | 🛑 | ✅ | Compared to `zephyr-7b-alpha`, `zephyr-7b-beta` appears to perform well as an agent however it fails for Pydantic Programs | +| [stablelm-zephyr-3b](https://colab.research.google.com/drive/1X_hEUkV62wHmMty3tNLIfJtp4IC6QNYN?usp=sharing) (huggingface) | ✅ | ⚠️ | ✅ | 🛑 | ✅ | 🛑 | stablelm-zephyr-3b does surprisingly well, especially for structured outputs (surpassing much larger models). It struggles a bit with text-to-SQL and tool use. | +| [starling-lm-7b-alpha](https://colab.research.google.com/drive/1z2tZMr4M9wBFU6YX8fvAZ7WLTa3tWKEm?usp=sharing) (huggingface) | ✅ | 🛑 | ✅ | ⚠️ | ✅ | ✅ | starling-lm-7b-alpha does surprisingly well on agent tasks. It struggles a bit with routing, and is inconsistent with text-to-SQL. | ## Modules diff --git a/docs/module_guides/models/multi_modal.md b/docs/module_guides/models/multi_modal.md index 16b09e3bb4df8..5e92d596423f3 100644 --- a/docs/module_guides/models/multi_modal.md +++ b/docs/module_guides/models/multi_modal.md @@ -148,7 +148,7 @@ Below table lists some vector stores supporting Multi-Modal use cases. Our Llama ## Multi-Modal LLM Modules -We support integrations with GPT4-V, CLIP (OpenAI), BLIP (Salesforce), and Replicate (LLaVA, Fuyu-8B, MiniGPT-4, CogVLM), and more. +We support integrations with GPT4-V, Anthropic (Opus, Sonnet), Gemini (Google), CLIP (OpenAI), BLIP (Salesforce), and Replicate (LLaVA, Fuyu-8B, MiniGPT-4, CogVLM), and more. 
```{toctree} --- @@ -160,6 +160,7 @@ maxdepth: 1 /examples/multi_modal/multi_modal_pydantic.ipynb /examples/multi_modal/gpt4v_experiments_cot.ipynb /examples/multi_modal/llava_multi_modal_tesla_10q.ipynb +/examples/multi_modal/anthropic_multi_modal.ipynb ``` ## Multi-Modal Retrieval Augmented Generation diff --git a/docs/module_guides/models/prompts.md b/docs/module_guides/models/prompts.md index 1f9d4468e8081..b5810704c1175 100644 --- a/docs/module_guides/models/prompts.md +++ b/docs/module_guides/models/prompts.md @@ -5,9 +5,9 @@ Prompting is the fundamental input that gives LLMs their expressive power. LlamaIndex uses prompts to build the index, do insertion, perform traversal during querying, and to synthesize the final answer. -LlamaIndex uses a set of [default prompt templates](https://github.com/jerryjliu/llama_index/blob/main/llama_index/prompts/default_prompts.py) that work well out of the box. +LlamaIndex uses a set of [default prompt templates](https://github.com/run-llama/llama_index/blob/main/llama-index-core/llama_index/core/prompts/default_prompts.py) that work well out of the box. -In addition, there are some prompts written and used specifically for chat models like `gpt-3.5-turbo` [here](https://github.com/jerryjliu/llama_index/blob/main/llama_index/prompts/chat_prompts.py). +In addition, there are some prompts written and used specifically for chat models like `gpt-3.5-turbo` [here](https://github.com/run-llama/llama_index/blob/main/llama-index-core/llama_index/core/prompts/chat_prompts.py). Users may also provide their own prompt templates to further customize the behavior of the framework. The best method for customizing is copying the default prompt from the link above, and using that as the base for any modifications. 
diff --git a/docs/module_guides/observability/callbacks/root.md b/docs/module_guides/observability/callbacks/root.md index b71a037ae14a4..11bd0093c93e4 100644 --- a/docs/module_guides/observability/callbacks/root.md +++ b/docs/module_guides/observability/callbacks/root.md @@ -31,6 +31,7 @@ You can implement your own callback to track and trace these events, or use an e Currently supported callbacks are as follows: +- [LangfuseCallbackHandler](/examples/callbacks/LangfuseCallbackHandler.ipynb) -> Tracking of events and traces using the open-source platform Langfuse. More details are in the linked notebook or in the [Langfuse docs](https://langfuse.com/docs) - [TokenCountingHandler](/examples/callbacks/TokenCountingHandler.ipynb) -> Flexible token counting for prompt, completion, and embedding token usage. See [the migration details](/module_guides/observability/callbacks/token_counting_migration.md) - [LlamaDebugHanlder](/examples/callbacks/LlamaDebugHandler.ipynb) -> Basic tracking and tracing for events. Example usage can be found in the notebook below. - [WandbCallbackHandler](/examples/callbacks/WandbCallbackHandler.ipynb) -> Tracking of events and traces using the Wandb Prompts frontend. More details are in the notebook below or at [Wandb](https://docs.wandb.ai/guides/prompts/quickstart) @@ -43,6 +44,7 @@ Currently supported callbacks are as follows: maxdepth: 1 hidden: --- +/examples/callbacks/LangfuseCallbackHandler.ipynb /examples/callbacks/TokenCountingHandler.ipynb /examples/callbacks/LlamaDebugHandler.ipynb /examples/callbacks/WandbCallbackHandler.ipynb diff --git a/docs/module_guides/observability/observability.md b/docs/module_guides/observability/observability.md index 48ac5f98bd897..6a419dee79e18 100644 --- a/docs/module_guides/observability/observability.md +++ b/docs/module_guides/observability/observability.md @@ -50,6 +50,34 @@ llama_index.core.set_global_handler("simple") We offer a rich set of integrations with our partners. 
A short description + usage pattern, and guide is provided for each partner. +### Langfuse + +[Langfuse](https://langfuse.com/docs) is an open source LLM engineering platform to help teams collaboratively debug, analyze and iterate on their LLM Applications. With the Langfuse integration, you can seamlessly track and monitor performance, traces, and metrics of your LlamaIndex application. Detailed traces of the LlamaIndex context augmentation and the LLM querying processes are captured and can be inspected directly in the Langfuse UI. + +#### Usage Pattern + +```python +from llama_index.core import set_global_handler + +# Make sure you've installed the 'llama-index-callbacks-langfuse' integration package. + +# NOTE: Set your environment variables 'LANGFUSE_SECRET_KEY', 'LANGFUSE_PUBLIC_KEY' and 'LANGFUSE_HOST' +# as shown in your langfuse.com project settings. + +set_global_handler("langfuse") +``` + +#### Guides + +```{toctree} +--- +maxdepth: 1 +--- +/examples/callbacks/LangfuseCallbackHandler.ipynb +``` + +![langfuse-tracing](https://static.langfuse.com/llamaindex-langfuse-docs.gif) + ### DeepEval [DeepEval (by Confident AI)](https://github.com/confident-ai/deepeval) is an open-source evaluation framework for LLM applications. As you "unit test" your LLM app using DeepEval's 14+ default metrics it currently offers (summarization, hallucination, answer relevancy, faithfulness, RAGAS, etc.), you can debug failing test cases through this tracing integration with LlamaIndex, or debug unsatisfactory evaluations in **production** through DeepEval's hosted evaluation platform, [Confident AI](https://confident-ai.com), that runs referenceless evaluations in production. 
diff --git a/docs/module_guides/querying/node_postprocessors/node_postprocessors.md b/docs/module_guides/querying/node_postprocessors/node_postprocessors.md index 86d78d23799f4..255513a03e77b 100644 --- a/docs/module_guides/querying/node_postprocessors/node_postprocessors.md +++ b/docs/module_guides/querying/node_postprocessors/node_postprocessors.md @@ -127,6 +127,22 @@ postprocessor.postprocess_nodes(nodes) Full notebook guide is available [her for Gatsby](/examples/node_postprocessor/LLMReranker-Gatsby.ipynb) and [here for Lyft 10K documents](/examples/node_postprocessor/LLMReranker-Lyft-10k.ipynb). +## JinaRerank + +Uses the "Jina ReRank" functionality to re-order nodes, and returns the top N nodes. + +```python +from llama_index.postprocessor.jinaai_rerank import JinaRerank + +postprocessor = JinaRerank( + top_n=2, model="jina-reranker-v1-base-en", api_key="YOUR JINA API KEY" +) + +postprocessor.postprocess_nodes(nodes) +``` + +Full notebook guide is available [here](/examples/node_postprocessor/JinaRerank.ipynb). + ## FixedRecencyPostprocessor This postproccesor returns the top K nodes sorted by date. This assumes there is a `date` field to parse in the metadata of each node. @@ -254,7 +270,48 @@ postprocessor = RankGPTRerank(top_n=3, llm=OpenAI(model="gpt-3.5-turbo-16k")) postprocessor.postprocess_nodes(nodes) ``` -Full notebook guide is available [her for Van Gogh](/examples/node_postprocessor/rankGPT.ipynb). +Full notebook guide is available [here](/examples/node_postprocessor/rankGPT.ipynb). + +## Colbert Reranker + +Uses Colbert V2 model as a reranker to rerank documents according to the fine-grained similarity between query tokens and passage tokens. Returns the top N ranked nodes. 
+ +```python +from llama_index.postprocessor.colbert_rerank import ColbertRerank + +colbert_reranker = ColbertRerank( + top_n=5, + model="colbert-ir/colbertv2.0", + tokenizer="colbert-ir/colbertv2.0", + keep_retrieval_score=True, +) + +query_engine = index.as_query_engine( + similarity_top_k=10, + node_postprocessors=[colbert_reranker], +) +response = query_engine.query( + query_str, +) +``` + +Full notebook guide is available [here](/examples/node_postprocessor/ColbertRerank.ipynb). + +## Jina Reranker + +Uses models from [jina](https://jina.ai/) to rerank documents. Returns the top N ranked nodes. + +```python +from llama_index.postprocessor.jinaai_rerank import JinaRerank + +jina_rerank = JinaRerank(api_key=api_key, top_n=2) + +query_engine = index.as_query_engine( + similarity_top_k=10, node_postprocessors=[jina_rerank] +) +``` + +Full notebook guide is available [here](/examples/node_postprocessor/JinaRerank.ipynb). ## All Notebooks @@ -273,4 +330,7 @@ maxdepth: 1 /examples/node_postprocessor/MetadataReplacementDemo.ipynb /examples/node_postprocessor/LongContextReorder.ipynb /examples/node_postprocessor/rankGPT.ipynb +/examples/node_postprocessor/ColbertRerank.ipynb +/examples/node_postprocessor/JinaRerank.ipynb +/cookbooks/mixedbread_reranker.ipynb ``` diff --git a/docs/module_guides/querying/retriever/retrievers.md b/docs/module_guides/querying/retriever/retrievers.md index ef152dfb9c014..2c8216582123a 100644 --- a/docs/module_guides/querying/retriever/retrievers.md +++ b/docs/module_guides/querying/retriever/retrievers.md @@ -84,6 +84,7 @@ maxdepth: 1 /examples/managed/GoogleDemo.ipynb /examples/managed/vectaraDemo.ipynb /examples/managed/zcpDemo.ipynb +VideoDB Retriever ``` ### Other Retrievers diff --git a/docs/module_guides/storing/vector_stores.md b/docs/module_guides/storing/vector_stores.md index c00873909697f..70e8f8e24b969 100644 --- a/docs/module_guides/storing/vector_stores.md +++ b/docs/module_guides/storing/vector_stores.md @@ -13,44 +13,45 @@ 
They can be persisted to (and loaded from) disk by calling `vector_store.persist LlamaIndex supports over 20 different vector store options. We are actively adding more integrations and improving feature coverage for each. -| Vector Store | Type | Metadata Filtering | Hybrid Search | Delete | Store Documents | Async | -| ------------------------ | ------------------- | ------------------ | ------------- | ------ | --------------- | ----- | -| Apache Cassandra® | self-hosted / cloud | ✓ | | ✓ | ✓ | | -| Astra DB | cloud | ✓ | | ✓ | ✓ | | -| Azure Cognitive Search | cloud | | ✓ | ✓ | ✓ | | -| Azure CosmosDB MongoDB | cloud | | | ✓ | ✓ | | -| ChatGPT Retrieval Plugin | aggregator | | | ✓ | ✓ | | -| Chroma | self-hosted | ✓ | | ✓ | ✓ | | -| DashVector | cloud | ✓ | ✓ | ✓ | ✓ | | -| Deeplake | self-hosted / cloud | ✓ | | ✓ | ✓ | | -| DocArray | aggregator | ✓ | | ✓ | ✓ | | -| DynamoDB | cloud | | | ✓ | | | -| Elasticsearch | self-hosted / cloud | ✓ | ✓ | ✓ | ✓ | ✓ | -| FAISS | in-memory | | | | | | -| txtai | in-memory | | | | | | -| Jaguar | self-hosted / cloud | ✓ | ✓ | ✓ | ✓ | | -| LanceDB | cloud | ✓ | | ✓ | ✓ | | -| Lantern | self-hosted / cloud | ✓ | ✓ | ✓ | ✓ | ✓ | -| Metal | cloud | ✓ | | ✓ | ✓ | | -| MongoDB Atlas | self-hosted / cloud | ✓ | | ✓ | ✓ | | -| MyScale | cloud | ✓ | ✓ | ✓ | ✓ | | -| Milvus / Zilliz | self-hosted / cloud | ✓ | | ✓ | ✓ | | -| Neo4jVector | self-hosted / cloud | | | ✓ | ✓ | | -| OpenSearch | self-hosted / cloud | ✓ | ✓ | ✓ | ✓ | ✓ | -| Pinecone | cloud | ✓ | ✓ | ✓ | ✓ | | -| Postgres | self-hosted / cloud | ✓ | ✓ | ✓ | ✓ | ✓ | -| pgvecto.rs | self-hosted / cloud | ✓ | ✓ | ✓ | ✓ | | -| Qdrant | self-hosted / cloud | ✓ | ✓ | ✓ | ✓ | ✓ | -| Redis | self-hosted / cloud | ✓ | | ✓ | ✓ | | -| Simple | in-memory | ✓ | | ✓ | | | -| SingleStore | self-hosted / cloud | ✓ | | ✓ | ✓ | | -| Supabase | self-hosted / cloud | ✓ | | ✓ | ✓ | | -| Tair | cloud | ✓ | | ✓ | ✓ | | -| TencentVectorDB | cloud | ✓ | ✓ | ✓ | ✓ | | -| Timescale | | ✓ | | ✓ | ✓ | 
✓ | -| Typesense | self-hosted / cloud | ✓ | | ✓ | ✓ | | -| Upstash | cloud | | | | ✓ | | -| Weaviate | self-hosted / cloud | ✓ | ✓ | ✓ | ✓ | | +| Vector Store | Type | Metadata Filtering | Hybrid Search | Delete | Store Documents | Async | +| ------------------------ | ----------------------- | ------------------ | ------------- | ------ | --------------- | ----- | +| Apache Cassandra® | self-hosted / cloud | ✓ | | ✓ | ✓ | | +| Astra DB | cloud | ✓ | | ✓ | ✓ | | +| Azure Cognitive Search | cloud | | ✓ | ✓ | ✓ | | +| Azure CosmosDB MongoDB | cloud | | | ✓ | ✓ | | +| ChatGPT Retrieval Plugin | aggregator | | | ✓ | ✓ | | +| Chroma | self-hosted | ✓ | | ✓ | ✓ | | +| DashVector | cloud | ✓ | ✓ | ✓ | ✓ | | +| Deeplake | self-hosted / cloud | ✓ | | ✓ | ✓ | | +| DocArray | aggregator | ✓ | | ✓ | ✓ | | +| DuckDB | in-memory / self-hosted | ✓ | | ✓ | ✓ | | +| DynamoDB | cloud | | | ✓ | | | +| Elasticsearch | self-hosted / cloud | ✓ | ✓ | ✓ | ✓ | ✓ | +| FAISS | in-memory | | | | | | +| txtai | in-memory | | | | | | +| Jaguar | self-hosted / cloud | ✓ | ✓ | ✓ | ✓ | | +| LanceDB | cloud | ✓ | | ✓ | ✓ | | +| Lantern | self-hosted / cloud | ✓ | ✓ | ✓ | ✓ | ✓ | +| Metal | cloud | ✓ | | ✓ | ✓ | | +| MongoDB Atlas | self-hosted / cloud | ✓ | | ✓ | ✓ | | +| MyScale | cloud | ✓ | ✓ | ✓ | ✓ | | +| Milvus / Zilliz | self-hosted / cloud | ✓ | | ✓ | ✓ | | +| Neo4jVector | self-hosted / cloud | | | ✓ | ✓ | | +| OpenSearch | self-hosted / cloud | ✓ | ✓ | ✓ | ✓ | ✓ | +| Pinecone | cloud | ✓ | ✓ | ✓ | ✓ | | +| Postgres | self-hosted / cloud | ✓ | ✓ | ✓ | ✓ | ✓ | +| pgvecto.rs | self-hosted / cloud | ✓ | ✓ | ✓ | ✓ | | +| Qdrant | self-hosted / cloud | ✓ | ✓ | ✓ | ✓ | ✓ | +| Redis | self-hosted / cloud | ✓ | | ✓ | ✓ | | +| Simple | in-memory | ✓ | | ✓ | | | +| SingleStore | self-hosted / cloud | ✓ | | ✓ | ✓ | | +| Supabase | self-hosted / cloud | ✓ | | ✓ | ✓ | | +| Tair | cloud | ✓ | | ✓ | ✓ | | +| TencentVectorDB | cloud | ✓ | ✓ | ✓ | ✓ | | +| Timescale | | ✓ | | ✓ | ✓ | ✓ | +| Typesense | 
self-hosted / cloud | ✓ | | ✓ | ✓ | | +| Upstash | cloud | | | | ✓ | | +| Weaviate | self-hosted / cloud | ✓ | ✓ | ✓ | ✓ | | For more details, see [Vector Store Integrations](/community/integrations/vector_stores.md). @@ -70,6 +71,7 @@ maxdepth: 1 /examples/vector_stores/DeepLakeIndexDemo.ipynb /examples/vector_stores/DocArrayHnswIndexDemo.ipynb /examples/vector_stores/DocArrayInMemoryIndexDemo.ipynb +/examples/vector_stores/DuckDBDemo.ipynb /examples/vector_stores/EpsillaIndexDemo.ipynb /examples/vector_stores/JaguarIndexDemo.ipynb /examples/vector_stores/LanceDBIndexDemo.ipynb diff --git a/docs/presentations/materials/2024-02-28-rag-bootcamp-vector-institute.ipynb b/docs/presentations/materials/2024-02-28-rag-bootcamp-vector-institute.ipynb index 4524113a39298..073e5a818b24e 100644 --- a/docs/presentations/materials/2024-02-28-rag-bootcamp-vector-institute.ipynb +++ b/docs/presentations/materials/2024-02-28-rag-bootcamp-vector-institute.ipynb @@ -121,7 +121,7 @@ "\n", "3. Declaration of Research Assessment: In academia, this could refer to a statement or policy regarding how research is evaluated.\n", "\n", - "4. Digital on-Ramp's Assessment: In the field of digital technology, this could refer to an assessment tool used by the Digital On-Ramps program.\n", + "4. 
Digital On-Ramp's Assessment: In the field of digital technology, this could refer to an assessment tool used by the Digital On-Ramps program.\n", "\n", "Please provide more context for a more accurate definition.\n" ] @@ -371,7 +371,7 @@ "source": [ "## In Summary\n", "\n", - "- LLMs as powerful as they are, don't perform too well with knowledge-intensive tasks (domain specific, updated data, long-tail)\n", + "- LLMs as powerful as they are, don't perform too well with knowledge-intensive tasks (domain-specific, updated data, long-tail)\n", "- Context augmentation has been shown (in a few studies) to outperform LLMs without augmentation\n", "- In this notebook, we showed one such example that follows that pattern." ] diff --git a/docs/use_cases/chatbots.md b/docs/use_cases/chatbots.md index f2b37b6320b31..727884c2b1bb4 100644 --- a/docs/use_cases/chatbots.md +++ b/docs/use_cases/chatbots.md @@ -10,7 +10,7 @@ Here are some relevant resources: - [create-llama](https://blog.llamaindex.ai/create-llama-a-command-line-tool-to-generate-llamaindex-apps-8f7683021191), a command line tool that generates a full-stack chatbot application for you - [SECinsights.ai](https://www.secinsights.ai/), an open-source application that uses LlamaIndex to build a chatbot that answers questions about SEC filings - [RAGs](https://blog.llamaindex.ai/introducing-rags-your-personalized-chatgpt-experience-over-your-data-2b9d140769b1), a project inspired by OpenAI's GPTs that lets you build a low-code chatbot over your data using Streamlit -- Our [OpenAI agents](/module_guides/deploying/agents/modules.md) are all chat bots in nature +- Our [OpenAI agents](/module_guides/deploying/agents/modules.md) are all chatbots in nature ## External sources diff --git a/docs/use_cases/multimodal.md b/docs/use_cases/multimodal.md index 5aa7fba00a400..42c5e837439b6 100644 --- a/docs/use_cases/multimodal.md +++ b/docs/use_cases/multimodal.md @@ -1,10 +1,10 @@ # Multi-modal -LlamaIndex offers capabilities to 
not only build language-based applications, but also **multi-modal** applications - combining language and images. +LlamaIndex offers capabilities to not only build language-based applications but also **multi-modal** applications - combining language and images. ## Types of Multi-modal Use Cases -This space is actively being explored right now, but there are some fascinating use cases popping up. +This space is actively being explored right now, but some fascinating use cases are popping up. ### RAG (Retrieval Augmented Generation) @@ -73,7 +73,7 @@ maxdepth: 1 These sections show comparisons between different multi-modal models for different use cases. -### LLaVa-13, Fuyu-8B and MiniGPT-4 Multi-Modal LLM Models Comparison for Image Reasoning +### LLaVa-13, Fuyu-8B, and MiniGPT-4 Multi-Modal LLM Models Comparison for Image Reasoning These notebooks show how to use different Multi-Modal LLM models for image understanding/reasoning. The various model inferences are supported by Replicate or OpenAI GPT4-V API. We compared several popular Multi-Modal LLMs: @@ -97,7 +97,7 @@ GPT4-V: ### Simple Evaluation of Multi-Modal RAG -In this notebook guide, we'll demonstrate how to evaluate a Multi-Modal RAG system. As in the text-only case, we will consider the evaluation of Retrievers and Generators separately. As we alluded in our blog on the topic of Evaluating Multi-Modal RAGs, our approach here involves the application of adapted versions of the usual techniques for evaluating both Retriever and Generator (used for the text-only case). These adapted versions are part of the llama-index library (i.e., evaluation module), and this notebook will walk you through how you can apply them to your evaluation use-cases. +In this notebook guide, we'll demonstrate how to evaluate a Multi-Modal RAG system. As in the text-only case, we will consider the evaluation of Retrievers and Generators separately. 
As we alluded to in our blog on the topic of Evaluating Multi-Modal RAGs, our approach here involves the application of adapted versions of the usual techniques for evaluating both Retriever and Generator (used for the text-only case). These adapted versions are part of the llama-index library (i.e., evaluation module), and this notebook will walk you through how you can apply them to your evaluation use cases. ```{toctree} --- diff --git a/docs/use_cases/q_and_a/rag_cli.md b/docs/use_cases/q_and_a/rag_cli.md index 040eb93166ef6..06da5db3aaa3f 100644 --- a/docs/use_cases/q_and_a/rag_cli.md +++ b/docs/use_cases/q_and_a/rag_cli.md @@ -112,6 +112,8 @@ import os from llama_index.core.ingestion import IngestionPipeline, IngestionCache from llama_index.core.query_pipeline import QueryPipeline from llama_index.core.storage.docstore import SimpleDocumentStore +from llama_index.cli.rag import RagCLI + # optional, set any API keys your script may need (perhaps using python-dotenv library instead) os.environ["OPENAI_API_KEY"] = "sk-xxx" diff --git a/llama-datasets/10k/uber_2021/BUILD b/llama-datasets/10k/uber_2021/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-datasets/10k/uber_2021/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-datasets/10k/uber_2021/README.md b/llama-datasets/10k/uber_2021/README.md new file mode 100644 index 0000000000000..8edf323890a03 --- /dev/null +++ b/llama-datasets/10k/uber_2021/README.md @@ -0,0 +1,61 @@ +# Uber 10K Dataset 2021 + +## CLI Usage + +You can download `llamadatasets` directly using `llamaindex-cli`, which comes installed with the `llama-index` python package: + +```bash +llamaindex-cli download-llamadataset Uber10KDataset2021 --download-dir ./data +``` + +You can then inspect the files at `./data`. 
When you're ready to load the data into +python, you can use the below snippet of code: + +```python +from llama_index.core import SimpleDirectoryReader +from llama_index.core.llama_dataset import LabelledRagDataset + +rag_dataset = LabelledRagDataset.from_json("./data/rag_dataset.json") +documents = SimpleDirectoryReader(input_dir="./data/source_files").load_data() +``` + +## Code Usage + +You can download the dataset to a directory, say `./data` directly in Python +as well. From there, you can use the convenient `RagEvaluatorPack` llamapack to +run your own LlamaIndex RAG pipeline with the `llamadataset`. + +```python +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + +# download and install dependencies for benchmark dataset +rag_dataset, documents = download_llama_dataset("Uber10KDataset2021", "./data") + +# build basic RAG system +index = VectorStoreIndex.from_documents(documents=documents) +query_engine = index.as_query_engine() + +# evaluate using the RagEvaluatorPack +RagEvaluatorPack = download_llama_pack( + "RagEvaluatorPack", "./rag_evaluator_pack" +) +rag_evaluator_pack = RagEvaluatorPack( + rag_dataset=rag_dataset, + query_engine=query_engine, + show_progress=True, +) + +############################################################################ +# NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # +# then you'll need to use different batch_size and sleep_time_in_seconds. # +# For Usage Tier 1, settings that seemed to work well were batch_size=5, # +# and sleep_time_in_seconds=15 (as of December 2023.) 
# +############################################################################ + +benchmark_df = await rag_evaluator_pack.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # seconds to sleep before making an api call +) +``` diff --git a/llama-datasets/10k/uber_2021/card.json b/llama-datasets/10k/uber_2021/card.json new file mode 100644 index 0000000000000..a6fb854c1eafc --- /dev/null +++ b/llama-datasets/10k/uber_2021/card.json @@ -0,0 +1,27 @@ +{ + "name": "Uber 10K Dataset 2021", + "className": "LabelledRagDataset", + "description": "A labelled RAG dataset based on the Uber 2021 10K document, consisting of queries, reference answers, and reference contexts.", + "numberObservations": 822, + "containsExamplesByHumans": false, + "containsExamplesByAi": true, + "sourceUrls": [], + "baselines": [ + { + "name": "llamaindex", + "config": { + "chunkSize": 1024, + "llm": "gpt-3.5-turbo", + "similarityTopK": 2, + "embedModel": "text-embedding-ada-002" + }, + "metrics": { + "contextSimilarity": 0.943, + "correctness": 3.874, + "faithfulness": 0.667, + "relevancy": 0.844 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/10k/uber_2021/llamaindex_baseline.py" + } + ] +} diff --git a/llama-datasets/10k/uber_2021/llamaindex_baseline.py b/llama-datasets/10k/uber_2021/llamaindex_baseline.py new file mode 100644 index 0000000000000..8af8eb51b536a --- /dev/null +++ b/llama-datasets/10k/uber_2021/llamaindex_baseline.py @@ -0,0 +1,41 @@ +import asyncio + +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex +from llama_index.llms.openai import OpenAI + + +async def main(): + # DOWNLOAD LLAMADATASET + rag_dataset, documents = download_llama_dataset( + "Uber10KDataset2021", "./uber10k_2021_dataset" + ) + + # BUILD BASIC RAG PIPELINE + index =
VectorStoreIndex.from_documents(documents=documents) + query_engine = index.as_query_engine() + + # EVALUATE WITH PACK + RagEvaluatorPack = download_llama_pack("RagEvaluatorPack", "./pack_stuff") + judge_llm = OpenAI(model="gpt-3.5-turbo") + rag_evaluator = RagEvaluatorPack( + query_engine=query_engine, rag_dataset=rag_dataset, judge_llm=judge_llm + ) + + ############################################################################ + # NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # + # then you'll need to use different batch_size and sleep_time_in_seconds. # + # For Usage Tier 1, settings that seemed to work well were batch_size=5, # + # and sleep_time_in_seconds=15 (as of December 2023.) # + ############################################################################ + benchmark_df = await rag_evaluator.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # number of seconds to sleep before making an api call + ) + print(benchmark_df) + + +if __name__ == "__main__": + loop = asyncio.get_event_loop() + loop.run_until_complete(main()) # call main() so a coroutine object is passed diff --git a/llama-datasets/__init__.py b/llama-datasets/__init__.py new file mode 100644 index 0000000000000..e69de29bb2d1d diff --git a/llama-datasets/blockchain_solana/BUILD b/llama-datasets/blockchain_solana/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-datasets/blockchain_solana/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-datasets/blockchain_solana/README.md b/llama-datasets/blockchain_solana/README.md new file mode 100644 index 0000000000000..cebaed8787417 --- /dev/null +++ b/llama-datasets/blockchain_solana/README.md @@ -0,0 +1,61 @@ +# Blockchain Solana Dataset + +## CLI Usage + +You can download `llamadatasets` directly using `llamaindex-cli`, which comes installed with the `llama-index` python package: + +```bash +llamaindex-cli download-llamadataset BlockchainSolanaDataset --download-dir ./data +``` +
+You can then inspect the files at `./data`. When you're ready to load the data into +python, you can use the below snippet of code: + +```python +from llama_index.core import SimpleDirectoryReader +from llama_index.core.llama_dataset import LabelledRagDataset + +rag_dataset = LabelledRagDataset.from_json("./data/rag_dataset.json") +documents = SimpleDirectoryReader(input_dir="./data/source_files").load_data() +``` + +## Code Usage + +You can download the dataset to a directory, say `./data` directly in Python +as well. From there, you can use the convenient `RagEvaluatorPack` llamapack to +run your own LlamaIndex RAG pipeline with the `llamadataset`. + +```python +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + +# download and install dependencies for benchmark dataset +rag_dataset, documents = download_llama_dataset( + "BlockchainSolanaDataset", "./data" +) + +# build basic RAG system +index = VectorStoreIndex.from_documents(documents=documents) +query_engine = index.as_query_engine() + +# evaluate using the RagEvaluatorPack +RagEvaluatorPack = download_llama_pack( + "RagEvaluatorPack", "./rag_evaluator_pack" +) +rag_evaluator_pack = RagEvaluatorPack( + rag_dataset=rag_dataset, query_engine=query_engine +) + +############################################################################ +# NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # +# then you'll need to use different batch_size and sleep_time_in_seconds. # +# For Usage Tier 1, settings that seemed to work well were batch_size=5, # +# and sleep_time_in_seconds=15 (as of December 2023.) 
# +############################################################################ + +benchmark_df = await rag_evaluator_pack.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # seconds to sleep before making an api call +) +``` diff --git a/llama-datasets/blockchain_solana/card.json b/llama-datasets/blockchain_solana/card.json new file mode 100644 index 0000000000000..d2dcba74d5de5 --- /dev/null +++ b/llama-datasets/blockchain_solana/card.json @@ -0,0 +1,27 @@ +{ + "name": "Blockchain Solana", + "className": "LabelledRagDataset", + "description": "A labelled RAG dataset based off an article, From Bitcoin to Solana – Innovating Blockchain towards Enterprise Applications, by Xiangyu Li, Xinyu Wang, Tingli Kong, Junhao Zheng and Min Luo, consisting of queries, reference answers, and reference contexts.", + "numberObservations": 58, + "containsExamplesByHumans": false, + "containsExamplesByAi": true, + "sourceUrls": ["https://arxiv.org/abs/2207.05240"], + "baselines": [ + { + "name": "llamaindex", + "config": { + "chunkSize": 1024, + "llm": "gpt-3.5-turbo", + "similarityTopK": 2, + "embedModel": "text-embedding-ada-002" + }, + "metrics": { + "contextSimilarity": 0.945, + "correctness": 4.457, + "faithfulness": 1.0, + "relevancy": 1.0 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/blockchain_solana/llamaindex_baseline.py" + } + ] +} diff --git a/llama-datasets/blockchain_solana/llamaindex_baseline.py b/llama-datasets/blockchain_solana/llamaindex_baseline.py new file mode 100644 index 0000000000000..0d9979c490dde --- /dev/null +++ b/llama-datasets/blockchain_solana/llamaindex_baseline.py @@ -0,0 +1,37 @@ +import asyncio + +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + + +async def main(): + # DOWNLOAD LLAMADATASET + rag_dataset, documents =
download_llama_dataset( + "BlockchainSolanaDataset", "./blockchain_solana" + ) + + # BUILD BASIC RAG PIPELINE + index = VectorStoreIndex.from_documents(documents=documents) + query_engine = index.as_query_engine() + + # EVALUATE WITH PACK + RagEvaluatorPack = download_llama_pack("RagEvaluatorPack", "./pack_stuff") + rag_evaluator = RagEvaluatorPack(query_engine=query_engine, rag_dataset=rag_dataset) + + ############################################################################ + # NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # + # then you'll need to use different batch_size and sleep_time_in_seconds. # + # For Usage Tier 1, settings that seemed to work well were batch_size=5, # + # and sleep_time_in_seconds=15 (as of December 2023.) # + ############################################################################ + benchmark_df = await rag_evaluator.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # number of seconds to sleep before making an api call + ) + print(benchmark_df) + + +if __name__ == "__main__": + loop = asyncio.get_event_loop() + loop.run_until_complete(main()) # call main() so a coroutine object is passed diff --git a/llama-datasets/braintrust_coda/BUILD b/llama-datasets/braintrust_coda/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-datasets/braintrust_coda/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-datasets/braintrust_coda/README.md b/llama-datasets/braintrust_coda/README.md new file mode 100644 index 0000000000000..96bedb61f87f8 --- /dev/null +++ b/llama-datasets/braintrust_coda/README.md @@ -0,0 +1,65 @@ +# Braintrust Coda Help Desk Dataset + +[![Braintrust (346 x 40 px)](https://github.com/nerdai/llama-hub/assets/92402603/a99bddf3-0eab-42e8-8c53-8432da8299d3)](https://www.braintrustdata.com/) + +_This dataset was kindly provided by Kenny Wong and Ankur Goyal._ + +## CLI Usage + +You can download `llamadatasets` directly using `llamaindex-cli`, which comes
installed with the `llama-index` python package: + +```bash +llamaindex-cli download-llamadataset BraintrustCodaHelpDeskDataset --download-dir ./data +``` + +You can then inspect the files at `./data`. When you're ready to load the data into +python, you can use the below snippet of code: + +```python +from llama_index.core import SimpleDirectoryReader +from llama_index.core.llama_dataset import LabelledRagDataset + +rag_dataset = LabelledRagDataset.from_json("./data/rag_dataset.json") +documents = SimpleDirectoryReader(input_dir="./data/source_files").load_data() +``` + +## Code Usage + +You can download the dataset to a directory, say `./data` directly in Python +as well. From there, you can use the convenient `RagEvaluatorPack` llamapack to +run your own LlamaIndex RAG pipeline with the `llamadataset`. + +```python +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + +# download and install dependencies for benchmark dataset +rag_dataset, documents = download_llama_dataset( + "BraintrustCodaHelpDeskDataset", "./data" +) + +# build basic RAG system +index = VectorStoreIndex.from_documents(documents=documents) +query_engine = index.as_query_engine() + +# evaluate using the RagEvaluatorPack +RagEvaluatorPack = download_llama_pack( + "RagEvaluatorPack", "./rag_evaluator_pack" +) +rag_evaluator_pack = RagEvaluatorPack( + rag_dataset=rag_dataset, query_engine=query_engine +) + +############################################################################ +# NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # +# then you'll need to use different batch_size and sleep_time_in_seconds. # +# For Usage Tier 1, settings that seemed to work well were batch_size=5, # +# and sleep_time_in_seconds=15 (as of December 2023.) 
# +############################################################################ + +benchmark_df = await rag_evaluator_pack.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # seconds to sleep before making an api call +) +``` diff --git a/llama-datasets/braintrust_coda/__init__.py b/llama-datasets/braintrust_coda/__init__.py new file mode 100644 index 0000000000000..e69de29bb2d1d diff --git a/llama-datasets/braintrust_coda/card.json b/llama-datasets/braintrust_coda/card.json new file mode 100644 index 0000000000000..6da7d2f45d7ce --- /dev/null +++ b/llama-datasets/braintrust_coda/card.json @@ -0,0 +1,29 @@ +{ + "name": "Braintrust Coda Help Desk", + "className": "LabelledRagDataset", + "description": "A list of automatically generated question/answer pairs from the Coda (https://coda.io/) help docs. This dataset is interesting because most models include Coda’s documentation as part of their training set, so you can baseline performance without RAG.", + "numberObservations": 100, + "containsExamplesByHumans": false, + "containsExamplesByAi": true, + "sourceUrls": [ + "https://gist.githubusercontent.com/wong-codaio/b8ea0e087f800971ca5ec9eef617273e/raw/39f8bd2ebdecee485021e20f2c1d40fd649a4c77/articles.json" + ], + "baselines": [ + { + "name": "llamaindex", + "config": { + "chunkSize": 1024, + "llm": "gpt-3.5-turbo", + "similarityTopK": 2, + "embedModel": "text-embedding-ada-002" + }, + "metrics": { + "contextSimilarity": 0.955, + "correctness": 4.32, + "faithfulness": 0.9, + "relevancy": 0.93 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/braintrust_coda/llamaindex_baseline.py" + } + ] +} diff --git a/llama-datasets/braintrust_coda/llamaindex_baseline.py b/llama-datasets/braintrust_coda/llamaindex_baseline.py new file mode 100644 index 0000000000000..13fd55153f03c --- /dev/null +++ b/llama-datasets/braintrust_coda/llamaindex_baseline.py @@ -0,0 +1,37 @@ +import asyncio + 
+from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + + +async def main(): + # DOWNLOAD LLAMADATASET + rag_dataset, documents = download_llama_dataset( + "BraintrustCodaHelpDeskDataset", "./braintrust_codahdd" + ) + + # BUILD BASIC RAG PIPELINE + index = VectorStoreIndex.from_documents(documents=documents) + query_engine = index.as_query_engine() + + # EVALUATE WITH PACK + RagEvaluatorPack = download_llama_pack("RagEvaluatorPack", "./pack_stuff") + rag_evaluator = RagEvaluatorPack(query_engine=query_engine, rag_dataset=rag_dataset) + + ############################################################################ + # NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # + # then you'll need to use different batch_size and sleep_time_in_seconds. # + # For Usage Tier 1, settings that seemed to work well were batch_size=5, # + # and sleep_time_in_seconds=15 (as of December 2023.) 
# + ############################################################################ + benchmark_df = await rag_evaluator.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # number of seconds to sleep before making an api call + ) + print(benchmark_df) + + +if __name__ == "__main__": + loop = asyncio.get_event_loop() + loop.run_until_complete(main()) # call main() so a coroutine object is passed diff --git a/llama-datasets/covidqa/BUILD b/llama-datasets/covidqa/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-datasets/covidqa/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-datasets/covidqa/README.md b/llama-datasets/covidqa/README.md new file mode 100644 index 0000000000000..1a725277534dc --- /dev/null +++ b/llama-datasets/covidqa/README.md @@ -0,0 +1,59 @@ +# Covid Qa Dataset + +## CLI Usage + +You can download `llamadatasets` directly using `llamaindex-cli`, which comes installed with the `llama-index` python package: + +```bash +llamaindex-cli download-llamadataset CovidQaDataset --download-dir ./data +``` + +You can then inspect the files at `./data`. When you're ready to load the data into +python, you can use the below snippet of code: + +```python +from llama_index.core import SimpleDirectoryReader +from llama_index.core.llama_dataset import LabelledRagDataset + +rag_dataset = LabelledRagDataset.from_json("./data/rag_dataset.json") +documents = SimpleDirectoryReader(input_dir="./data/source_files").load_data() +``` + +## Code Usage + +You can download the dataset to a directory, say `./data` directly in Python +as well. From there, you can use the convenient `RagEvaluatorPack` llamapack to +run your own LlamaIndex RAG pipeline with the `llamadataset`.
+ +```python +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + +# download and install dependencies for benchmark dataset +rag_dataset, documents = download_llama_dataset("CovidQaDataset", "./data") + +# build basic RAG system +index = VectorStoreIndex.from_documents(documents=documents) +query_engine = index.as_query_engine() + +# evaluate using the RagEvaluatorPack +RagEvaluatorPack = download_llama_pack( + "RagEvaluatorPack", "./rag_evaluator_pack" +) +rag_evaluator_pack = RagEvaluatorPack( + rag_dataset=rag_dataset, query_engine=query_engine, show_progress=True +) + +############################################################################ +# NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # +# then you'll need to use different batch_size and sleep_time_in_seconds. # +# For Usage Tier 1, settings that seemed to work well were batch_size=5, # +# and sleep_time_in_seconds=15 (as of December 2023.) # +############################################################################ + +benchmark_df = await rag_evaluator_pack.arun( + batch_size=40, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # seconds to sleep before making an api call +) +``` diff --git a/llama-datasets/covidqa/card.json b/llama-datasets/covidqa/card.json new file mode 100644 index 0000000000000..6e362e4a70f6f --- /dev/null +++ b/llama-datasets/covidqa/card.json @@ -0,0 +1,29 @@ +{ + "name": "Covid QA Dataset", + "className": "LabelledRagDataset", + "description": "A human-annotated RAG dataset consisting of over 300 question-answer pairs. This dataset represents a subset of the Covid-QA dataset available on Kaggle and authored by Xhlulu. It is a collection of frequently asked questions on COVID from various websites. 
This subset only considers the top 10 webpages containing the most question-answer pairs.", + "numberObservations": 316, + "containsExamplesByHumans": true, + "containsExamplesByAi": false, + "sourceUrls": [ + "https://www.kaggle.com/datasets/xhlulu/covidqa/?select=news.csv" + ], + "baselines": [ + { + "name": "llamaindex", + "config": { + "chunkSize": 1024, + "llm": "gpt-3.5-turbo", + "similarityTopK": 2, + "embedModel": "text-embedding-ada-002" + }, + "metrics": { + "contextSimilarity": null, + "correctness": 3.96, + "faithfulness": 0.889, + "relevancy": 0.848 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/covidqa/llamaindex_baseline.py" + } + ] +} diff --git a/llama-datasets/covidqa/llamaindex_baseline.py b/llama-datasets/covidqa/llamaindex_baseline.py new file mode 100644 index 0000000000000..152490e025f41 --- /dev/null +++ b/llama-datasets/covidqa/llamaindex_baseline.py @@ -0,0 +1,35 @@ +import asyncio + +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + + +async def main(): + # DOWNLOAD LLAMADATASET + rag_dataset, documents = download_llama_dataset("CovidQaDataset", "./data") + + # BUILD BASIC RAG PIPELINE + index = VectorStoreIndex.from_documents(documents=documents) + query_engine = index.as_query_engine() + + # EVALUATE WITH PACK + RagEvaluatorPack = download_llama_pack("RagEvaluatorPack", "./pack") + rag_evaluator = RagEvaluatorPack(query_engine=query_engine, rag_dataset=rag_dataset) + + ############################################################################ + # NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # + # then you'll need to use different batch_size and sleep_time_in_seconds. # + # For Usage Tier 1, settings that seemed to work well were batch_size=5, # + # and sleep_time_in_seconds=15 (as of December 2023.) 
# + ############################################################################ + benchmark_df = await rag_evaluator.arun( + batch_size=40, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # number of seconds to sleep before making an api call + ) + print(benchmark_df) + + +if __name__ == "__main__": + loop = asyncio.get_event_loop() + loop.run_until_complete(main()) # call main() so a coroutine object is passed diff --git a/llama-datasets/docugami_kg_rag/sec_10_q/BUILD b/llama-datasets/docugami_kg_rag/sec_10_q/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-datasets/docugami_kg_rag/sec_10_q/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-datasets/docugami_kg_rag/sec_10_q/README.md b/llama-datasets/docugami_kg_rag/sec_10_q/README.md new file mode 100644 index 0000000000000..fcd97d2c03d84 --- /dev/null +++ b/llama-datasets/docugami_kg_rag/sec_10_q/README.md @@ -0,0 +1,63 @@ +# Docugami KG-RAG - Sec 10-Q + +A labelled RAG dataset with SEC 10-Q documents for major tech companies including queries across multiple docs and chunks, with reference answers. See [https://github.com/docugami/KG-RAG-datasets](https://github.com/docugami/KG-RAG-datasets) for details. + +## CLI Usage + +You can download `llamadatasets` directly using `llamaindex-cli`, which comes installed with the `llama-index` python package: + +```bash +llamaindex-cli download-llamadataset DocugamiKgRagSec10Q --download-dir ./data +``` + +You can then inspect the files at `./data`. When you're ready to load the data into +python, you can use the below snippet of code: + +```python +from llama_index.core import SimpleDirectoryReader +from llama_index.core.llama_dataset import LabelledRagDataset + +rag_dataset = LabelledRagDataset.from_json("./data/rag_dataset.json") +documents = SimpleDirectoryReader(input_dir="./data/source_files").load_data() +``` + +## Code Usage + +You can download the dataset to a directory, say `./data` directly in Python +as well.
From there, you can use the convenient `RagEvaluatorPack` llamapack to +run your own LlamaIndex RAG pipeline with the `llamadataset`. + +```python +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + +# download and install dependencies for benchmark dataset +rag_dataset, documents = download_llama_dataset( + "DocugamiKgRagSec10Q", "./data" +) + +# build basic RAG system +index = VectorStoreIndex.from_documents(documents=documents) +query_engine = index.as_query_engine() + +# evaluate using the RagEvaluatorPack +RagEvaluatorPack = download_llama_pack( + "RagEvaluatorPack", "./rag_evaluator_pack" +) +rag_evaluator_pack = RagEvaluatorPack( + rag_dataset=rag_dataset, query_engine=query_engine +) + +############################################################################ +# NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # +# then you'll need to use different batch_size and sleep_time_in_seconds. # +# For Usage Tier 1, settings that seemed to work well were batch_size=5, # +# and sleep_time_in_seconds=15 (as of December 2023.) # +############################################################################ + +benchmark_df = await rag_evaluator_pack.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # seconds to sleep before making an api call +) +``` diff --git a/llama-datasets/docugami_kg_rag/sec_10_q/card.json b/llama-datasets/docugami_kg_rag/sec_10_q/card.json new file mode 100644 index 0000000000000..cfc73290dfc5d --- /dev/null +++ b/llama-datasets/docugami_kg_rag/sec_10_q/card.json @@ -0,0 +1,27 @@ +{ + "name": "Docugami KG-RAG - SEC 10-Q", + "className": "LabelledRagDataset", + "description": "A labelled RAG dataset with SEC 10-Q documents for major tech companies including queries across multiple docs and chunks, with reference answers. 
See https://github.com/docugami/KG-RAG-datasets for details.", + "numberObservations": 195, + "containsExamplesByHumans": true, + "containsExamplesByAi": false, + "sourceUrls": [], + "baselines": [ + { + "name": "llamaindex", + "config": { + "chunkSize": 1024, + "llm": "gpt-3.5-turbo", + "similarityTopK": 2, + "embedModel": "text-embedding-ada-002" + }, + "metrics": { + "contextSimilarity": null, + "correctness": 2.703, + "faithfulness": 0.897, + "relevancy": 0.826 + }, + "codeUrl": "" + } + ] +} diff --git a/llama-datasets/docugami_kg_rag/sec_10_q/llamaindex_baseline.py b/llama-datasets/docugami_kg_rag/sec_10_q/llamaindex_baseline.py new file mode 100644 index 0000000000000..0945521bd17ab --- /dev/null +++ b/llama-datasets/docugami_kg_rag/sec_10_q/llamaindex_baseline.py @@ -0,0 +1,41 @@ +import asyncio + +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex +from llama_index.llms.openai import OpenAI + + +async def main(): + # DOWNLOAD LLAMADATASET + rag_dataset, documents = download_llama_dataset( + "DocugamiKgRagSec10Q", "./docugami_kg_rag_sec_10_q" + ) + + # BUILD BASIC RAG PIPELINE + index = VectorStoreIndex.from_documents(documents=documents) + query_engine = index.as_query_engine() + + # EVALUATE WITH PACK + RagEvaluatorPack = download_llama_pack("RagEvaluatorPack", "./pack_stuff") + judge_llm = OpenAI(model="gpt-3.5-turbo") + rag_evaluator = RagEvaluatorPack( + query_engine=query_engine, rag_dataset=rag_dataset, judge_llm=judge_llm + ) + + ############################################################################ + # NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # + # then you'll need to use different batch_size and sleep_time_in_seconds. # + # For Usage Tier 1, settings that seemed to work well were batch_size=5, # + # and sleep_time_in_seconds=15 (as of December 2023.)
# + ############################################################################ + benchmark_df = await rag_evaluator.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # number of seconds sleep before making an api call + ) + print(benchmark_df) + + +if __name__ == "__main__": + # asyncio.run() needs the coroutine object, so main must be called here + asyncio.run(main()) diff --git a/llama-datasets/eval_llm_survey_paper/BUILD b/llama-datasets/eval_llm_survey_paper/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-datasets/eval_llm_survey_paper/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-datasets/eval_llm_survey_paper/README.md b/llama-datasets/eval_llm_survey_paper/README.md new file mode 100644 index 0000000000000..5252e714a4a4d --- /dev/null +++ b/llama-datasets/eval_llm_survey_paper/README.md @@ -0,0 +1,61 @@ +# Evaluating Llm Survey Paper Dataset + +## CLI Usage + +You can download `llamadatasets` directly using `llamaindex-cli`, which comes installed with the `llama-index` python package: + +```bash +llamaindex-cli download-llamadataset EvaluatingLlmSurveyPaperDataset --download-dir ./data +``` + +You can then inspect the files at `./data`. When you're ready to load the data into +python, you can use the below snippet of code: + +```python +from llama_index.core import SimpleDirectoryReader +from llama_index.core.llama_dataset import LabelledRagDataset + +rag_dataset = LabelledRagDataset.from_json("./data/rag_dataset.json") +documents = SimpleDirectoryReader(input_dir="./data/source_files").load_data() +``` + +## Code Usage + +You can download the dataset to a directory, say `./data` directly in Python +as well. From there, you can use the convenient `RagEvaluatorPack` llamapack to +run your own LlamaIndex RAG pipeline with the `llamadataset`.
+ +```python +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + +# download and install dependencies for benchmark dataset +rag_dataset, documents = download_llama_dataset( + "EvaluatingLlmSurveyPaperDataset", "./data" +) + +# build basic RAG system +index = VectorStoreIndex.from_documents(documents=documents) +query_engine = index.as_query_engine() + +# evaluate using the RagEvaluatorPack +RagEvaluatorPack = download_llama_pack( + "RagEvaluatorPack", "./rag_evaluator_pack" +) +rag_evaluator_pack = RagEvaluatorPack( + rag_dataset=rag_dataset, query_engine=query_engine +) + +############################################################################ +# NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # +# then you'll need to use different batch_size and sleep_time_in_seconds. # +# For Usage Tier 1, settings that seemed to work well were batch_size=5, # +# and sleep_time_in_seconds=15 (as of December 2023.) 
# +############################################################################ + +benchmark_df = await rag_evaluator_pack.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # seconds to sleep before making an api call +) +``` diff --git a/llama-datasets/eval_llm_survey_paper/card.json b/llama-datasets/eval_llm_survey_paper/card.json new file mode 100644 index 0000000000000..54c5e4f25556b --- /dev/null +++ b/llama-datasets/eval_llm_survey_paper/card.json @@ -0,0 +1,27 @@ +{ + "name": "Evaluating LLM Survey Paper Dataset", + "className": "LabelledRagDataset", + "description": "A labelled RAG dataset over the comprehensive, spanning 111 pages in total, survey on evaluating LLMs.", + "numberObservations": 276, + "containsExamplesByHumans": false, + "containsExamplesByAi": true, + "sourceUrls": ["https://arxiv.org/pdf/2310.19736.pdf"], + "baselines": [ + { + "name": "llamaindex", + "config": { + "chunkSize": 1024, + "llm": "gpt-3.5-turbo", + "similarityTopK": 2, + "embedModel": "text-embedding-ada-002" + }, + "metrics": { + "contextSimilarity": 0.923, + "correctness": 3.81, + "faithfulness": 0.888, + "relevancy": 0.808 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/mini_squadv2/llamaindex_baseline.py" + } + ] +} diff --git a/llama-datasets/eval_llm_survey_paper/llamaindex_baseline.py b/llama-datasets/eval_llm_survey_paper/llamaindex_baseline.py new file mode 100644 index 0000000000000..001accf42813c --- /dev/null +++ b/llama-datasets/eval_llm_survey_paper/llamaindex_baseline.py @@ -0,0 +1,37 @@ +import asyncio + +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + + +async def main(): + # DOWNLOAD LLAMADATASET + rag_dataset, documents = download_llama_dataset( + "EvaluatingLlmSurveyPaperDataset", "./data" + ) + + # BUILD BASIC RAG PIPELINE + index = 
VectorStoreIndex.from_documents(documents=documents) + query_engine = index.as_query_engine() + + # EVALUATE WITH PACK + RagEvaluatorPack = download_llama_pack("RagEvaluatorPack", "./pack") + rag_evaluator = RagEvaluatorPack(query_engine=query_engine, rag_dataset=rag_dataset) + + ############################################################################ + # NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # + # then you'll need to use different batch_size and sleep_time_in_seconds. # + # For Usage Tier 1, settings that seemed to work well were batch_size=5, # + # and sleep_time_in_seconds=15 (as of December 2023.) # + ############################################################################ + benchmark_df = await rag_evaluator.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # number of seconds sleep before making an api call + ) + print(benchmark_df) + + +if __name__ == "__main__": + # main() alone only builds a coroutine object; asyncio.run() executes it + asyncio.run(main()) diff --git a/llama-datasets/history_of_alexnet/BUILD b/llama-datasets/history_of_alexnet/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-datasets/history_of_alexnet/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-datasets/history_of_alexnet/README.md b/llama-datasets/history_of_alexnet/README.md new file mode 100644 index 0000000000000..1cf0f1e64caa0 --- /dev/null +++ b/llama-datasets/history_of_alexnet/README.md @@ -0,0 +1,61 @@ +# History Of Alexnet Dataset + +## CLI Usage + +You can download `llamadatasets` directly using `llamaindex-cli`, which comes installed with the `llama-index` python package: + +```bash +llamaindex-cli download-llamadataset HistoryOfAlexnetDataset --download-dir ./data +``` + +You can then inspect the files at `./data`.
When you're ready to load the data into +python, you can use the below snippet of code: + +```python +from llama_index.core import SimpleDirectoryReader +from llama_index.core.llama_dataset import LabelledRagDataset + +rag_dataset = LabelledRagDataset.from_json("./data/rag_dataset.json") +documents = SimpleDirectoryReader(input_dir="./data/source_files").load_data() +``` + +## Code Usage + +You can download the dataset to a directory, say `./data` directly in Python +as well. From there, you can use the convenient `RagEvaluatorPack` llamapack to +run your own LlamaIndex RAG pipeline with the `llamadataset`. + +```python +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + +# download and install dependencies for benchmark dataset +rag_dataset, documents = download_llama_dataset( + "HistoryOfAlexnetDataset", "./data" +) + +# build basic RAG system +index = VectorStoreIndex.from_documents(documents=documents) +query_engine = index.as_query_engine() + +# evaluate using the RagEvaluatorPack +RagEvaluatorPack = download_llama_pack( + "RagEvaluatorPack", "./rag_evaluator_pack" +) +rag_evaluator_pack = RagEvaluatorPack( + rag_dataset=rag_dataset, query_engine=query_engine +) + +############################################################################ +# NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # +# then you'll need to use different batch_size and sleep_time_in_seconds. # +# For Usage Tier 1, settings that seemed to work well were batch_size=5, # +# and sleep_time_in_seconds=15 (as of December 2023.) 
# +############################################################################ + +benchmark_df = await rag_evaluator_pack.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # seconds to sleep before making an api call +) +``` diff --git a/llama-datasets/history_of_alexnet/card.json b/llama-datasets/history_of_alexnet/card.json new file mode 100644 index 0000000000000..632136c4aec75 --- /dev/null +++ b/llama-datasets/history_of_alexnet/card.json @@ -0,0 +1,27 @@ +{ + "name": "History of Alexnet Dataset", + "className": "LabelledRagDataset", + "description": "A labelled RAG dataset based off an article, The History Began from AlexNet: A Comprehensive Survey on Deep Learning Approaches, by Md Zahangir Alom, Tarek M. Taha, Christopher Yakopcic, Stefan Westberg, Paheding Sidike, Mst Shamima Nasrin, Brian C Van Esesn, Abdul A S. Awwal, Vijayan K. Asari, consisting of queries, reference answers, and reference contexts.", + "numberObservations": 160, + "containsExamplesByHumans": false, + "containsExamplesByAi": true, + "sourceUrls": ["https://arxiv.org/abs/1803.01164"], + "baselines": [ + { + "name": "llamaindex", + "config": { + "chunkSize": 1024, + "llm": "gpt-3.5-turbo", + "similarityTopK": 2, + "embedModel": "text-embedding-ada-002" + }, + "metrics": { + "contextSimilarity": 0.931, + "correctness": 4.434, + "faithfulness": 0.963, + "relevancy": 0.931 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/history_of_alexnet/llamaindex_baseline.py" + } + ] +} diff --git a/llama-datasets/history_of_alexnet/llamaindex_baseline.py b/llama-datasets/history_of_alexnet/llamaindex_baseline.py new file mode 100644 index 0000000000000..dcf09d21a2db2 --- /dev/null +++ b/llama-datasets/history_of_alexnet/llamaindex_baseline.py @@ -0,0 +1,35 @@ +import asyncio + +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from 
llama_index.core import VectorStoreIndex + + +async def main(): + # DOWNLOAD LLAMADATASET + rag_dataset, documents = download_llama_dataset("HistoryOfAlexnetDataset", "./data") + + # BUILD BASIC RAG PIPELINE + index = VectorStoreIndex.from_documents(documents=documents) + query_engine = index.as_query_engine() + + # EVALUATE WITH PACK + RagEvaluatorPack = download_llama_pack("RagEvaluatorPack", "./pack_stuff") + rag_evaluator = RagEvaluatorPack(query_engine=query_engine, rag_dataset=rag_dataset) + + ############################################################################ + # NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # + # then you'll need to use different batch_size and sleep_time_in_seconds. # + # For Usage Tier 1, settings that seemed to work well were batch_size=5, # + # and sleep_time_in_seconds=15 (as of December 2023.) # + ############################################################################ + benchmark_df = await rag_evaluator.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # number of seconds sleep before making an api call + ) + print(benchmark_df) + + +if __name__ == "__main__": + # asyncio.run() needs the coroutine object, so main must be called here + asyncio.run(main()) diff --git a/llama-datasets/library.json b/llama-datasets/library.json new file mode 100644 index 0000000000000..c30a293ccd74a --- /dev/null +++ b/llama-datasets/library.json @@ -0,0 +1,87 @@ +{ + "PaulGrahamEssayDataset": { + "id": "paul_graham_essay", + "author": "nerdai", + "keywords": ["rag"] + }, + "BraintrustCodaHelpDeskDataset": { + "id": "braintrust_coda", + "author": "dashk", + "keywords": ["rag", "help desk"] + }, + "PatronusAIFinanceBenchDataset": { + "id": "patronus_financebench", + "author": "anandnk24", + "keywords": ["rag", "finance"] + }, + "BlockchainSolanaDataset": { + "id": "blockchain_solana", + "author": "CalculusC", + "keywords": ["rag", "cryptocurrency"] + }, + "MiniTruthfulQADataset": { + "id": 
"mini_truthfulqa", + "author": "nerdai", + "keywords": ["rag", "truthfulqa"] + }, + "Llama2PaperDataset": { + "id": "llama2_paper", + "author": "jerryjliu", + "keywords": ["rag", "llama2"] + }, + "Uber10KDataset2021": { + "id": "10k/uber_2021", + "author": "jerryjliu", + "keywords": ["sec", "uber", "10k"] + }, + "MiniSquadV2Dataset": { + "id": "mini_squadv2", + "author": "axiomofjoy", + "keywords": ["rag", "squadv2"] + }, + "OriginOfCovid19Dataset": { + "id": "origin_of_covid19", + "author": "CalculusC", + "keywords": ["rag", "covid-19"] + }, + "EvaluatingLlmSurveyPaperDataset": { + "id": "eval_llm_survey_paper", + "author": "nerdai", + "keywords": ["rag", "evaluation", "paper"] + }, + "CovidQaDataset": { + "id": "covidqa", + "author": "nerdai", + "keywords": ["rag", "covid"] + }, + "MiniCovidQaDataset": { + "id": "mini_covidqa", + "author": "nerdai", + "keywords": ["rag", "covid", "mini"] + }, + "HistoryOfAlexnetDataset": { + "id": "history_of_alexnet", + "author": "CalculusC", + "keywords": ["rag", "alexnet"] + }, + "DocugamiKgRagSec10Q": { + "id": "docugami_kg_rag/sec_10_q", + "author": "Docugami", + "keywords": ["rag", "kg-rag", "10q", "docugami"] + }, + "MtBenchHumanJudgementDataset": { + "id": "mt_bench_humanjudgement", + "author": "nerdai", + "keywords": ["evaluator", "llm as judge", "human agreement"] + }, + "MiniMtBenchSingleGradingDataset": { + "id": "mini_mt_bench_singlegrading", + "author": "nerdai", + "keywords": ["evaluator", "llm as judge"] + }, + "MiniEsgBenchDataset": { + "id": "mini_esg_bench", + "author": "nerdai", + "keywords": ["rag", "pdf", "esg"] + } +} diff --git a/llama-datasets/llama2_paper/BUILD b/llama-datasets/llama2_paper/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-datasets/llama2_paper/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-datasets/llama2_paper/README.md b/llama-datasets/llama2_paper/README.md new file mode 100644 index 0000000000000..457cd8fc2f188 --- /dev/null +++ 
b/llama-datasets/llama2_paper/README.md @@ -0,0 +1,59 @@ +# Llama 2 Paper Dataset + +## CLI Usage + +You can download `llamadatasets` directly using `llamaindex-cli`, which comes installed with the `llama-index` python package: + +```bash +llamaindex-cli download-llamadataset Llama2PaperDataset --download-dir ./data +``` + +You can then inspect the files at `./data`. When you're ready to load the data into +python, you can use the below snippet of code: + +```python +from llama_index.core import SimpleDirectoryReader +from llama_index.core.llama_dataset import LabelledRagDataset + +rag_dataset = LabelledRagDataset.from_json("./data/rag_dataset.json") +documents = SimpleDirectoryReader(input_dir="./data/source_files").load_data() +``` + +## Code Usage + +You can download the dataset to a directory, say `./data` directly in Python +as well. From there, you can use the convenient `RagEvaluatorPack` llamapack to +run your own LlamaIndex RAG pipeline with the `llamadataset`. + +```python +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + +# download and install dependencies for benchmark dataset +rag_dataset, documents = download_llama_dataset("Llama2PaperDataset", "./data") + +# build basic RAG system +index = VectorStoreIndex.from_documents(documents=documents) +query_engine = index.as_query_engine() + +# evaluate using the RagEvaluatorPack +RagEvaluatorPack = download_llama_pack( + "RagEvaluatorPack", "./rag_evaluator_pack" +) +rag_evaluator_pack = RagEvaluatorPack( + rag_dataset=rag_dataset, query_engine=query_engine +) + +############################################################################ +# NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # +# then you'll need to use different batch_size and sleep_time_in_seconds. 
# +# For Usage Tier 1, settings that seemed to work well were batch_size=5, # +# and sleep_time_in_seconds=15 (as of December 2023.) # +############################################################################ + +benchmark_df = await rag_evaluator_pack.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # seconds to sleep before making an api call +) +``` diff --git a/llama-datasets/llama2_paper/__init__.py b/llama-datasets/llama2_paper/__init__.py new file mode 100644 index 0000000000000..e69de29bb2d1d diff --git a/llama-datasets/llama2_paper/card.json b/llama-datasets/llama2_paper/card.json new file mode 100644 index 0000000000000..ce772a8f76205 --- /dev/null +++ b/llama-datasets/llama2_paper/card.json @@ -0,0 +1,27 @@ +{ + "name": "Llama 2 Paper Dataset", + "className": "LabelledRagDataset", + "description": "A labelled RAG dataset based off the Llama 2 ArXiv PDF.", + "numberObservations": 100, + "containsExamplesByHumans": false, + "containsExamplesByAi": true, + "sourceUrls": ["https://arxiv.org/abs/2307.09288"], + "baselines": [ + { + "name": "llamaindex", + "config": { + "chunkSize": 1024, + "llm": "gpt-3.5-turbo", + "similarityTopK": 2, + "embedModel": "text-embedding-ada-002" + }, + "metrics": { + "contextSimilarity": 0.939, + "correctness": 4.08, + "faithfulness": 0.97, + "relevancy": 0.95 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/llama2_paper/llamaindex_baseline.py" + } + ] +} diff --git a/llama-datasets/llama2_paper/llamaindex_baseline.py b/llama-datasets/llama2_paper/llamaindex_baseline.py new file mode 100644 index 0000000000000..110208f68248c --- /dev/null +++ b/llama-datasets/llama2_paper/llamaindex_baseline.py @@ -0,0 +1,35 @@ +import asyncio + +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + + +async def main(): + # 
DOWNLOAD LLAMADATASET + rag_dataset, documents = download_llama_dataset("Llama2PaperDataset", "./data") + + # BUILD BASIC RAG PIPELINE + index = VectorStoreIndex.from_documents(documents=documents) + query_engine = index.as_query_engine() + + # EVALUATE WITH PACK + RagEvaluatorPack = download_llama_pack("RagEvaluatorPack", "./pack_stuff") + rag_evaluator = RagEvaluatorPack(query_engine=query_engine, rag_dataset=rag_dataset) + + ############################################################################ + # NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # + # then you'll need to use different batch_size and sleep_time_in_seconds. # + # For Usage Tier 1, settings that seemed to work well were batch_size=5, # + # and sleep_time_in_seconds=15 (as of December 2023.) # + ############################################################################ + benchmark_df = await rag_evaluator.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # number of seconds sleep before making an api call + ) + print(benchmark_df) + + +if __name__ == "__main__": + # asyncio.run() needs the coroutine object, so main must be called here + asyncio.run(main()) diff --git a/llama-datasets/mini_covidqa/BUILD b/llama-datasets/mini_covidqa/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-datasets/mini_covidqa/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-datasets/mini_covidqa/README.md b/llama-datasets/mini_covidqa/README.md new file mode 100644 index 0000000000000..350c82c739e33 --- /dev/null +++ b/llama-datasets/mini_covidqa/README.md @@ -0,0 +1,59 @@ +# Mini Covid Qa Dataset + +## CLI Usage + +You can download `llamadatasets` directly using `llamaindex-cli`, which comes installed with the `llama-index` python package: + +```bash +llamaindex-cli download-llamadataset MiniCovidQaDataset --download-dir ./data +``` + +You can then inspect the files at `./data`.
When you're ready to load the data into +python, you can use the below snippet of code: + +```python +from llama_index.core import SimpleDirectoryReader +from llama_index.core.llama_dataset import LabelledRagDataset + +rag_dataset = LabelledRagDataset.from_json("./data/rag_dataset.json") +documents = SimpleDirectoryReader(input_dir="./data/source_files").load_data() +``` + +## Code Usage + +You can download the dataset to a directory, say `./data` directly in Python +as well. From there, you can use the convenient `RagEvaluatorPack` llamapack to +run your own LlamaIndex RAG pipeline with the `llamadataset`. + +```python +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + +# download and install dependencies for benchmark dataset +rag_dataset, documents = download_llama_dataset("MiniCovidQaDataset", "./data") + +# build basic RAG system +index = VectorStoreIndex.from_documents(documents=documents) +query_engine = index.as_query_engine() + +# evaluate using the RagEvaluatorPack +RagEvaluatorPack = download_llama_pack( + "RagEvaluatorPack", "./rag_evaluator_pack" +) +rag_evaluator_pack = RagEvaluatorPack( + rag_dataset=rag_dataset, query_engine=query_engine +) + +############################################################################ +# NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # +# then you'll need to use different batch_size and sleep_time_in_seconds. # +# For Usage Tier 1, settings that seemed to work well were batch_size=5, # +# and sleep_time_in_seconds=15 (as of December 2023.) 
# +############################################################################ + +benchmark_df = await rag_evaluator_pack.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # seconds to sleep before making an api call +) +``` diff --git a/llama-datasets/mini_covidqa/card.json b/llama-datasets/mini_covidqa/card.json new file mode 100644 index 0000000000000..99c5b97746ad6 --- /dev/null +++ b/llama-datasets/mini_covidqa/card.json @@ -0,0 +1,29 @@ +{ + "name": "Mini Covid QA Dataset", + "className": "LabelledRagDataset", + "description": "This dataset is a mini version of CovidQaDataset.\n A human-annotated RAG dataset consisting of over 300 question-answer pairs. This dataset represents a subset of the Covid-QA dataset available on Kaggle and authored by Xhlulu. It is a collection of frequently asked questions on COVID from various websites. This subset only considers the top 10 webpages containing the most question-answer pairs.", + "numberObservations": 42, + "containsExamplesByHumans": true, + "containsExamplesByAi": false, + "sourceUrls": [ + "https://www.kaggle.com/datasets/xhlulu/mini_covidqa/?select=news.csv" + ], + "baselines": [ + { + "name": "llamaindex", + "config": { + "chunkSize": 1024, + "llm": "gpt-3.5-turbo", + "similarityTopK": 2, + "embedModel": "text-embedding-ada-002" + }, + "metrics": { + "contextSimilarity": null, + "correctness": 4.214, + "faithfulness": 0.857, + "relevancy": 0.833 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/mini_covidqa/llamaindex_baseline.py" + } + ] +} diff --git a/llama-datasets/mini_covidqa/llamaindex_baseline.py b/llama-datasets/mini_covidqa/llamaindex_baseline.py new file mode 100644 index 0000000000000..bcc9e5b963f81 --- /dev/null +++ b/llama-datasets/mini_covidqa/llamaindex_baseline.py @@ -0,0 +1,35 @@ +import asyncio + +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack 
import download_llama_pack +from llama_index.core import VectorStoreIndex + + +async def main(): + # DOWNLOAD LLAMADATASET + rag_dataset, documents = download_llama_dataset("MiniCovidQaDataset", "./data") + + # BUILD BASIC RAG PIPELINE + index = VectorStoreIndex.from_documents(documents=documents) + query_engine = index.as_query_engine() + + # EVALUATE WITH PACK + RagEvaluatorPack = download_llama_pack("RagEvaluatorPack", "./pack") + rag_evaluator = RagEvaluatorPack(query_engine=query_engine, rag_dataset=rag_dataset) + + ############################################################################ + # NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # + # then you'll need to use different batch_size and sleep_time_in_seconds. # + # For Usage Tier 1, settings that seemed to work well were batch_size=5, # + # and sleep_time_in_seconds=15 (as of December 2023.) # + ############################################################################ + benchmark_df = await rag_evaluator.arun( + batch_size=40, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # number of seconds sleep before making an api call + ) + print(benchmark_df) + + +if __name__ == "__main__": + # asyncio.run() needs the coroutine object, so main must be called here + asyncio.run(main()) diff --git a/llama-datasets/mini_esg_bench/BUILD b/llama-datasets/mini_esg_bench/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-datasets/mini_esg_bench/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-datasets/mini_esg_bench/README.md b/llama-datasets/mini_esg_bench/README.md new file mode 100644 index 0000000000000..2f3c89c00115b --- /dev/null +++ b/llama-datasets/mini_esg_bench/README.md @@ -0,0 +1,75 @@ +# Mini Esg Bench Dataset + +## CLI Usage + +You can download `llamadatasets` directly using `llamaindex-cli`, which comes installed with the `llama-index` python package: + +```bash +llamaindex-cli download-llamadataset MiniEsgBenchDataset 
--download-dir ./data +``` + +You can then inspect the files at `./data`. When you're ready to load the data into +python, you can use the below snippet of code: + +```python +from llama_index.core import SimpleDirectoryReader +from llama_index.core.llama_dataset import LabelledRagDataset + +rag_dataset = LabelledRagDataset.from_json("./data/rag_dataset.json") +documents = SimpleDirectoryReader(input_dir="./data/source_files").load_data() +``` + +## Code Usage + +You can download the dataset to a directory, say `./data` directly in Python +as well. From there, you can use the convenient `RagEvaluatorPack` llamapack to +run your own LlamaIndex RAG pipeline with the `llamadataset`. + +```python +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + +# download and install dependencies for benchmark dataset +rag_dataset, documents = download_llama_dataset( + "MiniEsgBenchDataset", "./data" +) + +# build basic RAG system +index = VectorStoreIndex.from_documents(documents=documents) +query_engine = index.as_query_engine() + +# evaluate using the RagEvaluatorPack +RagEvaluatorPack = download_llama_pack( + "RagEvaluatorPack", "./rag_evaluator_pack" +) +rag_evaluator_pack = RagEvaluatorPack( + rag_dataset=rag_dataset, query_engine=query_engine +) + +############################################################################ +# NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # +# then you'll need to use different batch_size and sleep_time_in_seconds. # +# For Usage Tier 1, settings that seemed to work well were batch_size=5, # +# and sleep_time_in_seconds=15 (as of December 2023.) 
# +############################################################################ + +benchmark_df = await rag_evaluator_pack.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # seconds to sleep before making an api call +) +``` + +## Citing the data + +If you choose to use this dataset for research, it would be appreciated if you +could cite it with given details below. + +```text +@misc{llamaindex_mini_esg_bench_2023, + title={Mini ESG Bench}, + author={Val Andrei Fajardo}, + year={2023}, + organization={llamaindex} +} +``` diff --git a/llama-datasets/mini_esg_bench/card.json b/llama-datasets/mini_esg_bench/card.json new file mode 100644 index 0000000000000..726fd0909bb4a --- /dev/null +++ b/llama-datasets/mini_esg_bench/card.json @@ -0,0 +1,27 @@ +{ + "name": "Mini ESG Bench Dataset", + "className": "LabelledRagDataset", + "description": "This dataset is meant to be a difficult benchmark for pdf parsers. In particular, adopting the terminology used in the PDFTriage paper (https://arxiv.org/abs/2309.08872), we curate difficult questions involving structural knowledge of the PDF documents. 
The examples in this dataset come from the Environment, Social and (corporate) Governance (ESG) reports of FAANG (companies) and Microsoft in 2021-2022.", + "numberObservations": 50, + "containsExamplesByHumans": true, + "containsExamplesByAi": false, + "sourceUrls": [], + "baselines": [ + { + "name": "llamaindex", + "config": { + "chunkSize": 1024, + "llm": "gpt-3.5-turbo", + "similarityTopK": 2, + "embedModel": "text-embedding-ada-002" + }, + "metrics": { + "contextSimilarity": 0.836, + "correctness": 1.88, + "faithfulness": 0.84, + "relevancy": 0.6 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/mini_esg_bench/llamaindex_baseline.py" + } + ] +} diff --git a/llama-datasets/mini_esg_bench/llamaindex_baseline.py b/llama-datasets/mini_esg_bench/llamaindex_baseline.py new file mode 100644 index 0000000000000..7aa4607b0f271 --- /dev/null +++ b/llama-datasets/mini_esg_bench/llamaindex_baseline.py @@ -0,0 +1,35 @@ +import asyncio + +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + + +async def main(): + # DOWNLOAD LLAMADATASET + rag_dataset, documents = download_llama_dataset("MiniEsgBenchDataset", "./data") + + # BUILD BASIC RAG PIPELINE + index = VectorStoreIndex.from_documents(documents=documents) + query_engine = index.as_query_engine() + + # EVALUATE WITH PACK + RagEvaluatorPack = download_llama_pack("RagEvaluatorPack", "./pack_stuff") + rag_evaluator = RagEvaluatorPack(query_engine=query_engine, rag_dataset=rag_dataset) + + ############################################################################ + # NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # + # then you'll need to use different batch_size and sleep_time_in_seconds. # + # For Usage Tier 1, settings that seemed to work well were batch_size=5, # + # and sleep_time_in_seconds=15 (as of December 2023.) 
# + ############################################################################ + benchmark_df = await rag_evaluator.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # number of seconds sleep before making an api call + ) + print(benchmark_df) + + +if __name__ == "__main__": + # asyncio.run() needs the coroutine object, so main must be called here + asyncio.run(main()) diff --git a/llama-datasets/mini_mt_bench_singlegrading/BUILD b/llama-datasets/mini_mt_bench_singlegrading/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-datasets/mini_mt_bench_singlegrading/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-datasets/mini_mt_bench_singlegrading/README.md b/llama-datasets/mini_mt_bench_singlegrading/README.md new file mode 100644 index 0000000000000..ed7170a4f9321 --- /dev/null +++ b/llama-datasets/mini_mt_bench_singlegrading/README.md @@ -0,0 +1,82 @@ +# Mini Mt Bench Single Grading Dataset + +## CLI Usage + +You can download `llamadatasets` directly using `llamaindex-cli`, which comes installed with the `llama-index` python package: + +```bash +llamaindex-cli download-llamadataset MiniMtBenchSingleGradingDataset --download-dir ./data +``` + +You can then inspect the files at `./data`. When you're ready to load the data into +python, you can use the below snippet of code: + +```python +from llama_index.core import SimpleDirectoryReader +from llama_index.core.llama_dataset import LabelledEvaluatorDataset + +evaluator_dataset = LabelledEvaluatorDataset.from_json( + "./data/pairwise_evaluation_dataset.json" +) +``` + +## Code Usage + +You can download the dataset to a directory, say `./data` directly in Python +as well. From there, you can use the convenient `EvaluatorBenchmarkerPack` llamapack to +run your own LlamaIndex RAG pipeline with the `llamadataset`.
+ +```python +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core.evaluation import CorrectnessEvaluator +from llama_index.llms import OpenAI +from llama_index.core import ServiceContext + +# download benchmark dataset +evaluator_dataset, _ = download_llama_dataset( + "MiniMtBenchSingleGradingDataset", "./data" +) + +# define your evaluator +gpt_4_context = ServiceContext.from_defaults( + llm=OpenAI(temperature=0, model="gpt-4"), +) + +evaluator = CorrectnessEvaluator(service_context=gpt_4_context) + +# evaluate using the EvaluatorBenchmarkerPack +EvaluatorBenchmarkerPack = download_llama_pack( + "EvaluatorBenchmarkerPack", "./pack" +) +evaluator_benchmarker = EvaluatorBenchmarkerPack( + evaluator=evaluator, + eval_dataset=evaluator_dataset, + show_progress=True, +) + +############################################################################ +# NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # +# then you'll need to use different batch_size and sleep_time_in_seconds. # +# For Usage Tier 1, settings that seemed to work well were batch_size=5, # +# and sleep_time_in_seconds=15 (as of December 2023.) # +############################################################################ + +benchmark_df = await evaluator_benchmarker.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # seconds to sleep before making an api call +) +``` + +## Original data citation + +```text +@misc{zheng2023judging, + title={Judging LLM-as-a-judge with MT-Bench and Chatbot Arena}, + author={Lianmin Zheng and Wei-Lin Chiang and Ying Sheng and Siyuan Zhuang and Zhanghao Wu and Yonghao Zhuang and Zi Lin and Zhuohan Li and Dacheng Li and Eric. P Xing and Hao Zhang and Joseph E. 
Gonzalez and Ion Stoica}, + year={2023}, + eprint={2306.05685}, + archivePrefix={arXiv}, + primaryClass={cs.CL} +} +``` diff --git a/llama-datasets/mini_mt_bench_singlegrading/baselines.py b/llama-datasets/mini_mt_bench_singlegrading/baselines.py new file mode 100644 index 0000000000000..f8096e882ba40 --- /dev/null +++ b/llama-datasets/mini_mt_bench_singlegrading/baselines.py @@ -0,0 +1,84 @@ +import asyncio + +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core.evaluation import CorrectnessEvaluator +from llama_index.llms import OpenAI, Gemini +from llama_index.core import ServiceContext +import pandas as pd + + +async def main(): + # DOWNLOAD LLAMADATASET + evaluator_dataset, _ = download_llama_dataset( + "MiniMtBenchSingleGradingDataset", "./mini_mt_bench_data" + ) + + # DEFINE EVALUATORS + gpt_4_context = ServiceContext.from_defaults( + llm=OpenAI(temperature=0, model="gpt-4"), + ) + + gpt_3p5_context = ServiceContext.from_defaults( + llm=OpenAI(temperature=0, model="gpt-3.5-turbo"), + ) + + gemini_pro_context = ServiceContext.from_defaults( + llm=Gemini(model="models/gemini-pro", temperature=0) + ) + + evaluators = { + "gpt-4": CorrectnessEvaluator(service_context=gpt_4_context), + "gpt-3.5": CorrectnessEvaluator(service_context=gpt_3p5_context), + "gemini-pro": CorrectnessEvaluator(service_context=gemini_pro_context), + } + + # EVALUATE WITH PACK + ############################################################################ + # NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # + # then you'll need to use different batch_size and sleep_time_in_seconds. # + # For Usage Tier 1, settings that seemed to work well were batch_size=5, # + # and sleep_time_in_seconds=15 (as of December 2023.) 
# + ############################################################################ + EvaluatorBenchmarkerPack = download_llama_pack("EvaluatorBenchmarkerPack", "./pack") + evaluator_benchmarker = EvaluatorBenchmarkerPack( + evaluator=evaluators["gpt-3.5"], + eval_dataset=evaluator_dataset, + show_progress=True, + ) + gpt_3p5_benchmark_df = await evaluator_benchmarker.arun( + batch_size=100, sleep_time_in_seconds=0 + ) + + evaluator_benchmarker = EvaluatorBenchmarkerPack( + evaluator=evaluators["gpt-4"], + eval_dataset=evaluator_dataset, + show_progress=True, + ) + gpt_4_benchmark_df = await evaluator_benchmarker.arun( + batch_size=100, sleep_time_in_seconds=0 + ) + + evaluator_benchmarker = EvaluatorBenchmarkerPack( + evaluator=evaluators["gemini-pro"], + eval_dataset=evaluator_dataset, + show_progress=True, + ) + gemini_pro_benchmark_df = await evaluator_benchmarker.arun( + batch_size=5, sleep_time_in_seconds=0.5 + ) + + benchmark_df = pd.concat( + [ + gpt_3p5_benchmark_df, + gpt_4_benchmark_df, + gemini_pro_benchmark_df, + ], + axis=0, + ) + print(benchmark_df) + + +if __name__ == "__main__": + loop = asyncio.get_event_loop() + loop.run_until_complete(main()) diff --git a/llama-datasets/mini_mt_bench_singlegrading/card.json b/llama-datasets/mini_mt_bench_singlegrading/card.json new file mode 100644 index 0000000000000..06bfe889a7dd2 --- /dev/null +++ b/llama-datasets/mini_mt_bench_singlegrading/card.json @@ -0,0 +1,55 @@ +{ + "name": "Mini MT Bench Dataset", + "className": "LabelledEvaluatorDataset", + "description": "This is a miniature version to the original MT Bench (Single-Grading) Dataset. In particular, this dataset only consists of answers produced by Llama2-70b LLM to the 160 questions i.e., 80 x 2 since there are two turns. 
The reference evaluations are done using the `CorrectnessEvaluator` class and with GPT-4 as the judge LLM.", + "numberObservations": 160, + "containsExamplesByHumans": false, + "containsExamplesByAi": true, + "sourceUrls": [ + "https://huggingface.co/spaces/lmsys/mt-bench/tree/main/data/mt_bench" + ], + "baselines": [ + { + "name": "gpt-3.5", + "config": { + "promptUrl": "https://github.com/run-llama/llama_index.core/blob/e471e5f8a93ddae6d366cdbba8a497cd6728c7f8/llama_index.core/evaluation/correctness.py#L17", + "llm": "gpt-3.5" + }, + "metrics": { + "invalidPredictions": 0, + "correlation": 0.317, + "meanAbsoluteError": 1.119, + "hamming": 27 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/mini_mt_bench_singlegrading/baselines.py" + }, + { + "name": "gpt-4", + "config": { + "promptUrl": "https://github.com/run-llama/llama_index.core/blob/e471e5f8a93ddae6d366cdbba8a497cd6728c7f8/llama_index.core/evaluation/correctness.py#L17", + "llm": "gpt-4" + }, + "metrics": { + "invalidPredictions": 0, + "correlation": 0.966, + "meanAbsoluteError": 0.094, + "hamming": 143 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/mini_mt_bench_singlegrading/baselines.py" + }, + { + "name": "gemini-pro", + "config": { + "promptUrl": "https://github.com/run-llama/llama_index.core/blob/e471e5f8a93ddae6d366cdbba8a497cd6728c7f8/llama_index.core/evaluation/correctness.py#L17", + "llm": "gemini-pro" + }, + "metrics": { + "invalidPredictions": 1, + "correlation": 0.295, + "meanAbsoluteError": 1.22, + "hamming": 12 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/mini_mt_bench_singlegrading/baselines.py" + } + ] +} diff --git a/llama-datasets/mini_squadv2/BUILD b/llama-datasets/mini_squadv2/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-datasets/mini_squadv2/BUILD @@ -0,0 +1 @@ +python_sources() diff --git 
a/llama-datasets/mini_squadv2/README.md b/llama-datasets/mini_squadv2/README.md new file mode 100644 index 0000000000000..ea5cdfd259e9f --- /dev/null +++ b/llama-datasets/mini_squadv2/README.md @@ -0,0 +1,79 @@ +# Mini Squad V2 Dataset + +[![arize (100 x 40 px)](https://github.com/nerdai/llama-hub/assets/92402603/eb4cb77a-1a1a-48a0-9f9d-277798832200)](https://arize.com/) + +This dataset was prepared in collaboration with Xander Song of Arize AI. + +## CLI Usage + +You can download `llamadatasets` directly using `llamaindex-cli`, which comes installed with the `llama-index` python package: + +```bash +llamaindex-cli download-llamadataset MiniSquadV2Dataset --download-dir ./data +``` + +You can then inspect the files at `./data`. When you're ready to load the data into +python, you can use the below snippet of code: + +```python +from llama_index.core import SimpleDirectoryReader +from llama_index.core.llama_dataset import LabelledRagDataset + +rag_dataset = LabelledRagDataset.from_json("./data/rag_dataset.json") +documents = SimpleDirectoryReader(input_dir="./data/source_files").load_data() +``` + +## Code Usage + +You can download the dataset to a directory, say `./data` directly in Python +as well. From there, you can use the convenient `RagEvaluatorPack` llamapack to +run your own LlamaIndex RAG pipeline with the `llamadataset`. 
+ +```python +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + +# download and install dependencies for benchmark dataset +rag_dataset, documents = download_llama_dataset("MiniSquadV2Dataset", "./data") + +# build basic RAG system +index = VectorStoreIndex.from_documents(documents=documents) +query_engine = index.as_query_engine() + +# evaluate using the RagEvaluatorPack +RagEvaluatorPack = download_llama_pack( + "RagEvaluatorPack", "./rag_evaluator_pack" +) +rag_evaluator_pack = RagEvaluatorPack( + rag_dataset=rag_dataset, query_engine=query_engine +) + +############################################################################ +# NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # +# then you'll need to use different batch_size and sleep_time_in_seconds. # +# For Usage Tier 1, settings that seemed to work well were batch_size=5, # +# and sleep_time_in_seconds=15 (as of December 2023.) 
# +############################################################################ + +benchmark_df = await rag_evaluator_pack.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # seconds to sleep before making an api call +) +``` + +## Original data citation + +```tex +@article{2016arXiv160605250R, + author = {{Rajpurkar}, Pranav and {Zhang}, Jian and {Lopyrev}, + Konstantin and {Liang}, Percy}, + title = "{SQuAD: 100,000+ Questions for Machine Comprehension of Text}", + journal = {arXiv e-prints}, + year = 2016, + eid = {arXiv:1606.05250}, + pages = {arXiv:1606.05250}, +archivePrefix = {arXiv}, + eprint = {1606.05250}, +} +``` diff --git a/llama-datasets/mini_squadv2/card.json b/llama-datasets/mini_squadv2/card.json new file mode 100644 index 0000000000000..6c5adffa7cd01 --- /dev/null +++ b/llama-datasets/mini_squadv2/card.json @@ -0,0 +1,27 @@ +{ + "name": "Mini Squad V2 Dataset", + "className": "LabelledRagDataset", + "description": "This is a subset of the original SquadV2 dataset. 
In particular, it considers only the top 10 Wikipedia pages in terms of having questions about them.", + "numberObservations": 195, + "containsExamplesByHumans": true, + "containsExamplesByAi": false, + "sourceUrls": ["https://huggingface.co/datasets/squad_v2"], + "baselines": [ + { + "name": "llamaindex", + "config": { + "chunkSize": 1024, + "llm": "gpt-3.5-turbo", + "similarityTopK": 2, + "embedModel": "text-embedding-ada-002" + }, + "metrics": { + "contextSimilarity": 0.878, + "correctness": 3.464, + "faithfulness": 0.815, + "relevancy": 0.697 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/mini_squadv2/llamaindex_baseline.py" + } + ] +} diff --git a/llama-datasets/mini_squadv2/llamaindex_baseline.py b/llama-datasets/mini_squadv2/llamaindex_baseline.py new file mode 100644 index 0000000000000..5bfe2a58b6451 --- /dev/null +++ b/llama-datasets/mini_squadv2/llamaindex_baseline.py @@ -0,0 +1,35 @@ +import asyncio + +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + + +async def main(): + # DOWNLOAD LLAMADATASET + rag_dataset, documents = download_llama_dataset("MiniSquadV2Dataset", "./data") + + # BUILD BASIC RAG PIPELINE + index = VectorStoreIndex.from_documents(documents=documents) + query_engine = index.as_query_engine() + + # EVALUATE WITH PACK + RagEvaluatorPack = download_llama_pack("RagEvaluatorPack", "./pack_stuff") + rag_evaluator = RagEvaluatorPack(query_engine=query_engine, rag_dataset=rag_dataset) + + ############################################################################ + # NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # + # then you'll need to use different batch_size and sleep_time_in_seconds. # + # For Usage Tier 1, settings that seemed to work well were batch_size=5, # + # and sleep_time_in_seconds=15 (as of December 2023.) 
# + ############################################################################ + benchmark_df = await rag_evaluator.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # number of seconds sleep before making an api call + ) + print(benchmark_df) + + +if __name__ == "__main__": + loop = asyncio.get_event_loop() + loop.run_until_complete(main()) diff --git a/llama-datasets/mini_truthfulqa/BUILD b/llama-datasets/mini_truthfulqa/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-datasets/mini_truthfulqa/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-datasets/mini_truthfulqa/README.md b/llama-datasets/mini_truthfulqa/README.md new file mode 100644 index 0000000000000..3ae8b99b1177c --- /dev/null +++ b/llama-datasets/mini_truthfulqa/README.md @@ -0,0 +1,74 @@ +# Mini TruthfulQA Dataset + +## CLI Usage + +You can download `llamadatasets` directly using `llamaindex-cli`, which comes installed with the `llama-index` python package: + +```bash +llamaindex-cli download-llamadataset MiniTruthfulQADataset --download-dir ./data +``` + +You can then inspect the files at `./data`. When you're ready to load the data into +python, you can use the below snippet of code: + +```python +from llama_index.core import SimpleDirectoryReader +from llama_index.core.llama_dataset import LabelledRagDataset + +rag_dataset = LabelledRagDataset.from_json("./data/rag_dataset.json") +documents = SimpleDirectoryReader(input_dir="./data/source_files").load_data() +``` + +## Code Usage + +You can download the dataset to a directory, say `./data` directly in Python +as well. From there, you can use the convenient `RagEvaluatorPack` llamapack to +run your own LlamaIndex RAG pipeline with the `llamadataset`. 
+ +```python +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + +# download and install dependencies for benchmark dataset +rag_dataset, documents = download_llama_dataset( + "MiniTruthfulQADataset", "./data" +) + +# build basic RAG system +index = VectorStoreIndex.from_documents(documents=documents) +query_engine = index.as_query_engine() + +# evaluate using the RagEvaluatorPack +RagEvaluatorPack = download_llama_pack( + "RagEvaluatorPack", "./rag_evaluator_pack" +) +rag_evaluator_pack = RagEvaluatorPack( + rag_dataset=rag_dataset, query_engine=query_engine +) + +############################################################################ +# NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # +# then you'll need to use different batch_size and sleep_time_in_seconds. # +# For Usage Tier 1, settings that seemed to work well were batch_size=5, # +# and sleep_time_in_seconds=15 (as of December 2023.) # +############################################################################ + +benchmark_df = await rag_evaluator_pack.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # seconds to sleep before making an api call +) +``` + +## Original data citation + +```tex +@misc{lin2021truthfulqa, + title={TruthfulQA: Measuring How Models Mimic Human Falsehoods}, + author={Stephanie Lin and Jacob Hilton and Owain Evans}, + year={2021}, + eprint={2109.07958}, + archivePrefix={arXiv}, + primaryClass={cs.CL} +} +``` diff --git a/llama-datasets/mini_truthfulqa/card.json b/llama-datasets/mini_truthfulqa/card.json new file mode 100644 index 0000000000000..dae559b961270 --- /dev/null +++ b/llama-datasets/mini_truthfulqa/card.json @@ -0,0 +1,27 @@ +{ + "name": "Mini TruthfulQA Dataset", + "className": "LabelledRagDataset", + "description": "This is a subset of the TruthfulQA benchmark. 
Only examples that are based off of Wikipedia pages are considered; and furthermore, Wikipedia pages that contain only one question are also dropped. The result is 152 examples for evaluating a RAG system.", + "numberObservations": 152, + "containsExamplesByHumans": true, + "containsExamplesByAi": false, + "sourceUrls": ["https://huggingface.co/datasets/truthful_qa"], + "baselines": [ + { + "name": "llamaindex", + "config": { + "chunkSize": 1024, + "llm": "gpt-3.5-turbo", + "similarityTopK": 2, + "embedModel": "text-embedding-ada-002" + }, + "metrics": { + "contextSimilarity": null, + "correctness": 3.845, + "faithfulness": 0.605, + "relevancy": 0.599 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/mini_truthfulqa/llamaindex_baseline.py" + } + ] +} diff --git a/llama-datasets/mini_truthfulqa/llamaindex_baseline.py b/llama-datasets/mini_truthfulqa/llamaindex_baseline.py new file mode 100644 index 0000000000000..457fafcc58636 --- /dev/null +++ b/llama-datasets/mini_truthfulqa/llamaindex_baseline.py @@ -0,0 +1,35 @@ +import asyncio + +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + + +async def main(): + # DOWNLOAD LLAMADATASET + rag_dataset, documents = download_llama_dataset("MiniTruthfulQADataset", "./data") + + # BUILD BASIC RAG PIPELINE + index = VectorStoreIndex.from_documents(documents=documents) + query_engine = index.as_query_engine() + + # EVALUATE WITH PACK + RagEvaluatorPack = download_llama_pack("RagEvaluatorPack", "./pack") + rag_evaluator = RagEvaluatorPack(query_engine=query_engine, rag_dataset=rag_dataset) + + ############################################################################ + # NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # + # then you'll need to use different batch_size and sleep_time_in_seconds. 
# + # For Usage Tier 1, settings that seemed to work well were batch_size=5, # + # and sleep_time_in_seconds=15 (as of December 2023.) # + ############################################################################ + benchmark_df = await rag_evaluator.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # number of seconds sleep before making an api call + ) + print(benchmark_df) + + +if __name__ == "__main__": + loop = asyncio.get_event_loop() + loop.run_until_complete(main()) diff --git a/llama-datasets/mt_bench_humanjudgement/BUILD b/llama-datasets/mt_bench_humanjudgement/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-datasets/mt_bench_humanjudgement/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-datasets/mt_bench_humanjudgement/README.md b/llama-datasets/mt_bench_humanjudgement/README.md new file mode 100644 index 0000000000000..9f9e9d762e513 --- /dev/null +++ b/llama-datasets/mt_bench_humanjudgement/README.md @@ -0,0 +1,82 @@ +# Mt Bench Human Judgement Dataset + +## CLI Usage + +You can download `llamadatasets` directly using `llamaindex-cli`, which comes installed with the `llama-index` python package: + +```bash +llamaindex-cli download-llamadataset MtBenchHumanJudgementDataset --download-dir ./data +``` + +You can then inspect the files at `./data`. When you're ready to load the data into +python, you can use the below snippet of code: + +```python +from llama_index.core import SimpleDirectoryReader +from llama_index.core.llama_dataset import LabelledPairwiseEvaluatorDataset + +pairwise_evaluator_dataset = LabelledPairwiseEvaluatorDataset.from_json( + "./data/pairwise_evaluator_dataset.json" +) +``` + +## Code Usage + +You can download the dataset to a directory, say `./data` directly in Python +as well. From there, you can use the convenient `EvaluatorBenchmarkerPack` llamapack to +run your own LlamaIndex RAG pipeline with the `llamadataset`. 
+ +```python +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core.evaluation import PairwiseComparisonEvaluator +from llama_index.llms import OpenAI +from llama_index.core import ServiceContext + +# download benchmark dataset +pairwise_evaluator_dataset, _ = download_llama_dataset( + "MtBenchHumanJudgementDataset", "./data" +) + +# define your evaluator +gpt_4_context = ServiceContext.from_defaults( + llm=OpenAI(temperature=0, model="gpt-4"), +) + +evaluator = PairwiseComparisonEvaluator(service_context=gpt_4_context) + +# evaluate using the EvaluatorBenchmarkerPack +EvaluatorBenchmarkerPack = download_llama_pack( + "EvaluatorBenchmarkerPack", "./pack" +) +evaluator_benchmarker = EvaluatorBenchmarkerPack( + evaluator=evaluator, + eval_dataset=pairwise_evaluator_dataset, + show_progress=True, +) + +############################################################################ +# NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # +# then you'll need to use different batch_size and sleep_time_in_seconds. # +# For Usage Tier 1, settings that seemed to work well were batch_size=5, # +# and sleep_time_in_seconds=15 (as of December 2023.) # +############################################################################ + +benchmark_df = await evaluator_benchmarker.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # seconds to sleep before making an api call +) +``` + +## Original data citation + +```text +@misc{zheng2023judging, + title={Judging LLM-as-a-judge with MT-Bench and Chatbot Arena}, + author={Lianmin Zheng and Wei-Lin Chiang and Ying Sheng and Siyuan Zhuang and Zhanghao Wu and Yonghao Zhuang and Zi Lin and Zhuohan Li and Dacheng Li and Eric. P Xing and Hao Zhang and Joseph E. 
Gonzalez and Ion Stoica}, + year={2023}, + eprint={2306.05685}, + archivePrefix={arXiv}, + primaryClass={cs.CL} +} +``` diff --git a/llama-datasets/mt_bench_humanjudgement/baselines.py b/llama-datasets/mt_bench_humanjudgement/baselines.py new file mode 100644 index 0000000000000..3e8094ef91540 --- /dev/null +++ b/llama-datasets/mt_bench_humanjudgement/baselines.py @@ -0,0 +1,84 @@ +import asyncio + +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core.evaluation import PairwiseComparisonEvaluator +from llama_index.llms import OpenAI, Gemini +from llama_index.core import ServiceContext +import pandas as pd + + +async def main(): + # DOWNLOAD LLAMADATASET + pairwise_evaluator_dataset, _ = download_llama_dataset( + "MtBenchHumanJudgementDataset", "./mt_bench_data" + ) + + # DEFINE EVALUATORS + gpt_4_context = ServiceContext.from_defaults( + llm=OpenAI(temperature=0, model="gpt-4"), + ) + + gpt_3p5_context = ServiceContext.from_defaults( + llm=OpenAI(temperature=0, model="gpt-3.5-turbo"), + ) + + gemini_pro_context = ServiceContext.from_defaults( + llm=Gemini(model="models/gemini-pro", temperature=0) + ) + + evaluators = { + "gpt-4": PairwiseComparisonEvaluator(service_context=gpt_4_context), + "gpt-3.5": PairwiseComparisonEvaluator(service_context=gpt_3p5_context), + "gemini-pro": PairwiseComparisonEvaluator(service_context=gemini_pro_context), + } + + # EVALUATE WITH PACK + ############################################################################ + # NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # + # then you'll need to use different batch_size and sleep_time_in_seconds. # + # For Usage Tier 1, settings that seemed to work well were batch_size=5, # + # and sleep_time_in_seconds=15 (as of December 2023.) 
# + ############################################################################ + EvaluatorBenchmarkerPack = download_llama_pack("EvaluatorBenchmarkerPack", "./pack") + evaluator_benchmarker = EvaluatorBenchmarkerPack( + evaluator=evaluators["gpt-3.5"], + eval_dataset=pairwise_evaluator_dataset, + show_progress=True, + ) + gpt_3p5_benchmark_df = await evaluator_benchmarker.arun( + batch_size=100, sleep_time_in_seconds=0 + ) + + evaluator_benchmarker = EvaluatorBenchmarkerPack( + evaluator=evaluators["gpt-4"], + eval_dataset=pairwise_evaluator_dataset, + show_progress=True, + ) + gpt_4_benchmark_df = await evaluator_benchmarker.arun( + batch_size=100, sleep_time_in_seconds=0 + ) + + evaluator_benchmarker = EvaluatorBenchmarkerPack( + evaluator=evaluators["gemini-pro"], + eval_dataset=pairwise_evaluator_dataset, + show_progress=True, + ) + gemini_pro_benchmark_df = await evaluator_benchmarker.arun( + batch_size=5, sleep_time_in_seconds=0.5 + ) + + benchmark_df = pd.concat( + [ + gpt_3p5_benchmark_df, + gpt_4_benchmark_df, + gemini_pro_benchmark_df, + ], + axis=0, + ) + print(benchmark_df) + + +if __name__ == "__main__": + loop = asyncio.get_event_loop() + loop.run_until_complete(main()) diff --git a/llama-datasets/mt_bench_humanjudgement/card.json b/llama-datasets/mt_bench_humanjudgement/card.json new file mode 100644 index 0000000000000..286ab624ce64d --- /dev/null +++ b/llama-datasets/mt_bench_humanjudgement/card.json @@ -0,0 +1,58 @@ +{ + "name": "MT Bench Human Judgement Dataset", + "className": "LabelledPairwiseEvaluatorDataset", + "description": "This is an adaptation of the original MT Bench Human Judgement dataset, where human evaluators compare two llm model responses and rank them according to their own preference. In the original version, there can be more than one human evaluator for a given example (query, two model responses). 
In this adapted version however, we aggregate these 'repeated' entries and convert the 'winner' column of the original schema to instead represent the proportion of times 'model_a' wins across all of the human evaluators. To adapt this to a llama-dataset, and to better consider ties (albeit with small samples) we set an uncertainty threshold for this proportion in that if it is between [0.4, 0.6] then we consider there to be no winner between the two models.", + "numberObservations": 1204, + "containsExamplesByHumans": true, + "containsExamplesByAi": false, + "sourceUrls": [ + "https://huggingface.co/datasets/lmsys/mt_bench_human_judgments" + ], + "baselines": [ + { + "name": "gpt-3.5", + "config": { + "promptUrl": "https://github.com/run-llama/llama_index.core/blob/e471e5f8a93ddae6d366cdbba8a497cd6728c7f8/llama_index.core/evaluation/pairwise.py#L21", + "llm": "gpt-3.5" + }, + "metrics": { + "invalidPredictions": 89, + "inconclusives": 407, + "ties": 51, + "agreementRateWithTies": 0.743, + "agreementRateWithoutTies": 0.798 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/mt_bench_humanjudgement/baselines.py" + }, + { + "name": "gpt-4", + "config": { + "promptUrl": "https://github.com/run-llama/llama_index.core/blob/e471e5f8a93ddae6d366cdbba8a497cd6728c7f8/llama_index.core/evaluation/pairwise.py#L21", + "llm": "gpt-4" + }, + "metrics": { + "invalidPredictions": 1, + "inconclusives": 107, + "ties": 102, + "agreementRateWithTies": 0.709, + "agreementRateWithoutTies": 0.779 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/mt_bench_humanjudgement/baselines.py" + }, + { + "name": "gemini-pro", + "config": { + "promptUrl": "https://github.com/run-llama/llama_index.core/blob/e471e5f8a93ddae6d366cdbba8a497cd6728c7f8/llama_index.core/evaluation/pairwise.py#L21", + "llm": "gemini-pro" + }, + "metrics": { + "invalidPredictions": 2, + "inconclusives": 295, + "ties": 60, + 
"agreementRateWithTies": 0.742, + "agreementRateWithoutTies": 0.793 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/mt_bench_humanjudgement/baselines.py" + } + ] +} diff --git a/llama-datasets/origin_of_covid19/BUILD b/llama-datasets/origin_of_covid19/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-datasets/origin_of_covid19/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-datasets/origin_of_covid19/README.md b/llama-datasets/origin_of_covid19/README.md new file mode 100644 index 0000000000000..a7d8b4b9bd8b6 --- /dev/null +++ b/llama-datasets/origin_of_covid19/README.md @@ -0,0 +1,62 @@ +# Origin Of COVID-19 Dataset + +## CLI Usage + +You can download `llamadatasets` directly using `llamaindex-cli`, which comes installed with the `llama-index` python package: + +```bash +llamaindex-cli download-llamadataset OriginOfCovid19Dataset --download-dir ./data +``` + +You can then inspect the files at `./data`. When you're ready to load the data into +python, you can use the below snippet of code: + +```python +from llama_index.core import SimpleDirectoryReader +from llama_index.core.llama_dataset import LabelledRagDataset + +rag_dataset = LabelledRagDataset.from_json("./data/rag_dataset.json") +documents = SimpleDirectoryReader(input_dir="./data/source_files").load_data() +``` + +## Code Usage + +You can download the dataset to a directory, say `./data` directly in Python +as well. From there, you can use the convenient `RagEvaluatorPack` llamapack to +run your own LlamaIndex RAG pipeline with the `llamadataset`. 
+ +```python +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + +# download and install dependencies for benchmark dataset +rag_dataset, documents = download_llama_dataset( + "OriginOfCovid19Dataset", "./data" +) + +# build basic RAG system +index = VectorStoreIndex.from_documents(documents=documents) +query_engine = index.as_query_engine() + +# evaluate using the RagEvaluatorPack +RagEvaluatorPack = download_llama_pack( + "RagEvaluatorPack", "./rag_evaluator_pack" +) +rag_evaluator_pack = RagEvaluatorPack( + rag_dataset=rag_dataset, query_engine=query_engine +) +benchmark_df = rag_evaluator_pack.run() # async arun() supported as well + +############################################################################ +# NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # +# then you'll need to use different batch_size and sleep_time_in_seconds. # +# For Usage Tier 1, settings that seemed to work well were batch_size=5, # +# and sleep_time_in_seconds=15 (as of December 2023.) 
# +############################################################################ + +benchmark_df = await rag_evaluator_pack.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # seconds to sleep before making an api call +) +``` diff --git a/llama-datasets/origin_of_covid19/card.json b/llama-datasets/origin_of_covid19/card.json new file mode 100644 index 0000000000000..6686d3a68b978 --- /dev/null +++ b/llama-datasets/origin_of_covid19/card.json @@ -0,0 +1,27 @@ +{ + "name": "Origin Of Covid19 Dataset", + "className": "LabelledRagDataset", + "description": "A labelled RAG dataset based off an article, The Origin Of COVID-19 and Why It Matters, by Morens DM, Breman JG, Calisher CH, Doherty PC, Hahn BH, Keusch GT, Kramer LD, LeDuc JW, Monath TP, Taubenberger JK, consisting of queries, reference answers, and reference contexts.", + "numberObservations": 24, + "containsExamplesByHumans": false, + "containsExamplesByAi": true, + "sourceUrls": ["https://www.ncbi.nlm.nih.gov/pmc/articles/PMC7470595/"], + "baselines": [ + { + "name": "llamaindex", + "config": { + "chunkSize": 1024, + "llm": "gpt-3.5-turbo", + "similarityTopK": 2, + "embedModel": "text-embedding-ada-002" + }, + "metrics": { + "contextSimilarity": 0.952, + "correctness": 4.562, + "faithfulness": 1.0, + "relevancy": 0.958 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/origin_of_covid19/llamaindex_baseline.py" + } + ] +} diff --git a/llama-datasets/origin_of_covid19/llamaindex_baseline.py b/llama-datasets/origin_of_covid19/llamaindex_baseline.py new file mode 100644 index 0000000000000..83a5f7415054c --- /dev/null +++ b/llama-datasets/origin_of_covid19/llamaindex_baseline.py @@ -0,0 +1,35 @@ +import asyncio + +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + + +async def main(): + # DOWNLOAD 
LLAMADATASET + rag_dataset, documents = download_llama_dataset("OriginOfCovid19Dataset", "./data") + + # BUILD BASIC RAG PIPELINE + index = VectorStoreIndex.from_documents(documents=documents) + query_engine = index.as_query_engine() + + # EVALUATE WITH PACK + RagEvaluatorPack = download_llama_pack("RagEvaluatorPack", "./pack") + rag_evaluator = RagEvaluatorPack(query_engine=query_engine, rag_dataset=rag_dataset) + + ############################################################################ + # NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # + # then you'll need to use different batch_size and sleep_time_in_seconds. # + # For Usage Tier 1, settings that seemed to work well were batch_size=5, # + # and sleep_time_in_seconds=15 (as of December 2023.) # + ############################################################################ + benchmark_df = await rag_evaluator.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # number of seconds sleep before making an api call + ) + print(benchmark_df) + + +if __name__ == "__main__": + loop = asyncio.get_event_loop() + loop.run_until_complete(main()) diff --git a/llama-datasets/patronus_financebench/BUILD b/llama-datasets/patronus_financebench/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-datasets/patronus_financebench/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-datasets/patronus_financebench/README.md b/llama-datasets/patronus_financebench/README.md new file mode 100644 index 0000000000000..3fb0fdce8129d --- /dev/null +++ b/llama-datasets/patronus_financebench/README.md @@ -0,0 +1,68 @@ +# Patronus AI FinanceBench Dataset + +[![patronus-ai-logo (200 x 40 px)](https://github.com/nerdai/llama-hub/assets/92402603/62a6df3f-57a3-4d68-917b-b0947392efcd)](https://www.patronus.ai/) + +This dataset is a subset of the original FinanceBench dataset. 
In particular, to +make this benchmark more computationally efficient, we only keep the documents for +which there are 2 or more questions. Such filtering reduced the total number of unique PDF +documents from 98 to 32. + +## CLI Usage + +You can download `llamadatasets` directly using `llamaindex-cli`, which comes installed with the `llama-index` python package: + +```bash +llamaindex-cli download-llamadataset PatronusAIFinanceBenchDataset --download-dir ./data +``` + +You can then inspect the files at `./data`. When you're ready to load the data into +python, you can use the below snippet of code: + +```python +from llama_index.core import SimpleDirectoryReader +from llama_index.core.llama_dataset import LabelledRagDataset + +rag_dataset = LabelledRagDataset.from_json("./data/rag_dataset.json") +documents = SimpleDirectoryReader(input_dir="./data/source_files").load_data() +``` + +## Code Usage + +You can download the dataset to a directory, say `./data` directly in Python +as well. From there, you can use the convenient `RagEvaluatorPack` llamapack to +run your own LlamaIndex RAG pipeline with the `llamadataset`. 
+ +```python +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + +# download and install dependencies for benchmark dataset +rag_dataset, documents = download_llama_dataset( + "PatronusAIFinanceBenchDataset", "./data" +) + +# build basic RAG system +index = VectorStoreIndex.from_documents(documents=documents) +query_engine = index.as_query_engine() + +# evaluate using the RagEvaluatorPack +RagEvaluatorPack = download_llama_pack( + "RagEvaluatorPack", "./rag_evaluator_pack" +) +rag_evaluator_pack = RagEvaluatorPack( + rag_dataset=rag_dataset, query_engine=query_engine +) + +############################################################################ +# NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # +# then you'll need to use different batch_size and sleep_time_in_seconds. # +# For Usage Tier 1, settings that seemed to work well were batch_size=5, # +# and sleep_time_in_seconds=15 (as of December 2023.) # +############################################################################ + +benchmark_df = await rag_evaluator_pack.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # seconds to sleep before making an api call +) +``` diff --git a/llama-datasets/patronus_financebench/__init__.py b/llama-datasets/patronus_financebench/__init__.py new file mode 100644 index 0000000000000..e69de29bb2d1d diff --git a/llama-datasets/patronus_financebench/card.json b/llama-datasets/patronus_financebench/card.json new file mode 100644 index 0000000000000..38bcfffb6d09d --- /dev/null +++ b/llama-datasets/patronus_financebench/card.json @@ -0,0 +1,27 @@ +{ + "name": "Patronus AI FinanceBench", + "className": "LabelledRagDataset", + "description": "This is a subset of the original FinanceBench dataset. 
FinanceBench is a first-of-its-kind test suite for evaluating the performance of LLMs on open book financial question answering (QA). This is an open source sample of 150 annotated examples used in the evaluation and analysis of models assessed in the FinanceBench paper. The dataset comprises of questions about publicly traded companies, with corresponding answers and evidence strings. The questions in FinanceBench are ecologically valid and cover a diverse set of scenarios. They are intended to be clear-cut and straightforward to answer to serve as a minimum performance standard.", + "numberObservations": 98, + "containsExamplesByHumans": true, + "containsExamplesByAi": false, + "sourceUrls": ["https://huggingface.co/datasets/PatronusAI/financebench"], + "baselines": [ + { + "name": "llamaindex", + "config": { + "chunkSize": 1024, + "llm": "gpt-3.5-turbo", + "similarityTopK": 1, + "embedModel": "text-embedding-ada-002" + }, + "metrics": { + "contextSimilarity": 0.87, + "correctness": 2.622, + "faithfulness": 0.755, + "relevancy": 0.684 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/patronus_financebench/llamaindex_baseline.py" + } + ] +} diff --git a/llama-datasets/patronus_financebench/llamaindex_baseline.py b/llama-datasets/patronus_financebench/llamaindex_baseline.py new file mode 100644 index 0000000000000..7b9b31b20ec9f --- /dev/null +++ b/llama-datasets/patronus_financebench/llamaindex_baseline.py @@ -0,0 +1,37 @@ +import asyncio + +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + + +async def main(): + # DOWNLOAD LLAMADATASET + rag_dataset, documents = download_llama_dataset( + "PatronusAIFinanceBenchDataset", "./patronus_financebench" + ) + + # BUILD BASIC RAG PIPELINE + index = VectorStoreIndex.from_documents(documents=documents) + query_engine = index.as_query_engine() + + # EVALUATE 
WITH PACK + RagEvaluatorPack = download_llama_pack("RagEvaluatorPack", "./pack_stuff") + rag_evaluator = RagEvaluatorPack(query_engine=query_engine, rag_dataset=rag_dataset) + + ############################################################################ + # NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # + # then you'll need to use different batch_size and sleep_time_in_seconds. # + # For Usage Tier 1, settings that seemed to work well were batch_size=5, # + # and sleep_time_in_seconds=15 (as of December 2023.) # + ############################################################################ + benchmark_df = await rag_evaluator.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # number of seconds sleep before making an api call + ) + print(benchmark_df) + + +if __name__ == "__main__": + loop = asyncio.get_event_loop() + loop.run_until_complete(main()) diff --git a/llama-datasets/paul_graham_essay/BUILD b/llama-datasets/paul_graham_essay/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-datasets/paul_graham_essay/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-datasets/paul_graham_essay/README.md b/llama-datasets/paul_graham_essay/README.md new file mode 100644 index 0000000000000..ac92763359758 --- /dev/null +++ b/llama-datasets/paul_graham_essay/README.md @@ -0,0 +1,61 @@ +# Paul Graham Essay Dataset + +## CLI Usage + +You can download `llamadatasets` directly using `llamaindex-cli`, which comes installed with the `llama-index` python package: + +```bash +llamaindex-cli download-llamadataset PaulGrahamEssayDataset --download-dir ./data +``` + +You can then inspect the files at `./data`. 
When you're ready to load the data into +python, you can use the below snippet of code: + +```python +from llama_index.core import SimpleDirectoryReader +from llama_index.core.llama_dataset import LabelledRagDataset + +rag_dataset = LabelledRagDataset.from_json("./data/rag_dataset.json") +documents = SimpleDirectoryReader(input_dir="./data/source_files").load_data() +``` + +## Code Usage + +You can download the dataset to a directory, say `./data` directly in Python +as well. From there, you can use the convenient `RagEvaluatorPack` llamapack to +run your own LlamaIndex RAG pipeline with the `llamadataset`. + +```python +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + +# download and install dependencies for benchmark dataset +rag_dataset, documents = download_llama_dataset( + "PaulGrahamEssayDataset", "./data" +) + +# build basic RAG system +index = VectorStoreIndex.from_documents(documents=documents) +query_engine = index.as_query_engine() + +# evaluate using the RagEvaluatorPack +RagEvaluatorPack = download_llama_pack( + "RagEvaluatorPack", "./rag_evaluator_pack" +) +rag_evaluator_pack = RagEvaluatorPack( + rag_dataset=rag_dataset, query_engine=query_engine +) + +############################################################################ +# NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # +# then you'll need to use different batch_size and sleep_time_in_seconds. # +# For Usage Tier 1, settings that seemed to work well were batch_size=5, # +# and sleep_time_in_seconds=15 (as of December 2023.) 
# +############################################################################ + +benchmark_df = await rag_evaluator_pack.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # seconds to sleep before making an api call +) +``` diff --git a/llama-datasets/paul_graham_essay/__init__.py b/llama-datasets/paul_graham_essay/__init__.py new file mode 100644 index 0000000000000..e69de29bb2d1d diff --git a/llama-datasets/paul_graham_essay/card.json b/llama-datasets/paul_graham_essay/card.json new file mode 100644 index 0000000000000..8d4eb8d67dc98 --- /dev/null +++ b/llama-datasets/paul_graham_essay/card.json @@ -0,0 +1,27 @@ +{ + "name": "Paul Graham Essay", + "className": "LabelledRagDataset", + "description": "A labelled RAG dataset based off an essay by Paul Graham, consisting of queries, reference answers, and reference contexts.", + "numberObservations": 44, + "containsExamplesByHumans": false, + "containsExamplesByAi": true, + "sourceUrls": ["http://www.paulgraham.com/articles.html"], + "baselines": [ + { + "name": "llamaindex", + "config": { + "chunkSize": 1024, + "llm": "gpt-3.5-turbo", + "similarityTopK": 2, + "embedModel": "text-embedding-ada-002" + }, + "metrics": { + "contextSimilarity": 0.934, + "correctness": 4.239, + "faithfulness": 0.977, + "relevancy": 0.977 + }, + "codeUrl": "https://github.com/run-llama/llama-hub/blob/main/llama_hub/llama_datasets/paul_graham_essay/llamaindex_baseline.py" + } + ] +} diff --git a/llama-datasets/paul_graham_essay/llamaindex_baseline.py b/llama-datasets/paul_graham_essay/llamaindex_baseline.py new file mode 100644 index 0000000000000..f5f3a76eed926 --- /dev/null +++ b/llama-datasets/paul_graham_essay/llamaindex_baseline.py @@ -0,0 +1,37 @@ +import asyncio + +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + + +async def main(): + # DOWNLOAD LLAMADATASET 
+ rag_dataset, documents = download_llama_dataset( + "PaulGrahamEssayDataset", "./paul_graham" + ) + + # BUILD BASIC RAG PIPELINE + index = VectorStoreIndex.from_documents(documents=documents) + query_engine = index.as_query_engine() + + # EVALUATE WITH PACK + RagEvaluatorPack = download_llama_pack("RagEvaluatorPack", "./pack_stuff") + rag_evaluator = RagEvaluatorPack(query_engine=query_engine, rag_dataset=rag_dataset) + + ############################################################################ + # NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # + # then you'll need to use different batch_size and sleep_time_in_seconds. # + # For Usage Tier 1, settings that seemed to work well were batch_size=5, # + # and sleep_time_in_seconds=15 (as of December 2023.) # + ############################################################################ + benchmark_df = await rag_evaluator.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # number of seconds sleep before making an api call + ) + print(benchmark_df) + + +if __name__ == "__main__": + loop = asyncio.get_event_loop() + loop.run_until_complete(main()) diff --git a/llama-datasets/template_README.md b/llama-datasets/template_README.md new file mode 100644 index 0000000000000..10852a6ffc3cd --- /dev/null +++ b/llama-datasets/template_README.md @@ -0,0 +1,59 @@ +# {NAME} + +## CLI Usage + +You can download `llamadatasets` directly using `llamaindex-cli`, which comes installed with the `llama-index` python package: + +```bash +llamaindex-cli download-llamadataset {NAME_CAMELCASE} --download-dir ./data +``` + +You can then inspect the files at `./data`. 
When you're ready to load the data into +python, you can use the below snippet of code: + +```python +from llama_index.core import SimpleDirectoryReader +from llama_index.core.llama_dataset import LabelledRagDataset + +rag_dataset = LabelledRagDataset.from_json("./data/rag_dataset.json") +documents = SimpleDirectoryReader(input_dir="./data/source_files").load_data() +``` + +## Code Usage + +You can download the dataset to a directory, say `./data` directly in Python +as well. From there, you can use the convenient `RagEvaluatorPack` llamapack to +run your own LlamaIndex RAG pipeline with the `llamadataset`. + +```python +from llama_index.core.llama_dataset import download_llama_dataset +from llama_index.core.llama_pack import download_llama_pack +from llama_index.core import VectorStoreIndex + +# download and install dependencies for benchmark dataset +rag_dataset, documents = download_llama_dataset("{NAME_CAMELCASE}", "./data") + +# build basic RAG system +index = VectorStoreIndex.from_documents(documents=documents) +query_engine = index.as_query_engine() + +# evaluate using the RagEvaluatorPack +RagEvaluatorPack = download_llama_pack( + "RagEvaluatorPack", "./rag_evaluator_pack" +) +rag_evaluator_pack = RagEvaluatorPack( + rag_dataset=rag_dataset, query_engine=query_engine +) + +############################################################################ +# NOTE: If have a lower tier subscription for OpenAI API like Usage Tier 1 # +# then you'll need to use different batch_size and sleep_time_in_seconds. # +# For Usage Tier 1, settings that seemed to work well were batch_size=5, # +# and sleep_time_in_seconds=15 (as of December 2023.) 
# +############################################################################ + +benchmark_df = await rag_evaluator_pack.arun( + batch_size=20, # batches the number of openai api calls to make + sleep_time_in_seconds=1, # seconds to sleep before making an api call +) +``` diff --git a/llama-index-cli/llama_index/cli/command_line.py b/llama-index-cli/llama_index/cli/command_line.py index a04a20bd29776..73eda0c50f1a0 100644 --- a/llama-index-cli/llama_index/cli/command_line.py +++ b/llama-index-cli/llama_index/cli/command_line.py @@ -4,10 +4,10 @@ from llama_index.cli.rag import RagCLI, default_ragcli_persist_dir from llama_index.cli.upgrade import upgrade_dir, upgrade_file from llama_index.core.ingestion import IngestionCache, IngestionPipeline +from llama_index.core.download.module import LLAMA_HUB_URL from llama_index.core.llama_dataset.download import ( LLAMA_DATASETS_LFS_URL, LLAMA_DATASETS_SOURCE_FILES_GITHUB_TREE_URL, - LLAMA_HUB_URL, download_llama_dataset, ) from llama_index.core.llama_pack.download import ( diff --git a/llama-index-cli/llama_index/cli/upgrade/mappings.json b/llama-index-cli/llama_index/cli/upgrade/mappings.json index 86b7b3ae5417f..9ad04974d42bb 100644 --- a/llama-index-cli/llama_index/cli/upgrade/mappings.json +++ b/llama-index-cli/llama_index/cli/upgrade/mappings.json @@ -519,6 +519,7 @@ "TextEmbeddingsInference": "llama_index.embeddings.text_embeddings_inference", "UpTrainCallbackHandler": "llama_index.callbacks.uptrain", "deepeval_callback_handler": "llama_index.callbacks.deepeval", + "langfuse_callback_handler": "llama_index.callbacks.langfuse", "OpenInferenceCallbackHandler": "llama_index.callbacks.openinference", "WandbCallbackHandler": "llama_index.callbacks.wandb", "argilla_callback_handler": "llama_index.callbacks.argilla", diff --git a/llama-index-cli/pyproject.toml b/llama-index-cli/pyproject.toml index 0c68a47316e16..392231d2a0ce1 100644 --- a/llama-index-cli/pyproject.toml +++ b/llama-index-cli/pyproject.toml @@ -32,7 +32,7 
@@ maintainers = [ name = "llama-index-cli" packages = [{include = "llama_index/"}] readme = "README.md" -version = "0.1.6" +version = "0.1.7" [tool.poetry.dependencies] python = ">=3.8.1,<4.0" diff --git a/llama-index-core/llama_index/core/__init__.py b/llama-index-core/llama_index/core/__init__.py index 7a5e3bc828e92..53f85eb7b4cb1 100644 --- a/llama-index-core/llama_index/core/__init__.py +++ b/llama-index-core/llama_index/core/__init__.py @@ -1,6 +1,6 @@ """Init file of LlamaIndex.""" -__version__ = "0.10.14" +__version__ = "0.10.16" import logging from logging import NullHandler diff --git a/llama-index-core/llama_index/core/base/embeddings/base.py b/llama-index-core/llama_index/core/base/embeddings/base.py index 5fb65b2fdea5b..65d9760ad68e7 100644 --- a/llama-index-core/llama_index/core/base/embeddings/base.py +++ b/llama-index-core/llama_index/core/base/embeddings/base.py @@ -288,16 +288,13 @@ async def aget_text_embedding_batch( nested_embeddings = [] if show_progress: try: - from tqdm.auto import tqdm - - nested_embeddings = [ - await f - for f in tqdm( - asyncio.as_completed(embeddings_coroutines), - total=len(embeddings_coroutines), - desc="Generating embeddings", - ) - ] + from tqdm.asyncio import tqdm_asyncio + + nested_embeddings = await tqdm_asyncio.gather( + *embeddings_coroutines, + total=len(embeddings_coroutines), + desc="Generating embeddings", + ) except ImportError: nested_embeddings = await asyncio.gather(*embeddings_coroutines) else: diff --git a/llama-index-core/llama_index/core/base/llms/types.py b/llama-index-core/llama_index/core/base/llms/types.py index 66ad45b08de36..d771d75467493 100644 --- a/llama-index-core/llama_index/core/base/llms/types.py +++ b/llama-index-core/llama_index/core/base/llms/types.py @@ -1,5 +1,5 @@ from enum import Enum -from typing import Any, AsyncGenerator, Generator, Optional +from typing import Any, AsyncGenerator, Generator, Optional, Union from llama_index.core.bridge.pydantic import BaseModel, Field from 
llama_index.core.constants import DEFAULT_CONTEXT_WINDOW, DEFAULT_NUM_OUTPUTS @@ -14,6 +14,7 @@ class MessageRole(str, Enum): FUNCTION = "function" TOOL = "tool" CHATBOT = "chatbot" + MODEL = "model" # ===== Generic Model Input - Chat ===== @@ -27,6 +28,17 @@ class ChatMessage(BaseModel): def __str__(self) -> str: return f"{self.role.value}: {self.content}" + @classmethod + def from_str( + cls, + content: str, + role: Union[MessageRole, str] = MessageRole.USER, + **kwargs: Any, + ) -> "ChatMessage": + if isinstance(role, str): + role = MessageRole(role) + return cls(role=role, content=content, **kwargs) + # ===== Generic Model Output - Chat ===== class ChatResponse(BaseModel): diff --git a/llama-index-core/llama_index/core/callbacks/global_handlers.py b/llama-index-core/llama_index/core/callbacks/global_handlers.py index d915eb16451d7..5a49d193cd7b0 100644 --- a/llama-index-core/llama_index/core/callbacks/global_handlers.py +++ b/llama-index-core/llama_index/core/callbacks/global_handlers.py @@ -95,6 +95,17 @@ def create_global_handler(eval_mode: str, **eval_params: Any) -> BaseCallbackHan "Please install it using `pip install llama-index-callbacks-argilla`" ) handler = argilla_callback_handler(**eval_params) + elif eval_mode == "langfuse": + try: + from llama_index.callbacks.langfuse import ( + langfuse_callback_handler, + ) # pants: no-infer-dep + except ImportError: + raise ImportError( + "LangfuseCallbackHandler is not installed. 
" + "Please install it using `pip install llama-index-callbacks-langfuse`" + ) + handler = langfuse_callback_handler(**eval_params) else: raise ValueError(f"Eval mode {eval_mode} not supported.") diff --git a/llama-index-core/llama_index/core/chat_engine/types.py b/llama-index-core/llama_index/core/chat_engine/types.py index 3174622edbb59..124e1f5d6bca4 100644 --- a/llama-index-core/llama_index/core/chat_engine/types.py +++ b/llama-index-core/llama_index/core/chat_engine/types.py @@ -178,14 +178,19 @@ def response_gen(self) -> Generator[str, None, None]: self.response = self._unformatted_response.strip() async def async_response_gen(self) -> AsyncGenerator[str, None]: - while not self._is_done or not self._aqueue.empty(): - if not self._aqueue.empty(): - delta = self._aqueue.get_nowait() - self._unformatted_response += delta - yield delta + while True: + if not self._aqueue.empty() or not self._is_done: + try: + delta = await asyncio.wait_for(self._aqueue.get(), timeout=0.1) + except asyncio.TimeoutError: + if self._is_done: + break + continue + if delta is not None: + self._unformatted_response += delta + yield delta else: - await self._new_item_event.wait() # Wait until a new item is added - self._new_item_event.clear() # Clear the event for the next wait + break self.response = self._unformatted_response.strip() def print_response_stream(self) -> None: diff --git a/llama-index-core/llama_index/core/command_line/mappings.json b/llama-index-core/llama_index/core/command_line/mappings.json index 86b7b3ae5417f..9ad04974d42bb 100644 --- a/llama-index-core/llama_index/core/command_line/mappings.json +++ b/llama-index-core/llama_index/core/command_line/mappings.json @@ -519,6 +519,7 @@ "TextEmbeddingsInference": "llama_index.embeddings.text_embeddings_inference", "UpTrainCallbackHandler": "llama_index.callbacks.uptrain", "deepeval_callback_handler": "llama_index.callbacks.deepeval", + "langfuse_callback_handler": "llama_index.callbacks.langfuse", 
"OpenInferenceCallbackHandler": "llama_index.callbacks.openinference", "WandbCallbackHandler": "llama_index.callbacks.wandb", "argilla_callback_handler": "llama_index.callbacks.argilla", diff --git a/llama-index-core/llama_index/core/download/dataset.py b/llama-index-core/llama_index/core/download/dataset.py index 8900107626cdb..5739897598285 100644 --- a/llama-index-core/llama_index/core/download/dataset.py +++ b/llama-index-core/llama_index/core/download/dataset.py @@ -6,7 +6,6 @@ from typing import Any, Dict, List, Optional, Union import tqdm -from llama_index.core.download.module import LLAMA_HUB_URL from llama_index.core.download.utils import ( get_file_content, get_file_content_bytes, @@ -14,6 +13,12 @@ initialize_directory, ) +LLAMA_INDEX_CONTENTS_URL = ( + f"https://raw.githubusercontent.com/run-llama/llama_index/main" +) +LLAMA_DATASETS_PATH = "/llama-datasets" +LLAMA_DATASETS_URL = LLAMA_INDEX_CONTENTS_URL + LLAMA_DATASETS_PATH + LLAMA_DATASETS_LFS_URL = ( f"https://media.githubusercontent.com/media/run-llama/llama-datasets/main" ) @@ -91,7 +96,8 @@ def get_dataset_info( source_files = [] if dataset_class_name == "LabelledRagDataset": source_files = get_source_files_list( - str(remote_source_dir_path), f"/{dataset_id}/{source_files_path}" + str(remote_source_dir_path), + f"/llama_datasets/{dataset_id}/{source_files_path}", ) # create cache dir if needed @@ -141,7 +147,7 @@ def download_dataset_and_source_files( base_file_name = _resolve_dataset_file_name(dataset_class_name) dataset_raw_content, _ = get_file_content( - str(remote_lfs_dir_path), f"/{dataset_id}/{base_file_name}" + str(remote_lfs_dir_path), f"/llama_datasets/{dataset_id}/{base_file_name}" ) with open(f"{module_path}/{base_file_name}", "w") as f: @@ -158,7 +164,7 @@ def download_dataset_and_source_files( if ".pdf" in source_file: source_file_raw_content_bytes, _ = get_file_content_bytes( str(remote_lfs_dir_path), - f"/{dataset_id}/{source_files_dir_path}/{source_file}", + 
f"/llama_datasets/{dataset_id}/{source_files_dir_path}/{source_file}", ) with open( f"{module_path}/{source_files_dir_path}/{source_file}", "wb" @@ -167,7 +173,7 @@ def download_dataset_and_source_files( else: source_file_raw_content, _ = get_file_content( str(remote_lfs_dir_path), - f"/{dataset_id}/{source_files_dir_path}/{source_file}", + f"/llama_datasets/{dataset_id}/{source_files_dir_path}/{source_file}", ) with open( f"{module_path}/{source_files_dir_path}/{source_file}", "w" @@ -177,7 +183,7 @@ def download_dataset_and_source_files( def download_llama_dataset( dataset_class: str, - llama_hub_url: str = LLAMA_HUB_URL, + llama_datasets_url: str = LLAMA_DATASETS_URL, llama_datasets_lfs_url: str = LLAMA_DATASETS_LFS_URL, llama_datasets_source_files_tree_url: str = LLAMA_DATASETS_SOURCE_FILES_GITHUB_TREE_URL, refresh_cache: bool = False, @@ -218,7 +224,7 @@ def download_llama_dataset( # fetch info from library.json file dataset_info = get_dataset_info( local_dir_path=dirpath, - remote_dir_path=llama_hub_url, + remote_dir_path=llama_datasets_url, remote_source_dir_path=llama_datasets_source_files_tree_url, dataset_class=dataset_class, refresh_cache=refresh_cache, diff --git a/llama-index-core/llama_index/core/embeddings/multi_modal_base.py b/llama-index-core/llama_index/core/embeddings/multi_modal_base.py index 1c41993e3762a..2b8863d2c5b1f 100644 --- a/llama-index-core/llama_index/core/embeddings/multi_modal_base.py +++ b/llama-index-core/llama_index/core/embeddings/multi_modal_base.py @@ -155,16 +155,13 @@ async def aget_image_embedding_batch( nested_embeddings = [] if show_progress: try: - from tqdm.auto import tqdm - - nested_embeddings = [ - await f - for f in tqdm( - asyncio.as_completed(embeddings_coroutines), - total=len(embeddings_coroutines), - desc="Generating image embeddings", - ) - ] + from tqdm.asyncio import tqdm_asyncio + + nested_embeddings = await tqdm_asyncio.gather( + *embeddings_coroutines, + total=len(embeddings_coroutines), + 
desc="Generating image embeddings", + ) except ImportError: nested_embeddings = await asyncio.gather(*embeddings_coroutines) else: diff --git a/llama-index-core/llama_index/core/indices/base.py b/llama-index-core/llama_index/core/indices/base.py index a657a988526ed..a35797a4a1da6 100644 --- a/llama-index-core/llama_index/core/indices/base.py +++ b/llama-index-core/llama_index/core/indices/base.py @@ -85,6 +85,9 @@ def __init__( objects = objects or [] self._object_map = {obj.index_id: obj.obj for obj in objects} + for obj in objects: + obj.obj = None # clear the object to avoid serialization issues + with self._callback_manager.as_trace("index_construction"): if index_struct is None: nodes = nodes or [] diff --git a/llama-index-core/llama_index/core/indices/knowledge_graph/base.py b/llama-index-core/llama_index/core/indices/knowledge_graph/base.py index 86f29a5de8303..b3f9f0013dc3a 100644 --- a/llama-index-core/llama_index/core/indices/knowledge_graph/base.py +++ b/llama-index-core/llama_index/core/indices/knowledge_graph/base.py @@ -259,10 +259,9 @@ def upsert_triplet( self._graph_store.upsert_triplet(*triplet) triplet_str = str(triplet) if include_embeddings: - set_embedding = self._service_context.embed_model.get_text_embedding( - triplet_str - ) + set_embedding = self._embed_model.get_text_embedding(triplet_str) self._index_struct.add_to_embedding_dict(str(triplet), set_embedding) + self._storage_context.index_store.add_index_struct(self._index_struct) def add_node(self, keywords: List[str], node: BaseNode) -> None: """Add node. 
@@ -300,10 +299,9 @@ def upsert_triplet_and_node( self.add_node([subj, obj], node) triplet_str = str(triplet) if include_embeddings: - set_embedding = self._service_context.embed_model.get_text_embedding( - triplet_str - ) + set_embedding = self._embed_model.get_text_embedding(triplet_str) self._index_struct.add_to_embedding_dict(str(triplet), set_embedding) + self._storage_context.index_store.add_index_struct(self._index_struct) def _delete_node(self, node_id: str, **delete_kwargs: Any) -> None: """Delete a node.""" diff --git a/llama-index-core/llama_index/core/llama_dataset/download.py b/llama-index-core/llama_index/core/llama_dataset/download.py index e17c5657be675..29622e7e4dadd 100644 --- a/llama-index-core/llama_index/core/llama_dataset/download.py +++ b/llama-index-core/llama_index/core/llama_dataset/download.py @@ -4,10 +4,10 @@ from llama_index.core.download.dataset import ( LLAMA_DATASETS_LFS_URL, LLAMA_DATASETS_SOURCE_FILES_GITHUB_TREE_URL, + LLAMA_DATASETS_URL, ) from llama_index.core.download.dataset import download_llama_dataset as download from llama_index.core.download.module import ( - LLAMA_HUB_URL, MODULE_TYPE, track_download, ) @@ -35,7 +35,7 @@ def _resolve_dataset_class(filename: str) -> Type[BaseLlamaDataset]: def download_llama_dataset( llama_dataset_class: str, download_dir: str, - llama_hub_url: str = LLAMA_HUB_URL, + llama_datasets_url: str = LLAMA_DATASETS_URL, llama_datasets_lfs_url: str = LLAMA_DATASETS_LFS_URL, llama_datasets_source_files_tree_url: str = LLAMA_DATASETS_SOURCE_FILES_GITHUB_TREE_URL, show_progress: bool = False, @@ -67,12 +67,12 @@ def download_llama_dataset( """ filenames: Tuple[str, str] = download( llama_dataset_class, - llama_hub_url=llama_hub_url, + llama_datasets_url=llama_datasets_url, llama_datasets_lfs_url=llama_datasets_lfs_url, llama_datasets_source_files_tree_url=llama_datasets_source_files_tree_url, refresh_cache=True, custom_path=download_dir, - library_path="llama_datasets/library.json", + 
library_path="library.json", disable_library_cache=True, override_path=True, show_progress=show_progress, diff --git a/llama-index-core/llama_index/core/program/multi_modal_llm_program.py b/llama-index-core/llama_index/core/program/multi_modal_llm_program.py index 79621a3d952e4..b42604af24bed 100644 --- a/llama-index-core/llama_index/core/program/multi_modal_llm_program.py +++ b/llama-index-core/llama_index/core/program/multi_modal_llm_program.py @@ -36,7 +36,8 @@ def __init__( @classmethod def from_defaults( cls, - output_parser: PydanticOutputParser, + output_parser: Optional[PydanticOutputParser] = None, + output_cls: Optional[Type[BaseModel]] = None, prompt_template_str: Optional[str] = None, prompt: Optional[PromptTemplate] = None, multi_modal_llm: Optional[MultiModalLLM] = None, @@ -64,6 +65,12 @@ def from_defaults( raise ValueError("Must provide either prompt or prompt_template_str.") if prompt_template_str is not None: prompt = PromptTemplate(prompt_template_str) + + if output_parser is None: + if output_cls is None: + raise ValueError("Must provide either output_cls or output_parser.") + output_parser = PydanticOutputParser(output_cls=output_cls) + return cls( output_parser, prompt=cast(PromptTemplate, prompt), diff --git a/llama-index-core/llama_index/core/prompts/base.py b/llama-index-core/llama_index/core/prompts/base.py index c791076351976..8d3a7a6181d3e 100644 --- a/llama-index-core/llama_index/core/prompts/base.py +++ b/llama-index-core/llama_index/core/prompts/base.py @@ -246,6 +246,20 @@ def __init__( function_mappings=function_mappings, ) + @classmethod + def from_messages( + cls, + message_templates: Union[List[Tuple[str, str]], List[ChatMessage]], + **kwargs: Any, + ) -> "ChatPromptTemplate": + """From messages.""" + if isinstance(message_templates[0], tuple): + message_templates = [ + ChatMessage.from_str(role=role, content=content) + for role, content in message_templates + ] + return cls(message_templates=message_templates, **kwargs) + def 
partial_format(self, **kwargs: Any) -> "ChatPromptTemplate": prompt = deepcopy(self) prompt.kwargs.update(kwargs) diff --git a/llama-index-core/llama_index/core/prompts/chat_prompts.py b/llama-index-core/llama_index/core/prompts/chat_prompts.py index 3aa6e581b1360..ac5b0cd2d9843 100644 --- a/llama-index-core/llama_index/core/prompts/chat_prompts.py +++ b/llama-index-core/llama_index/core/prompts/chat_prompts.py @@ -69,7 +69,7 @@ "1. **Rewrite** an original answer using the new context.\n" "2. **Repeat** the original answer if the new context isn't useful.\n" "Never reference the original answer or context directly in your answer.\n" - "When in doubt, just repeat the original answer." + "When in doubt, just repeat the original answer.\n" "New Context: {context_msg}\n" "Query: {query_str}\n" "Original Answer: {existing_answer}\n" diff --git a/llama-index-core/llama_index/core/query_engine/jsonalyze_query_engine.py b/llama-index-core/llama_index/core/query_engine/jsonalyze_query_engine.py index e6edc6f8670bc..c2b81afbf9e1e 100644 --- a/llama-index-core/llama_index/core/query_engine/jsonalyze_query_engine.py +++ b/llama-index-core/llama_index/core/query_engine/jsonalyze_query_engine.py @@ -80,7 +80,7 @@ def default_jsonalyzer( try: # Load list of dictionaries into SQLite database db[table_name].insert_all(list_of_dict) - except sqlite_utils.db_exceptions.IntegrityError as exc: + except sqlite_utils.utils.sqlite3.IntegrityError as exc: print_text(f"Error inserting into table {table_name}, expected format:") print_text("[{col1: val1, col2: val2, ...}, ...]") raise ValueError("Invalid list_of_dict") from exc @@ -105,7 +105,7 @@ def default_jsonalyzer( try: # Execute the SQL query results = list(db.query(sql_query)) - except sqlite_utils.db_exceptions.OperationalError as exc: + except sqlite_utils.utils.sqlite3.OperationalError as exc: print_text(f"Error executing query: {sql_query}") raise ValueError("Invalid query") from exc @@ -148,7 +148,7 @@ async def 
async_default_jsonalyzer( try: # Load list of dictionaries into SQLite database db[table_name].insert_all(list_of_dict) - except sqlite_utils.db_exceptions.IntegrityError as exc: + except sqlite_utils.utils.sqlite3.IntegrityError as exc: print_text(f"Error inserting into table {table_name}, expected format:") print_text("[{col1: val1, col2: val2, ...}, ...]") raise ValueError("Invalid list_of_dict") from exc @@ -173,7 +173,7 @@ async def async_default_jsonalyzer( try: # Execute the SQL query results = list(db.query(sql_query)) - except sqlite_utils.db_exceptions.OperationalError as exc: + except sqlite_utils.utils.sqlite3.OperationalError as exc: print_text(f"Error executing query: {sql_query}") raise ValueError("Invalid query") from exc diff --git a/llama-index-core/llama_index/core/readers/file/base.py b/llama-index-core/llama_index/core/readers/file/base.py index 585b13f723211..a20e7d2b7e5db 100644 --- a/llama-index-core/llama_index/core/readers/file/base.py +++ b/llama-index-core/llama_index/core/readers/file/base.py @@ -56,6 +56,21 @@ def _try_loading_included_file_formats() -> Dict[str, Type[BaseReader]]: return default_file_reader_cls +def _format_file_timestamp(timestamp: float) -> Optional[str]: + """Format file timestamp to a %Y-%m-%d string. 
+ + Args: + timestamp (float): timestamp in float + + Returns: + str: formatted timestamp + """ + try: + return datetime.fromtimestamp(timestamp).strftime("%Y-%m-%d") + except Exception: + return None + + def default_file_metadata_func( file_path: str, fs: Optional[fsspec.AbstractFileSystem] = None ) -> Dict: @@ -66,20 +81,10 @@ def default_file_metadata_func( """ fs = fs or get_default_fs() stat_result = fs.stat(file_path) - creation_date = stat_result.get("created") - last_modified_date = stat_result.get("mtime") - last_accessed_date = stat_result.get("atime") - try: - creation_date = datetime.fromtimestamp(creation_date).strftime("%Y-%m-%d") - last_modified_date = datetime.fromtimestamp(last_modified_date).strftime( - "%Y-%m-%d" - ) - last_accessed_date = datetime.fromtimestamp(last_accessed_date).strftime( - "%Y-%m-%d" - ) - except Exception: - pass - return { + creation_date = _format_file_timestamp(stat_result.get("created")) + last_modified_date = _format_file_timestamp(stat_result.get("mtime")) + last_accessed_date = _format_file_timestamp(stat_result.get("atime")) + default_meta = { "file_path": file_path, "file_name": stat_result["name"], "file_type": mimetypes.guess_type(file_path)[0], @@ -89,6 +94,13 @@ def default_file_metadata_func( "last_accessed_date": last_accessed_date, } + # Return not null value + return { + meta_key: meta_value + for meta_key, meta_value in default_meta.items() + if meta_value is not None + } + class _DefaultFileMetadataFunc: """ @@ -237,7 +249,9 @@ def _add_files(self, input_dir: Path) -> List[Path]: # in glob for backwards compatibility. 
ref = Path(ref) is_dir = self.fs.isdir(ref) - skip_because_hidden = self.exclude_hidden and self.is_hidden(ref) + skip_because_hidden = self.exclude_hidden and self.is_hidden( + ref.relative_to(input_dir.absolute()) + ) skip_because_bad_ext = ( self.required_exts is not None and ref.suffix not in self.required_exts ) diff --git a/llama-index-core/llama_index/core/retrievers/fusion_retriever.py b/llama-index-core/llama_index/core/retrievers/fusion_retriever.py index d5de8373b1252..d1425fcc9a4e6 100644 --- a/llama-index-core/llama_index/core/retrievers/fusion_retriever.py +++ b/llama-index-core/llama_index/core/retrievers/fusion_retriever.py @@ -130,7 +130,11 @@ def _simple_fusion( for nodes_with_scores in results.values(): for node_with_score in nodes_with_scores: text = node_with_score.node.get_content() - all_nodes[text] = node_with_score + if text in all_nodes: + max_score = max(node_with_score.score, all_nodes[text].score) + all_nodes[text].score = max_score + else: + all_nodes[text] = node_with_score return sorted(all_nodes.values(), key=lambda x: x.score or 0.0, reverse=True) diff --git a/llama-index-core/llama_index/core/tools/tool_spec/load_and_search/README.md b/llama-index-core/llama_index/core/tools/tool_spec/load_and_search/README.md index fad3c0db7b175..53f2ce8d9ec42 100644 --- a/llama-index-core/llama_index/core/tools/tool_spec/load_and_search/README.md +++ b/llama-index-core/llama_index/core/tools/tool_spec/load_and_search/README.md @@ -1,5 +1,9 @@ # LoadAndSearch Tool +```bash +pip install llama-index-tools-wikipedia +``` + This Tool Spec is intended to wrap other tools, allowing the Agent to perform separate loading and reading of data. This is very useful for when tools return information larger than or closer to the size of the context window. 
## Usage @@ -11,7 +15,7 @@ from llama_index.core.tools.tool_spec.load_and_search import ( LoadAndSearchToolSpec, ) from llama_index.core.agent import OpenAIAgent -from llama_hub.tools.wikipedia.base import WikipediaToolSpec +from llama_index.tools.wikipedia.base import WikipediaToolSpec wiki_spec = WikipediaToolSpec() diff --git a/llama-index-core/llama_index/core/utilities/gemini_utils.py b/llama-index-core/llama_index/core/utilities/gemini_utils.py new file mode 100644 index 0000000000000..3ed4df6c848d7 --- /dev/null +++ b/llama-index-core/llama_index/core/utilities/gemini_utils.py @@ -0,0 +1,52 @@ +"""Global Gemini Utilities (shared between Gemini LLM and Vertex).""" + +from collections.abc import Sequence +from typing import Dict + +from llama_index.core.base.llms.types import ChatMessage, MessageRole + +ROLES_TO_GEMINI: Dict[MessageRole, MessageRole] = { + MessageRole.USER: MessageRole.USER, + MessageRole.ASSISTANT: MessageRole.MODEL, + ## Gemini only has user and model roles. Put the rest in user role. + MessageRole.SYSTEM: MessageRole.USER, +} +ROLES_FROM_GEMINI: Dict[MessageRole, MessageRole] = { + ## Gemini only has user and model roles. 
+ MessageRole.USER: MessageRole.USER, + MessageRole.MODEL: MessageRole.ASSISTANT, +} + + +def merge_neighboring_same_role_messages( + messages: Sequence[ChatMessage], +) -> Sequence[ChatMessage]: + # Gemini does not support multiple messages of the same role in a row, so we merge them + merged_messages = [] + i = 0 + + while i < len(messages): + current_message = messages[i] + # Initialize merged content with current message content + merged_content = [current_message.content] + + # Check if the next message exists and has the same role + while ( + i + 1 < len(messages) + and ROLES_TO_GEMINI[messages[i + 1].role] + == ROLES_TO_GEMINI[current_message.role] + ): + i += 1 + next_message = messages[i] + merged_content.extend([next_message.content]) + + # Create a new ChatMessage or similar object with merged content + merged_message = ChatMessage( + role=ROLES_TO_GEMINI[current_message.role], + content="\n".join([str(msg_content) for msg_content in merged_content]), + additional_kwargs=current_message.additional_kwargs, + ) + merged_messages.append(merged_message) + i += 1 + + return merged_messages diff --git a/llama-index-core/llama_index/core/vector_stores/__init__.py b/llama-index-core/llama_index/core/vector_stores/__init__.py index c6ce1525becd9..713c7f859a1a8 100644 --- a/llama-index-core/llama_index/core/vector_stores/__init__.py +++ b/llama-index-core/llama_index/core/vector_stores/__init__.py @@ -1,6 +1,5 @@ """Vector stores.""" - from llama_index.core.vector_stores.simple import SimpleVectorStore from llama_index.core.vector_stores.types import ( ExactMatchFilter, @@ -8,8 +7,10 @@ FilterOperator, MetadataFilter, MetadataFilters, + MetadataInfo, VectorStoreQuery, VectorStoreQueryResult, + VectorStoreInfo, ) __all__ = [ @@ -17,8 +18,10 @@ "VectorStoreQueryResult", "MetadataFilters", "MetadataFilter", + "MetadataInfo", "ExactMatchFilter", "FilterCondition", "FilterOperator", "SimpleVectorStore", + "VectorStoreInfo", ] diff --git 
a/llama-index-core/pyproject.toml b/llama-index-core/pyproject.toml index ffa6a94e30e90..766f8c69c9560 100644 --- a/llama-index-core/pyproject.toml +++ b/llama-index-core/pyproject.toml @@ -43,7 +43,7 @@ name = "llama-index-core" packages = [{include = "llama_index"}] readme = "README.md" repository = "https://github.com/run-llama/llama_index" -version = "0.10.14" +version = "0.10.16" [tool.poetry.dependencies] SQLAlchemy = {extras = ["asyncio"], version = ">=1.4.49"} diff --git a/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/BUILD b/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/BUILD new file mode 100644 index 0000000000000..0896ca890d8bf --- /dev/null +++ b/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/BUILD @@ -0,0 +1,3 @@ +poetry_requirements( + name="poetry", +) diff --git a/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/Makefile b/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/Makefile new file mode 100644 index 0000000000000..b9eab05aa3706 --- /dev/null +++ b/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/Makefile @@ -0,0 +1,17 @@ +GIT_ROOT ?= $(shell git rev-parse --show-toplevel) + +help: ## Show all Makefile targets. + @grep -E '^[a-zA-Z_-]+:.*?## .*$$' $(MAKEFILE_LIST) | awk 'BEGIN {FS = ":.*?## "}; {printf "\033[33m%-30s\033[0m %s\n", $$1, $$2}' + +format: ## Run code autoformatters (black). + pre-commit install + git ls-files | xargs pre-commit run black --files + +lint: ## Run linters: pre-commit (black, ruff, codespell) and mypy + pre-commit install && git ls-files | xargs pre-commit run --show-diff-on-failure --files + +test: ## Run tests via pytest. + pytest tests + +watch-docs: ## Build and watch documentation. 
+ sphinx-autobuild docs/ docs/_build/html --open-browser --watch $(GIT_ROOT)/llama_index/ diff --git a/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/README.md b/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/README.md new file mode 100644 index 0000000000000..4048b24540065 --- /dev/null +++ b/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/README.md @@ -0,0 +1,18 @@ +# LlamaIndex Callbacks Integration: Langfuse + +[Langfuse](https://langfuse.com/docs) is an open source LLM engineering platform to help teams collaboratively debug, analyze and iterate on their LLM Applications. With the Langfuse integration, you can seamlessly track and monitor performance, traces, and metrics of your LlamaIndex application. Detailed traces of the LlamaIndex context augmentation and the LLM querying processes are captured and can be inspected directly in the Langfuse UI. + +#### Usage Pattern + +```python +from llama_index.core import set_global_handler + +# Make sure you've installed the 'llama-index-callbacks-langfuse' integration package. + +# NOTE: Set your environment variables 'LANGFUSE_SECRET_KEY', 'LANGFUSE_PUBLIC_KEY' and 'LANGFUSE_HOST' +# as shown in your langfuse.com project settings. 
+ +set_global_handler("langfuse") +``` + +![langfuse-tracing](https://static.langfuse.com/llamaindex-langfuse-docs.gif) diff --git a/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/llama_index/callbacks/langfuse/BUILD b/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/llama_index/callbacks/langfuse/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/llama_index/callbacks/langfuse/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/llama_index/callbacks/langfuse/__init__.py b/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/llama_index/callbacks/langfuse/__init__.py new file mode 100644 index 0000000000000..b060aaf4c8446 --- /dev/null +++ b/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/llama_index/callbacks/langfuse/__init__.py @@ -0,0 +1,3 @@ +from llama_index.callbacks.langfuse.base import langfuse_callback_handler + +__all__ = ["langfuse_callback_handler"] diff --git a/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/llama_index/callbacks/langfuse/base.py b/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/llama_index/callbacks/langfuse/base.py new file mode 100644 index 0000000000000..381b77ccc69a9 --- /dev/null +++ b/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/llama_index/callbacks/langfuse/base.py @@ -0,0 +1,11 @@ +from typing import Any + +from llama_index.core.callbacks.base_handler import BaseCallbackHandler + +from langfuse.llama_index import LlamaIndexCallbackHandler + + +def langfuse_callback_handler(**eval_params: Any) -> BaseCallbackHandler: + return LlamaIndexCallbackHandler( + **eval_params, sdk_integration="llama-index_set-global-handler" + ) diff --git a/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/pyproject.toml 
b/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/pyproject.toml new file mode 100644 index 0000000000000..132031548ecf0 --- /dev/null +++ b/llama-index-integrations/callbacks/llama-index-callbacks-langfuse/pyproject.toml @@ -0,0 +1,64 @@ +[build-system] +build-backend = "poetry.core.masonry.api" +requires = ["poetry-core"] + +[tool.codespell] +check-filenames = true +check-hidden = true +ignore-words-list = "Gere" +skip = "*.csv,*.html,*.json,*.jsonl,*.pdf,*.txt,*.ipynb" + +[tool.llamahub] +contains_example = false +import_path = "llama_index.callbacks.langfuse" + +[tool.llamahub.class_authors] +LangfuseCallbackHandler = "llama-index" + +[tool.mypy] +disallow_untyped_defs = true +exclude = ["_static", "build", "examples", "notebooks", "venv"] +ignore_missing_imports = true +python_version = "3.8" + +[tool.poetry] +authors = ["Your Name "] +description = "llama-index callbacks langfuse integration" +exclude = ["**/BUILD"] +license = "MIT" +name = "llama-index-callbacks-langfuse" +readme = "README.md" +version = "0.1.2" + +[tool.poetry.dependencies] +python = ">=3.8.1,<4.0" +llama-index-core = "^0.10.8" +langfuse = "^2.18.0" + +[tool.poetry.group.dev.dependencies] +ipython = "8.10.0" +jupyter = "^1.0.0" +mypy = "0.991" +pre-commit = "3.2.0" +pylint = "2.15.10" +pytest = "7.2.1" +pytest-mock = "3.11.1" +ruff = "0.0.292" +tree-sitter-languages = "^1.8.0" +types-Deprecated = ">=0.1.0" +types-PyYAML = "^6.0.12.12" +types-protobuf = "^4.24.0.4" +types-redis = "4.5.5.0" +types-requests = "2.28.11.8" +types-setuptools = "67.1.0.0" + +[tool.poetry.group.dev.dependencies.black] +extras = ["jupyter"] +version = "<=23.9.1,>=23.7.0" + +[tool.poetry.group.dev.dependencies.codespell] +extras = ["toml"] +version = ">=v2.2.6" + +[[tool.poetry.packages]] +include = "llama_index/" diff --git a/llama-index-integrations/callbacks/llama-index-callbacks-uptrain/README.md b/llama-index-integrations/callbacks/llama-index-callbacks-uptrain/README.md index 
f9c12773deaa9..e2f48e4c2338e 100644 --- a/llama-index-integrations/callbacks/llama-index-callbacks-uptrain/README.md +++ b/llama-index-integrations/callbacks/llama-index-callbacks-uptrain/README.md @@ -1,8 +1,8 @@ # LlamaIndex Callbacks Integration: UpTrain -UpTrain is an open-source tool to evaluate and monitor the performance of language models. It provides a set of pre-built evaluations to assess the quality of responses generated by the model. Once you add UpTrainCallbackHandler to your existing LlamaIndex pipeline, it will take care of sending the generated responses to the UpTrain Managed Service for evaluations and display the results in the output. +UpTrain ([github](https://github.com/uptrain-ai/uptrain) || [website](https://uptrain.ai/) || [docs](https://docs.uptrain.ai/getting-started/introduction)) is an open-source platform to evaluate and improve Generative AI applications. It provides grades for 20+ preconfigured checks (covering language, code, embedding use cases), performs root cause analysis on failure cases and gives insights on how to resolve them. Once you add UpTrainCallbackHandler to your existing LlamaIndex pipeline, it will automatically capture the right data, run evaluations and display the results in the output. -Three additional evaluations for Llamaindex have been introduced, complementing existing ones. These evaluations run automatically, with results displayed in the output. More details on UpTrain's evaluations can be found [here](https://github.com/uptrain-ai/uptrain?tab=readme-ov-file#pre-built-evaluations-we-offer-). +More details on UpTrain's evaluations can be found [here](https://github.com/uptrain-ai/uptrain?tab=readme-ov-file#pre-built-evaluations-we-offer-). 
Selected operators from the LlamaIndex pipeline are highlighted for demonstration: @@ -10,26 +10,26 @@ Selected operators from the LlamaIndex pipeline are highlighted for demonstratio The RAG query engine plays a crucial role in retrieving context and generating responses. To ensure its performance and response quality, we conduct the following evaluations: -- **Context Relevance**: Determines if the context extracted from the query is relevant to the response. -- **Factual Accuracy**: Assesses if the LLM is hallcuinating or providing incorrect information. -- **Response Completeness**: Checks if the response contains all the information requested by the query. +- **[Context Relevance](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-relevance)**: Determines if the context extracted from the query is relevant to the response. +- **[Factual Accuracy](https://docs.uptrain.ai/predefined-evaluations/context-awareness/factual-accuracy)**: Assesses if the LLM is hallucinating or providing incorrect information. +- **[Response Completeness](https://docs.uptrain.ai/predefined-evaluations/response-quality/response-completeness)**: Checks if the response contains all the information requested by the query. ## 2. **Sub-Question Query Generation Evaluation**: -The SubQuestionQueryGeneration operator decomposes a question into sub-questions, generating responses for each using a RAG query engine. Given the complexity, we include the previous evaluations and add: +The SubQuestionQueryGeneration operator decomposes a question into sub-questions, generating responses for each using a RAG query engine. To evaluate the performance of SubQuery module, we add another check as well as run the above three for all the sub-queries: -- **Sub Query Completeness**: Assures that the sub-questions accurately and comprehensively cover the original query. 
+- **[Sub Query Completeness](https://docs.uptrain.ai/predefined-evaluations/query-quality/sub-query-completeness)**: Assures that the sub-questions accurately and comprehensively cover the original query. ## 3. **Re-Ranking Evaluations**: -Re-ranking involves reordering nodes based on relevance to the query and choosing top n nodes. Different evaluations are performed based on the number of nodes returned after re-ranking. +Re-ranking involves reordering nodes based on relevance to the query and choosing the top n nodes. Different evaluations are performed based on the number of nodes returned after re-ranking. a. Same Number of Nodes -- **Context Reranking**: Checks if the order of re-ranked nodes is more relevant to the query than the original order. +- **[Context Reranking](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-reranking)**: Checks if the order of re-ranked nodes is more relevant to the query than the original order. b. Different Number of Nodes: -- **Context Conciseness**: Examines whether the reduced number of nodes still provides all the required information. +- **[Context Conciseness](https://docs.uptrain.ai/predefined-evaluations/context-awareness/context-conciseness)**: Examines whether the reduced number of nodes still provides all the required information. These evaluations collectively ensure the robustness and effectiveness of the RAG query engine, SubQuestionQueryGeneration operator, and the re-ranking process in the LlamaIndex pipeline. 
diff --git a/llama-index-integrations/callbacks/llama-index-callbacks-uptrain/llama_index/callbacks/uptrain/base.py b/llama-index-integrations/callbacks/llama-index-callbacks-uptrain/llama_index/callbacks/uptrain/base.py index 69ab6de8e509b..b842c6de18ea5 100644 --- a/llama-index-integrations/callbacks/llama-index-callbacks-uptrain/llama_index/callbacks/uptrain/base.py +++ b/llama-index-integrations/callbacks/llama-index-callbacks-uptrain/llama_index/callbacks/uptrain/base.py @@ -118,7 +118,7 @@ def uptrain_evaluate( if column == "question": print(f"\nQuestion: {row[column]}") elif column == "response": - print(f"Response: {row[column]}") + print(f"Response: {row[column]}\n") elif column.startswith("score"): if column in score_name_map: print(f"{score_name_map[column]}: {row[column]}") diff --git a/llama-index-integrations/callbacks/llama-index-callbacks-uptrain/pyproject.toml b/llama-index-integrations/callbacks/llama-index-callbacks-uptrain/pyproject.toml index 903e9f86fa358..d8b310ef645c0 100644 --- a/llama-index-integrations/callbacks/llama-index-callbacks-uptrain/pyproject.toml +++ b/llama-index-integrations/callbacks/llama-index-callbacks-uptrain/pyproject.toml @@ -21,18 +21,18 @@ ignore_missing_imports = true python_version = "3.8" [tool.poetry] -authors = ["Your Name "] +authors = ["Dhruv Chawla "] description = "llama-index callbacks uptrain integration" exclude = ["**/BUILD"] license = "MIT" name = "llama-index-callbacks-uptrain" readme = "README.md" -version = "0.1.1" +version = "0.1.2" [tool.poetry.dependencies] python = ">=3.8.1,<4.0" -llama-index-core = "0.10.0" -uptrain = ">=0.5.0" +llama-index-core = ">=0.10.0" +uptrain = ">=0.6.6" [tool.poetry.group.dev.dependencies] ipython = "8.10.0" diff --git a/llama-index-integrations/embeddings/llama-index-embeddings-bedrock/llama_index/embeddings/bedrock/base.py b/llama-index-integrations/embeddings/llama-index-embeddings-bedrock/llama_index/embeddings/bedrock/base.py index ac5faa6d1c1b2..97262078c3d1b 
100644 --- a/llama-index-integrations/embeddings/llama-index-embeddings-bedrock/llama_index/embeddings/bedrock/base.py +++ b/llama-index-integrations/embeddings/llama-index-embeddings-bedrock/llama_index/embeddings/bedrock/base.py @@ -3,7 +3,7 @@ import warnings from enum import Enum from deprecated import deprecated -from typing import Any, Callable, Dict, List, Literal, Optional, Sequence +from typing import Any, Callable, Dict, List, Literal, Optional, Sequence, Union from llama_index.core.base.embeddings.base import BaseEmbedding, Embedding from llama_index.core.base.llms.types import ChatMessage @@ -27,10 +27,12 @@ class Models(str, Enum): PROVIDER_SPECIFIC_IDENTIFIERS = { PROVIDERS.AMAZON.value: { - "get_embeddings_func": lambda r: r.get("embedding"), + "get_embeddings_func": lambda r, isbatch: r.get("embedding"), }, PROVIDERS.COHERE.value: { - "get_embeddings_func": lambda r: r.get("embeddings")[0], + "get_embeddings_func": lambda r, isbatch: ( + r.get("embeddings") if isbatch else r.get("embeddings")[0] + ), }, } @@ -317,7 +319,18 @@ def from_credentials( verbose=verbose, ) - def _get_embedding(self, payload: str, type: Literal["text", "query"]) -> Embedding: + def _get_embedding( + self, payload: Union[str, List[str]], type: Literal["text", "query"] + ) -> Union[Embedding, List[Embedding]]: + """Get the embedding for the given payload. + + Args: + payload (Union[str, List[str]]): The text or list of texts for which the embeddings are to be obtained. + type (Literal["text", "query"]): The type of the payload. It can be either "text" or "query". + + Returns: + Union[Embedding, List[Embedding]]: The embedding or list of embeddings for the given payload. If the payload is a list of strings, then the response will be a list of embeddings. 
+ """ if self._client is None: self.set_credentials() @@ -338,7 +351,7 @@ def _get_embedding(self, payload: str, type: Literal["text", "query"]) -> Embedd identifiers = PROVIDER_SPECIFIC_IDENTIFIERS.get(provider, None) if identifiers is None: raise ValueError("Provider not supported") - return identifiers["get_embeddings_func"](resp) + return identifiers["get_embeddings_func"](resp, isinstance(payload, list)) def _get_query_embedding(self, query: str) -> Embedding: return self._get_embedding(query, "query") @@ -346,8 +359,17 @@ def _get_query_embedding(self, query: str) -> Embedding: def _get_text_embedding(self, text: str) -> Embedding: return self._get_embedding(text, "text") + def _get_text_embeddings(self, texts: List[str]) -> List[Embedding]: + provider = self.model.split(".")[0] + if provider == PROVIDERS.COHERE: + return self._get_embedding(texts, "text") + return super()._get_text_embeddings(texts) + def _get_request_body( - self, provider: str, payload: str, type: Literal["text", "query"] + self, + provider: str, + payload: Union[str, List[str]], + input_type: Literal["text", "query"], ) -> Any: """Build the request body as per the provider. Currently supported providers are amazon, cohere. 
@@ -366,6 +388,8 @@ def _get_request_body( """ if provider == PROVIDERS.AMAZON: + if isinstance(payload, list): + raise ValueError("Amazon provider does not support list of texts") request_body = json.dumps({"inputText": payload}) elif provider == PROVIDERS.COHERE: input_types = { @@ -374,8 +398,8 @@ def _get_request_body( } request_body = json.dumps( { - "texts": [payload], - "input_type": input_types[type], + "texts": [payload] if isinstance(payload, str) else payload, + "input_type": input_types[input_type], "truncate": "NONE", } ) diff --git a/llama-index-integrations/embeddings/llama-index-embeddings-bedrock/pyproject.toml b/llama-index-integrations/embeddings/llama-index-embeddings-bedrock/pyproject.toml index 3cf9cc1ffe24b..36cb104a8c710 100644 --- a/llama-index-integrations/embeddings/llama-index-embeddings-bedrock/pyproject.toml +++ b/llama-index-integrations/embeddings/llama-index-embeddings-bedrock/pyproject.toml @@ -27,7 +27,7 @@ exclude = ["**/BUILD"] license = "MIT" name = "llama-index-embeddings-bedrock" readme = "README.md" -version = "0.1.3" +version = "0.1.4" [tool.poetry.dependencies] python = ">=3.8.1,<4.0" diff --git a/llama-index-integrations/embeddings/llama-index-embeddings-bedrock/tests/test_bedrock.py b/llama-index-integrations/embeddings/llama-index-embeddings-bedrock/tests/test_bedrock.py index d14df0be8cd87..3876d0d5c9835 100644 --- a/llama-index-integrations/embeddings/llama-index-embeddings-bedrock/tests/test_bedrock.py +++ b/llama-index-integrations/embeddings/llama-index-embeddings-bedrock/tests/test_bedrock.py @@ -73,3 +73,37 @@ def test_get_text_embedding_cohere(self) -> None: self.bedrock_stubber.assert_no_pending_responses() self.assertEqual(embedding, mock_response["embeddings"][0]) + + def test_get_text_embedding_batch_cohere(self) -> None: + mock_response = { + "embeddings": [ + [0.017410278, 0.040924072, -0.007507324, 0.09429932, 0.015304565], + [0.017410278, 0.040924072, -0.007507324, 0.09429932, 0.015304565], + ] + } + 
mock_request = ["foo bar baz", "foo baz bar"] + + mock_stream = BytesIO(json.dumps(mock_response).encode()) + + self.bedrock_stubber.add_response( + "invoke_model", + { + "contentType": "application/json", + "body": StreamingBody(mock_stream, len(json.dumps(mock_response))), + }, + ) + + bedrock_embedding = BedrockEmbedding( + model=Models.COHERE_EMBED_ENGLISH_V3, + client=self.bedrock_client, + ) + + self.bedrock_stubber.activate() + embedding = bedrock_embedding.get_text_embedding_batch(texts=mock_request) + + self.bedrock_stubber.deactivate() + + self.assertEqual(len(embedding), 2) + + for i in range(2): + self.assertEqual(embedding[i], mock_response["embeddings"][i]) diff --git a/llama-index-integrations/embeddings/llama-index-embeddings-vertex/.gitignore b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/.gitignore new file mode 100644 index 0000000000000..990c18de22908 --- /dev/null +++ b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/.gitignore @@ -0,0 +1,153 @@ +llama_index/_static +.DS_Store +# Byte-compiled / optimized / DLL files +__pycache__/ +*.py[cod] +*$py.class + +# C extensions +*.so + +# Distribution / packaging +.Python +bin/ +build/ +develop-eggs/ +dist/ +downloads/ +eggs/ +.eggs/ +etc/ +include/ +lib/ +lib64/ +parts/ +sdist/ +share/ +var/ +wheels/ +pip-wheel-metadata/ +share/python-wheels/ +*.egg-info/ +.installed.cfg +*.egg +MANIFEST + +# PyInstaller +# Usually these files are written by a python script from a template +# before PyInstaller builds the exe, so as to inject date/other infos into it. 
+*.manifest +*.spec + +# Installer logs +pip-log.txt +pip-delete-this-directory.txt + +# Unit test / coverage reports +htmlcov/ +.tox/ +.nox/ +.coverage +.coverage.* +.cache +nosetests.xml +coverage.xml +*.cover +*.py,cover +.hypothesis/ +.pytest_cache/ +.ruff_cache + +# Translations +*.mo +*.pot + +# Django stuff: +*.log +local_settings.py +db.sqlite3 +db.sqlite3-journal + +# Flask stuff: +instance/ +.webassets-cache + +# Scrapy stuff: +.scrapy + +# Sphinx documentation +docs/_build/ + +# PyBuilder +target/ + +# Jupyter Notebook +.ipynb_checkpoints +notebooks/ + +# IPython +profile_default/ +ipython_config.py + +# pyenv +.python-version + +# pipenv +# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control. +# However, in case of collaboration, if having platform-specific dependencies or dependencies +# having no cross-platform support, pipenv may install dependencies that don't work, or not +# install all needed dependencies. +#Pipfile.lock + +# PEP 582; used by e.g. 
github.com/David-OConnor/pyflow +__pypackages__/ + +# Celery stuff +celerybeat-schedule +celerybeat.pid + +# SageMath parsed files +*.sage.py + +# Environments +.env +.venv +env/ +venv/ +ENV/ +env.bak/ +venv.bak/ +pyvenv.cfg + +# Spyder project settings +.spyderproject +.spyproject + +# Rope project settings +.ropeproject + +# mkdocs documentation +/site + +# mypy +.mypy_cache/ +.dmypy.json +dmypy.json + +# Pyre type checker +.pyre/ + +# Jetbrains +.idea +modules/ +*.swp + +# VsCode +.vscode + +# pipenv +Pipfile +Pipfile.lock + +# pyright +pyrightconfig.json diff --git a/llama-index-integrations/embeddings/llama-index-embeddings-vertex/BUILD b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/BUILD new file mode 100644 index 0000000000000..84f2657a9f879 --- /dev/null +++ b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/BUILD @@ -0,0 +1,3 @@ +poetry_requirements( + name="poetry", module_mapping={"google-cloud-aiplatform": ["vertexai"]} +) diff --git a/llama-index-integrations/embeddings/llama-index-embeddings-vertex/Makefile b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/Makefile new file mode 100644 index 0000000000000..b9eab05aa3706 --- /dev/null +++ b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/Makefile @@ -0,0 +1,17 @@ +GIT_ROOT ?= $(shell git rev-parse --show-toplevel) + +help: ## Show all Makefile targets. + @grep -E '^[a-zA-Z_-]+:.*?## .*$$' $(MAKEFILE_LIST) | awk 'BEGIN {FS = ":.*?## "}; {printf "\033[33m%-30s\033[0m %s\n", $$1, $$2}' + +format: ## Run code autoformatters (black). + pre-commit install + git ls-files | xargs pre-commit run black --files + +lint: ## Run linters: pre-commit (black, ruff, codespell) and mypy + pre-commit install && git ls-files | xargs pre-commit run --show-diff-on-failure --files + +test: ## Run tests via pytest. + pytest tests + +watch-docs: ## Build and watch documentation. 
+ sphinx-autobuild docs/ docs/_build/html --open-browser --watch $(GIT_ROOT)/llama_index/ diff --git a/llama-index-integrations/embeddings/llama-index-embeddings-vertex/README.md b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/README.md new file mode 100644 index 0000000000000..d625c2907cffb --- /dev/null +++ b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/README.md @@ -0,0 +1,14 @@ +# LlamaIndex Embeddings Integration: Vertex + +Implements the following Vertex AI embedding models: + +| Model | Release Date | +| ------------------------------------ | ----------------- | +| textembedding-gecko@003 | December 12, 2023 | +| textembedding-gecko@002 | November 2, 2023 | +| textembedding-gecko-multilingual@001 | November 2, 2023 | +| textembedding-gecko@001 | June 7, 2023 | +| multimodalembedding | | + +**Note**: Vertex AI does not currently support async calls for `multimodalembedding`. +`VertexTextEmbedding`, however, supports the async interface. diff --git a/llama-index-integrations/embeddings/llama-index-embeddings-vertex/examples/multimodal_embedding.ipynb b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/examples/multimodal_embedding.ipynb new file mode 100644 index 0000000000000..7be7dff32873a --- /dev/null +++ b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/examples/multimodal_embedding.ipynb @@ -0,0 +1,202 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "3af200b75c4bd924", + "metadata": {}, + "source": [ + "# Vertex AI Multimodal Embedding\n", + "Uses APPLICATION_DEFAULT_CREDENTIALS if no credentials are specified.
" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "7b43f20b2f09ff70", + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.embeddings.vertex import VertexMultiModalEmbedding\n", + "\n", + "embed_model = VertexMultiModalEmbedding(\n", + " project=\"speedy-atom-413006\", location=\"us-central1\"\n", + ")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a10d4efa47801541", + "metadata": {}, + "outputs": [], + "source": [ + "image_url = \"https://upload.wikimedia.org/wikipedia/commons/4/43/Cute_dog.jpg\"" + ] + }, + { + "cell_type": "markdown", + "id": "6e29951621ec9acc", + "metadata": {}, + "source": [ + "Download this image to `data/test-image.jpg`" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "45aca848dd1d17e3", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "from IPython.core.display import Image\n", + "\n", + "display(Image(url=image_url, width=500))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "2d3394b6ce654ec4", + "metadata": {}, + "outputs": [], + "source": [ + "result = embed_model.get_image_embedding(\"data/test-image.jpg\")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "75022fc91552014c", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "[-0.00822397694,\n", + " 0.0167199261,\n", + " 0.0195552949,\n", + " 0.00935372803,\n", + " 0.00746282,\n", + " 0.011754944,\n", + " -0.0363474153,\n", + " 0.00836938061,\n", + " -0.0170917399,\n", + " 0.0218462963]" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "result[:10]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "103e4c523d039fdd", + "metadata": {}, + "outputs": [], + "source": [ + "text_result = embed_model.get_text_embedding(\n", + 
" \"a brown and white puppy laying in the grass with purple daisies in the background\"\n", + ")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "c14b8971981d61e5", + "metadata": {}, + "outputs": [], + "source": [ + "text_result_2 = embed_model.get_text_embedding(\"airplanes in the sky\")" + ] + }, + { + "cell_type": "markdown", + "id": "588f1585ba25bc57", + "metadata": {}, + "source": [ + "We expect that a similar description to the image will yield a higher similarity result" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "23a129176e8d1007", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "0.20342717022759096" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "embed_model.similarity(result, text_result)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "be0c503c3dd57412", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "0.009063958097860215" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "embed_model.similarity(result, text_result_2)" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 2 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython2" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/llama-index-integrations/embeddings/llama-index-embeddings-vertex/examples/text_embedding.ipynb b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/examples/text_embedding.ipynb new file mode 100644 index 0000000000000..d992449a5258d --- /dev/null +++ b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/examples/text_embedding.ipynb @@ -0,0 +1,221 @@ +{ + 
"cells": [ + { + "cell_type": "markdown", + "id": "8085d744ceb233ff", + "metadata": {}, + "source": [ + "# Vertex AI Text Embedding\n", + "\n", + "Imports the VertexTextEmbedding class and initializes an instance named embed_model with a specified project and location. Uses APPLICATION_DEFAULT_CREDENTIALS if no credentials is specified. The default model is `textembedding-gecko@003` in document retrival mode." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "c52b0b97984c1ceb", + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.embeddings.vertex import VertexTextEmbedding\n", + "\n", + "embed_model = VertexTextEmbedding(project=\"speedy-atom-413006\", location=\"us-central1\")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "61d58ea0808d0941", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "{'model_name': 'textembedding-gecko@003',\n", + " 'embed_batch_size': 10,\n", + " 'embed_mode': ,\n", + " 'additional_kwargs': {},\n", + " 'class_name': 'VertexTextEmbedding'}" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "embed_model.dict()" + ] + }, + { + "cell_type": "markdown", + "id": "c98da813ca018111", + "metadata": {}, + "source": [ + "## Document and Query Retrival" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8f6e67d1951da538", + "metadata": {}, + "outputs": [], + "source": [ + "embed_text_result = embed_model.get_text_embedding(\"Hello World!\")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f61a801502c3de8f", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "[0.05736415088176727,\n", + " 0.0049842665903270245,\n", + " -0.07065856456756592,\n", + " -0.021812528371810913,\n", + " 0.060468606650829315]" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "embed_text_result[:5]" + ] + }, 
+ { + "cell_type": "code", + "execution_count": null, + "id": "416ed8894817e213", + "metadata": {}, + "outputs": [], + "source": [ + "embed_query_result = embed_model.get_query_embedding(\"Hello World!\")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "62510b52e204a271", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "[0.05158292129635811,\n", + " -0.033334773033857346,\n", + " -0.03221268951892853,\n", + " -0.029282240197062492,\n", + " 0.020004423335194588]" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "embed_query_result[:5]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "d10c0164acddc5d7", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "0.7375430761259468" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "from llama_index.core.base.embeddings.base import SimilarityMode\n", + "\n", + "embed_model.similarity(\n", + " embed_text_result, embed_query_result, SimilarityMode.DOT_PRODUCT\n", + ")" + ] + }, + { + "cell_type": "markdown", + "id": "68292f47908eabad", + "metadata": {}, + "source": [ + "## Using the async interface" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "10aa2c79d07d6f77", + "metadata": {}, + "outputs": [], + "source": [ + "import nest_asyncio\n", + "\n", + "nest_asyncio.apply()\n", + "\n", + "result = await embed_model.aget_text_embedding(\"Hello World!\")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "596498385119ecab", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "[0.05733369290828705,\n", + " 0.005178301595151424,\n", + " -0.07033716142177582,\n", + " -0.021963153034448624,\n", + " 0.06050697714090347]" + ] + }, + "execution_count": null, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "result[:5]" + ] + } + ], + 
"metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 2 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython2" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/llama-index-integrations/embeddings/llama-index-embeddings-vertex/llama_index/embeddings/vertex/BUILD b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/llama_index/embeddings/vertex/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/llama_index/embeddings/vertex/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-index-integrations/embeddings/llama-index-embeddings-vertex/llama_index/embeddings/vertex/__init__.py b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/llama_index/embeddings/vertex/__init__.py new file mode 100644 index 0000000000000..2889c5b5e5d5a --- /dev/null +++ b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/llama_index/embeddings/vertex/__init__.py @@ -0,0 +1,7 @@ +from llama_index.embeddings.vertex.base import ( + VertexTextEmbedding, + VertexMultiModalEmbedding, + VertexEmbeddingMode, +) + +__all__ = ["VertexTextEmbedding", "VertexMultiModalEmbedding", "VertexEmbeddingMode"] diff --git a/llama-index-integrations/embeddings/llama-index-embeddings-vertex/llama_index/embeddings/vertex/base.py b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/llama_index/embeddings/vertex/base.py new file mode 100644 index 0000000000000..1095758019a3b --- /dev/null +++ b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/llama_index/embeddings/vertex/base.py @@ -0,0 +1,228 @@ +from enum import Enum +from typing import Optional, List, Any, Dict, Union + +import vertexai +from 
llama_index.core.base.embeddings.base import Embedding, BaseEmbedding +from llama_index.core.bridge.pydantic import PrivateAttr, Field +from llama_index.core.callbacks import CallbackManager +from llama_index.core.embeddings import MultiModalEmbedding +from llama_index.core.schema import ImageType +from llama_index.core.base.embeddings.base import DEFAULT_EMBED_BATCH_SIZE +from vertexai.language_models import TextEmbeddingModel, TextEmbeddingInput +from vertexai.vision_models import MultiModalEmbeddingModel, Image + +from google.auth import credentials as auth_credentials + + +class VertexEmbeddingMode(str, Enum): + """VertexAI embedding mode. + + Attributes: + DEFAULT_MODE (str): The default embedding mode, for older models before August 2023, + that does not support task_type + CLASSIFICATION_MODE (str): Optimizes embeddings for classification tasks. + CLUSTERING_MODE (str): Optimizes embeddings for clustering tasks. + SEMANTIC_SIMILARITY_MODE (str): Optimizes embeddings for tasks that require assessments of semantic similarity. + RETRIEVAL_MODE (str): Optimizes embeddings for retrieval tasks, including search and document retrieval. 
+ """ + + DEFAULT_MODE = "default" + CLASSIFICATION_MODE = "classification" + CLUSTERING_MODE = "clustering" + SEMANTIC_SIMILARITY_MODE = "similarity" + RETRIEVAL_MODE = "retrieval" + + +_TEXT_EMBED_TASK_TYPE_MAPPING: Dict[VertexEmbeddingMode, str] = { + VertexEmbeddingMode.CLASSIFICATION_MODE: "CLASSIFICATION", + VertexEmbeddingMode.CLUSTERING_MODE: "CLUSTERING", + VertexEmbeddingMode.SEMANTIC_SIMILARITY_MODE: "SEMANTIC_SIMILARITY", + VertexEmbeddingMode.RETRIEVAL_MODE: "RETRIEVAL_DOCUMENT", +} + +_QUERY_EMBED_TASK_TYPE_MAPPING: Dict[VertexEmbeddingMode, str] = { + VertexEmbeddingMode.CLASSIFICATION_MODE: "CLASSIFICATION", + VertexEmbeddingMode.CLUSTERING_MODE: "CLUSTERING", + VertexEmbeddingMode.SEMANTIC_SIMILARITY_MODE: "SEMANTIC_SIMILARITY", + VertexEmbeddingMode.RETRIEVAL_MODE: "RETRIEVAL_QUERY", +} + + +def init_vertexai( + project: Optional[str] = None, + location: Optional[str] = None, + credentials: Optional[auth_credentials.Credentials] = None, +) -> None: + """Init vertexai. + + Args: + project: The default GCP project to use when making Vertex API calls. + location: The default location to use when making API calls. + credentials: The default custom + credentials to use when making API calls. If not provided credentials + will be ascertained from the environment. 
+ """ + vertexai.init( + project=project, + location=location, + credentials=credentials, + ) + + +def _get_embedding_request( + texts: List[str], embed_mode: VertexEmbeddingMode, is_query: bool +) -> List[Union[str, TextEmbeddingInput]]: + if embed_mode != VertexEmbeddingMode.DEFAULT_MODE: + mapping = ( + _QUERY_EMBED_TASK_TYPE_MAPPING + if is_query + else _TEXT_EMBED_TASK_TYPE_MAPPING + ) + texts = [ + TextEmbeddingInput(text=text, task_type=mapping[embed_mode]) + for text in texts + ] + return texts + + +class VertexTextEmbedding(BaseEmbedding): + embed_mode: VertexEmbeddingMode = Field(description="The embedding mode to use.") + additional_kwargs: Dict[str, Any] = Field( + default_factory=dict, description="Additional kwargs for the Vertex." + ) + + _model: TextEmbeddingModel = PrivateAttr() + + def __init__( + self, + model_name: str = "textembedding-gecko@003", + project: Optional[str] = None, + location: Optional[str] = None, + credentials: Optional[auth_credentials.Credentials] = None, + embed_mode: VertexEmbeddingMode = VertexEmbeddingMode.RETRIEVAL_MODE, + embed_batch_size: int = DEFAULT_EMBED_BATCH_SIZE, + callback_manager: Optional[CallbackManager] = None, + additional_kwargs: Optional[Dict[str, Any]] = None, + ) -> None: + init_vertexai(project=project, location=location, credentials=credentials) + callback_manager = callback_manager or CallbackManager([]) + additional_kwargs = additional_kwargs or {} + + super().__init__( + embed_mode=embed_mode, + additional_kwargs=additional_kwargs, + model_name=model_name, + embed_batch_size=embed_batch_size, + callback_manager=callback_manager, + ) + self._model = TextEmbeddingModel.from_pretrained(model_name) + + @classmethod + def class_name(cls) -> str: + return "VertexTextEmbedding" + + def _get_text_embeddings(self, texts: List[str]) -> List[Embedding]: + texts = _get_embedding_request( + texts=texts, embed_mode=self.embed_mode, is_query=False + ) + embeddings = self._model.get_embeddings(texts, 
**self.additional_kwargs) + return [embedding.values for embedding in embeddings] + + def _get_text_embedding(self, text: str) -> Embedding: + return self._get_text_embeddings([text])[0] + + async def _aget_text_embedding(self, text: str) -> Embedding: + return (await self._aget_text_embeddings([text]))[0] + + async def _aget_text_embeddings(self, texts: List[str]) -> List[Embedding]: + texts = _get_embedding_request( + texts=texts, embed_mode=self.embed_mode, is_query=False + ) + embeddings = await self._model.get_embeddings_async( + texts, **self.additional_kwargs + ) + return [embedding.values for embedding in embeddings] + + def _get_query_embedding(self, query: str) -> Embedding: + texts = _get_embedding_request( + texts=[query], embed_mode=self.embed_mode, is_query=True + ) + embeddings = self._model.get_embeddings(texts, **self.additional_kwargs) + return embeddings[0].values + + async def _aget_query_embedding(self, query: str) -> Embedding: + texts = _get_embedding_request( + texts=[query], embed_mode=self.embed_mode, is_query=True + ) + embeddings = await self._model.get_embeddings_async( + texts, **self.additional_kwargs + ) + return embeddings[0].values + + +class VertexMultiModalEmbedding(MultiModalEmbedding): + embed_dimension: int = Field(description="The vertex output embedding dimension.") + additional_kwargs: Dict[str, Any] = Field( + default_factory=dict, description="Additional kwargs for the Vertex." 
+ ) + + _model: MultiModalEmbeddingModel = PrivateAttr() + _embed_dimension: int = PrivateAttr() + + def __init__( + self, + model_name: str = "multimodalembedding", + project: Optional[str] = None, + location: Optional[str] = None, + credentials: Optional[Any] = None, + embed_dimension: int = 1408, + embed_batch_size: int = DEFAULT_EMBED_BATCH_SIZE, + callback_manager: Optional[CallbackManager] = None, + additional_kwargs: Optional[Dict[str, Any]] = None, + ) -> None: + init_vertexai(project=project, location=location, credentials=credentials) + callback_manager = callback_manager or CallbackManager([]) + additional_kwargs = additional_kwargs or {} + + super().__init__( + embed_dimension=embed_dimension, + additional_kwargs=additional_kwargs, + model_name=model_name, + embed_batch_size=embed_batch_size, + callback_manager=callback_manager, + ) + self._model = MultiModalEmbeddingModel.from_pretrained(model_name) + + @classmethod + def class_name(cls) -> str: + return "VertexMultiModalEmbedding" + + def _get_text_embedding(self, text: str) -> Embedding: + return self._model.get_embeddings( + contextual_text=text, + dimension=self.embed_dimension, + **self.additional_kwargs + ).text_embedding + + def _get_image_embedding(self, img_file_path: ImageType) -> Embedding: + if isinstance(img_file_path, str): + image = Image.load_from_file(img_file_path) + else: + image = Image(image_bytes=img_file_path.getvalue()) + embeddings = self._model.get_embeddings( + image=image, dimension=self.embed_dimension, **self.additional_kwargs + ) + return embeddings.image_embedding + + def _get_query_embedding(self, query: str) -> Embedding: + return self._get_text_embedding(query) + + # Vertex AI SDK does not support async variants yet + async def _aget_text_embedding(self, text: str) -> Embedding: + return self._get_text_embedding(text) + + async def _aget_image_embedding(self, img_file_path: ImageType) -> Embedding: + return self._get_image_embedding(img_file_path) + + async def 
_aget_query_embedding(self, query: str) -> Embedding: + return self._get_query_embedding(query) diff --git a/llama-index-integrations/embeddings/llama-index-embeddings-vertex/pyproject.toml b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/pyproject.toml new file mode 100644 index 0000000000000..786c029857e87 --- /dev/null +++ b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/pyproject.toml @@ -0,0 +1,58 @@ +[build-system] +build-backend = "poetry.core.masonry.api" +requires = ["poetry-core"] + +[tool.codespell] +check-filenames = true +check-hidden = true +# Feel free to un-skip examples, and experimental, you will just need to +# work through many typos (--write-changes and --interactive will help) +skip = "*.csv,*.html,*.json,*.jsonl,*.pdf,*.txt,*.ipynb" + +[tool.llamahub] +contains_example = true +import_path = "llama_index.embeddings.vertex" + +[tool.llamahub.class_authors] +VertexMultiModalEmbedding = "mustartt" +VertexTextEmbedding = "mustartt" + +[tool.mypy] +disallow_untyped_defs = true +# Remove venv skip when integrated with pre-commit +exclude = ["_static", "build", "examples", "notebooks", "venv"] +ignore_missing_imports = true +python_version = "3.8" + +[tool.poetry] +authors = ["Henry Jiang "] +description = "llama-index embeddings vertex integration" +license = "MIT" +name = "llama-index-embeddings-vertex" +packages = [{include = "llama_index/"}] +readme = "README.md" +version = "0.1.0" + +[tool.poetry.dependencies] +python = ">=3.9,<4.0" +llama-index-core = "^0.10.0" +google-cloud-aiplatform = ">=1.43.0" + +[tool.poetry.group.dev.dependencies] +black = {extras = ["jupyter"], version = "<=23.9.1,>=23.7.0"} +codespell = {extras = ["toml"], version = ">=v2.2.6"} +ipython = "8.10.0" +jupyter = "^1.0.0" +mypy = "0.991" +pre-commit = "3.2.0" +pylint = "2.15.10" +pytest = "7.2.1" +pytest-mock = "3.11.1" +ruff = "0.0.292" +tree-sitter-languages = "^1.8.0" +types-Deprecated = ">=0.1.0" +types-PyYAML = "^6.0.12.12" 
+types-protobuf = "^4.24.0.4" +types-redis = "4.5.5.0" +types-requests = "2.28.11.8" # TODO: unpin when mypy>0.991 +types-setuptools = "67.1.0.0" diff --git a/llama-index-integrations/embeddings/llama-index-embeddings-vertex/tests/BUILD b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/tests/BUILD new file mode 100644 index 0000000000000..619cac15ff840 --- /dev/null +++ b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/tests/BUILD @@ -0,0 +1,3 @@ +python_tests( + interpreter_constraints=["==3.9.*", "==3.10.*"], +) diff --git a/llama-index-integrations/embeddings/llama-index-embeddings-vertex/tests/__init__.py b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/tests/__init__.py new file mode 100644 index 0000000000000..e69de29bb2d1d diff --git a/llama-index-integrations/embeddings/llama-index-embeddings-vertex/tests/test_embeddings_vertex.py b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/tests/test_embeddings_vertex.py new file mode 100644 index 0000000000000..2117305a9ff0e --- /dev/null +++ b/llama-index-integrations/embeddings/llama-index-embeddings-vertex/tests/test_embeddings_vertex.py @@ -0,0 +1,254 @@ +import io +import unittest +from unittest.mock import patch, Mock, MagicMock, AsyncMock + +from llama_index.core.base.embeddings.base import BaseEmbedding +from llama_index.core.embeddings import MultiModalEmbedding +from vertexai.language_models import TextEmbedding +from vertexai.vision_models import MultiModalEmbeddingResponse + +from PIL import Image as PillowImage + +from llama_index.embeddings.vertex import ( + VertexTextEmbedding, + VertexMultiModalEmbedding, + VertexEmbeddingMode, +) + + +class VertexTextEmbeddingTest(unittest.TestCase): + @patch("vertexai.init") + @patch("vertexai.language_models.TextEmbeddingModel.from_pretrained") + def test_init(self, model_mock: Mock, mock_init: Mock): + mock_cred = Mock(return_value="mock_credentials_instance") + embedding = 
VertexTextEmbedding( + model_name="textembedding-gecko@001", + project="test-project", + location="us-test-location", + credentials=mock_cred, + embed_mode=VertexEmbeddingMode.RETRIEVAL_MODE, + embed_batch_size=100, + ) + + mock_init.assert_called_once_with( + project="test-project", + location="us-test-location", + credentials=mock_cred, + ) + + self.assertIsInstance(embedding, BaseEmbedding) + + self.assertEqual(embedding.model_name, "textembedding-gecko@001") + self.assertEqual(embedding.embed_mode, VertexEmbeddingMode.RETRIEVAL_MODE) + self.assertEqual(embedding.embed_batch_size, 100) + + @patch("vertexai.init") + @patch("vertexai.language_models.TextEmbeddingModel.from_pretrained") + def test_get_embedding_retrieval(self, model_mock: Mock, init_mock: Mock): + model = MagicMock() + model_mock.return_value = model + + embedding = VertexTextEmbedding( + project="test-project", + location="us-test-location", + embed_mode=VertexEmbeddingMode.RETRIEVAL_MODE, + additional_kwargs={"auto_truncate": True}, + ) + + model.get_embeddings.return_value = [TextEmbedding(values=[0.1, 0.2, 0.3])] + result = embedding.get_text_embedding("some text") + + model.get_embeddings.assert_called_once() + positional_args, keyword_args = model.get_embeddings.call_args + model.get_embeddings.reset_mock() + + self.assertEqual(len(positional_args[0]), 1) + self.assertEqual(positional_args[0][0].text, "some text") + self.assertEqual(positional_args[0][0].task_type, "RETRIEVAL_DOCUMENT") + self.assertEqual(result, [0.1, 0.2, 0.3]) + self.assertTrue(keyword_args["auto_truncate"]) + + model.get_embeddings.return_value = [TextEmbedding(values=[0.1, 0.2, 0.3])] + result = embedding.get_query_embedding("some query text") + + model.get_embeddings.assert_called_once() + positional_args, keyword_args = model.get_embeddings.call_args + + self.assertEqual(len(positional_args[0]), 1) + self.assertEqual(positional_args[0][0].text, "some query text") + self.assertEqual(positional_args[0][0].task_type, 
"RETRIEVAL_QUERY") + self.assertEqual(result, [0.1, 0.2, 0.3]) + self.assertTrue(keyword_args["auto_truncate"]) + + +class VertexTextEmbeddingTestAsync(unittest.IsolatedAsyncioTestCase): + @patch("vertexai.init") + @patch("vertexai.language_models.TextEmbeddingModel.from_pretrained") + async def test_get_embedding_retrieval( + self, model_mock: AsyncMock, init_mock: AsyncMock + ): + model = MagicMock() + model.get_embeddings_async = ( + AsyncMock() + ) # Ensure get_embeddings is an AsyncMock for async calls + model_mock.return_value = model + + embedding = VertexTextEmbedding( + project="test-project", + location="us-test-location", + embed_mode=VertexEmbeddingMode.RETRIEVAL_MODE, + additional_kwargs={"auto_truncate": True}, + ) + + model.get_embeddings_async.return_value = [ + TextEmbedding(values=[0.1, 0.2, 0.3]) + ] + result = await embedding.aget_text_embedding("some text") + + model.get_embeddings_async.assert_called_once() + positional_args, keyword_args = model.get_embeddings_async.call_args + model.get_embeddings_async.reset_mock() + + self.assertEqual(len(positional_args[0]), 1) + self.assertEqual(positional_args[0][0].text, "some text") + self.assertEqual(positional_args[0][0].task_type, "RETRIEVAL_DOCUMENT") + self.assertEqual(result, [0.1, 0.2, 0.3]) + self.assertTrue(keyword_args["auto_truncate"]) + + model.get_embeddings_async.return_value = [ + TextEmbedding(values=[0.1, 0.2, 0.3]) + ] + result = await embedding.aget_query_embedding("some query text") + + model.get_embeddings_async.assert_called_once() + positional_args, keyword_args = model.get_embeddings_async.call_args + + self.assertEqual(len(positional_args[0]), 1) + self.assertEqual(positional_args[0][0].text, "some query text") + self.assertEqual(positional_args[0][0].task_type, "RETRIEVAL_QUERY") + self.assertEqual(result, [0.1, 0.2, 0.3]) + self.assertTrue(keyword_args["auto_truncate"]) + + +class VertexMultiModalEmbeddingTest(unittest.TestCase): + @patch("vertexai.init") + 
@patch("vertexai.vision_models.MultiModalEmbeddingModel.from_pretrained") + def test_init(self, model_mock: Mock, mock_init: Mock): + mock_cred = Mock(return_value="mock_credentials_instance") + embedding = VertexMultiModalEmbedding( + model_name="multimodalembedding", + project="test-project", + location="us-test-location", + credentials=mock_cred, + embed_dimension=1408, + embed_batch_size=100, + ) + + mock_init.assert_called_once_with( + project="test-project", + location="us-test-location", + credentials=mock_cred, + ) + + self.assertIsInstance(embedding, MultiModalEmbedding) + + self.assertEqual(embedding.model_name, "multimodalembedding") + self.assertEqual(embedding.embed_batch_size, 100) + self.assertEqual(embedding.embed_dimension, 1408) + + @patch("vertexai.init") + @patch("vertexai.vision_models.MultiModalEmbeddingModel.from_pretrained") + def test_text_embedding(self, model_mock: Mock, init_mock: Mock): + model = MagicMock() + model_mock.return_value = model + + embedding = VertexMultiModalEmbedding( + project="test-project", + location="us-test-location", + embed_dimension=1408, + additional_kwargs={"additional_kwarg": True}, + ) + + model.get_embeddings.return_value = MultiModalEmbeddingResponse( + _prediction_response=None, text_embedding=[0.1, 0.2, 0.3] + ) + + result = embedding.get_text_embedding("some text") + self.assertEqual(result, [0.1, 0.2, 0.3]) + + model.get_embeddings.assert_called_once() + positional_args, keyword_args = model.get_embeddings.call_args + + self.assertEqual(keyword_args["contextual_text"], "some text") + self.assertEqual(keyword_args["dimension"], 1408) + self.assertTrue(keyword_args["additional_kwarg"]) + + @patch("vertexai.init") + @patch("vertexai.vision_models.Image.load_from_file") + @patch("vertexai.vision_models.MultiModalEmbeddingModel.from_pretrained") + def test_image_embedding_path( + self, model_mock: Mock, load_file_mock: Mock, init_mock: Mock + ): + model = MagicMock() + model_mock.return_value = model + + 
embedding = VertexMultiModalEmbedding( + project="test-project", + location="us-test-location", + embed_dimension=1408, + additional_kwargs={"additional_kwarg": True}, + ) + + model.get_embeddings.return_value = MultiModalEmbeddingResponse( + _prediction_response=None, image_embedding=[0.1, 0.2, 0.3] + ) + + result = embedding.get_image_embedding("data/test-image.jpg") + self.assertEqual(result, [0.1, 0.2, 0.3]) + + model.get_embeddings.assert_called_once() + positional_args, keyword_args = model.get_embeddings.call_args + + load_file_mock.assert_called_once_with("data/test-image.jpg") + self.assertTrue("image" in keyword_args) + self.assertEqual(keyword_args["dimension"], 1408) + self.assertTrue(keyword_args["additional_kwarg"]) + + @patch("vertexai.init") + @patch("vertexai.vision_models.Image.load_from_file") + @patch("vertexai.vision_models.MultiModalEmbeddingModel.from_pretrained") + def test_image_embedding_bytes( + self, model_mock: Mock, load_file_mock: Mock, init_mock: Mock + ): + model = MagicMock() + model_mock.return_value = model + + embedding = VertexMultiModalEmbedding( + project="test-project", + location="us-test-location", + embed_dimension=1408, + additional_kwargs={"additional_kwarg": True}, + ) + + model.get_embeddings.return_value = MultiModalEmbeddingResponse( + _prediction_response=None, image_embedding=[0.1, 0.2, 0.3] + ) + + image = PillowImage.new("RGB", (128, 128)) + bytes_io = io.BytesIO() + image.save(bytes_io, "jpeg") + bytes_io.seek(0) + + result = embedding.get_image_embedding(bytes_io) + self.assertEqual(result, [0.1, 0.2, 0.3]) + + model.get_embeddings.assert_called_once() + positional_args, keyword_args = model.get_embeddings.call_args + + load_file_mock.assert_not_called() + self.assertEqual(keyword_args["dimension"], 1408) + self.assertTrue(keyword_args["additional_kwarg"]) + + +if __name__ == "__main__": + unittest.main() diff --git a/llama-index-integrations/llms/llama-index-llms-anthropic/llama_index/llms/anthropic/base.py 
b/llama-index-integrations/llms/llama-index-llms-anthropic/llama_index/llms/anthropic/base.py index 7fc634cfa05a0..853ba3831faa2 100644 --- a/llama-index-integrations/llms/llama-index-llms-anthropic/llama_index/llms/anthropic/base.py +++ b/llama-index-integrations/llms/llama-index-llms-anthropic/llama_index/llms/anthropic/base.py @@ -1,5 +1,5 @@ from typing import Any, Callable, Dict, Optional, Sequence - +from anthropic.types import ContentBlockDeltaEvent from llama_index.core.base.llms.types import ( ChatMessage, ChatResponse, @@ -28,12 +28,13 @@ from llama_index.core.types import BaseOutputParser, PydanticProgramMode from llama_index.llms.anthropic.utils import ( anthropic_modelname_to_contextsize, - messages_to_anthropic_prompt, + messages_to_anthropic_messages, ) +from llama_index.core.utils import Tokenizer import anthropic -DEFAULT_ANTHROPIC_MODEL = "claude-2" +DEFAULT_ANTHROPIC_MODEL = "claude-2.1" DEFAULT_ANTHROPIC_MAX_TOKENS = 512 @@ -123,12 +124,16 @@ def metadata(self) -> LLMMetadata: model_name=self.model, ) + @property + def tokenizer(self) -> Tokenizer: + return self._client.get_tokenizer() + @property def _model_kwargs(self) -> Dict[str, Any]: base_kwargs = { "model": self.model, "temperature": self.temperature, - "max_tokens_to_sample": self.max_tokens, + "max_tokens": self.max_tokens, } return { **base_kwargs, @@ -143,15 +148,18 @@ def _get_all_kwargs(self, **kwargs: Any) -> Dict[str, Any]: @llm_chat_callback() def chat(self, messages: Sequence[ChatMessage], **kwargs: Any) -> ChatResponse: - prompt = messages_to_anthropic_prompt(messages) + anthropic_messages, system_prompt = messages_to_anthropic_messages(messages) all_kwargs = self._get_all_kwargs(**kwargs) - response = self._client.completions.create( - prompt=prompt, stream=False, **all_kwargs + response = self._client.messages.create( + messages=anthropic_messages, + stream=False, + system=system_prompt, + **all_kwargs, ) return ChatResponse( message=ChatMessage( - role=MessageRole.ASSISTANT, 
content=response.completion + role=MessageRole.ASSISTANT, content=response.content[0].text ), raw=dict(response), ) @@ -167,24 +175,25 @@ def complete( def stream_chat( self, messages: Sequence[ChatMessage], **kwargs: Any ) -> ChatResponseGen: - prompt = messages_to_anthropic_prompt(messages) + anthropic_messages, system_prompt = messages_to_anthropic_messages(messages) all_kwargs = self._get_all_kwargs(**kwargs) - response = self._client.completions.create( - prompt=prompt, stream=True, **all_kwargs + response = self._client.messages.create( + messages=anthropic_messages, system=system_prompt, stream=True, **all_kwargs ) def gen() -> ChatResponseGen: content = "" role = MessageRole.ASSISTANT for r in response: - content_delta = r.completion - content += content_delta - yield ChatResponse( - message=ChatMessage(role=role, content=content), - delta=content_delta, - raw=r, - ) + if isinstance(r, ContentBlockDeltaEvent): + content_delta = r.delta.text + content += content_delta + yield ChatResponse( + message=ChatMessage(role=role, content=content), + delta=content_delta, + raw=r, + ) return gen() @@ -199,15 +208,18 @@ def stream_complete( async def achat( self, messages: Sequence[ChatMessage], **kwargs: Any ) -> ChatResponse: - prompt = messages_to_anthropic_prompt(messages) + anthropic_messages, system_prompt = messages_to_anthropic_messages(messages) all_kwargs = self._get_all_kwargs(**kwargs) - response = await self._aclient.completions.create( - prompt=prompt, stream=False, **all_kwargs + response = await self._aclient.messages.create( + messages=anthropic_messages, + system=system_prompt, + stream=False, + **all_kwargs, ) return ChatResponse( message=ChatMessage( - role=MessageRole.ASSISTANT, content=response.completion + role=MessageRole.ASSISTANT, content=response.content[0].text ), raw=dict(response), ) @@ -223,24 +235,25 @@ async def acomplete( async def astream_chat( self, messages: Sequence[ChatMessage], **kwargs: Any ) -> ChatResponseAsyncGen: - prompt = 
messages_to_anthropic_prompt(messages) + anthropic_messages, system_prompt = messages_to_anthropic_messages(messages) all_kwargs = self._get_all_kwargs(**kwargs) - response = await self._aclient.completions.create( - prompt=prompt, stream=True, **all_kwargs + response = await self._aclient.messages.create( + messages=anthropic_messages, system=system_prompt, stream=True, **all_kwargs ) async def gen() -> ChatResponseAsyncGen: content = "" role = MessageRole.ASSISTANT async for r in response: - content_delta = r.completion - content += content_delta - yield ChatResponse( - message=ChatMessage(role=role, content=content), - delta=content_delta, - raw=r, - ) + if isinstance(r, ContentBlockDeltaEvent): + content_delta = r.delta.text + content += content_delta + yield ChatResponse( + message=ChatMessage(role=role, content=content), + delta=content_delta, + raw=r, + ) return gen() diff --git a/llama-index-integrations/llms/llama-index-llms-anthropic/llama_index/llms/anthropic/utils.py b/llama-index-integrations/llms/llama-index-llms-anthropic/llama_index/llms/anthropic/utils.py index 3cfbd0177d0df..19c1ae5dc7b5d 100644 --- a/llama-index-integrations/llms/llama-index-llms-anthropic/llama_index/llms/anthropic/utils.py +++ b/llama-index-integrations/llms/llama-index-llms-anthropic/llama_index/llms/anthropic/utils.py @@ -1,17 +1,18 @@ -from typing import Dict, Sequence +from typing import Dict, Sequence, Tuple from llama_index.core.base.llms.types import ChatMessage, MessageRole HUMAN_PREFIX = "\n\nHuman:" ASSISTANT_PREFIX = "\n\nAssistant:" - CLAUDE_MODELS: Dict[str, int] = { "claude-instant-1": 100000, "claude-instant-1.2": 100000, "claude-2": 100000, "claude-2.0": 100000, "claude-2.1": 200000, + "claude-3-opus-20240229": 180000, + "claude-3-sonnet-20240229": 180000, } @@ -25,6 +26,21 @@ def anthropic_modelname_to_contextsize(modelname: str) -> int: return CLAUDE_MODELS[modelname] +def messages_to_anthropic_messages( + messages: Sequence[ChatMessage], +) -> 
Tuple[Sequence[ChatMessage], str]: + anthropic_messages = [] + system_prompt = "" + for message in messages: + if message.role == MessageRole.SYSTEM: + system_prompt = message.content + else: + message = {"role": message.role.value, "content": message.content} + anthropic_messages.append(message) + return anthropic_messages, system_prompt + + +# Function used in bedrock def _message_to_anthropic_prompt(message: ChatMessage) -> str: if message.role == MessageRole.USER: prompt = f"{HUMAN_PREFIX} {message.content}" diff --git a/llama-index-integrations/llms/llama-index-llms-anthropic/pyproject.toml b/llama-index-integrations/llms/llama-index-llms-anthropic/pyproject.toml index 5e9ce75b791bd..543b8789f719d 100644 --- a/llama-index-integrations/llms/llama-index-llms-anthropic/pyproject.toml +++ b/llama-index-integrations/llms/llama-index-llms-anthropic/pyproject.toml @@ -27,12 +27,12 @@ exclude = ["**/BUILD"] license = "MIT" name = "llama-index-llms-anthropic" readme = "README.md" -version = "0.1.3" +version = "0.1.5" [tool.poetry.dependencies] python = ">=3.8.1,<4.0" llama-index-core = "^0.10.1" -anthropic = "^0.11.0" +anthropic = "^0.17.0" [tool.poetry.group.dev.dependencies] ipython = "8.10.0" diff --git a/llama-index-integrations/llms/llama-index-llms-gemini/llama_index/llms/gemini/base.py b/llama-index-integrations/llms/llama-index-llms-gemini/llama_index/llms/gemini/base.py index a5e6b3b247d59..5bfaa888fa215 100644 --- a/llama-index-integrations/llms/llama-index-llms-gemini/llama_index/llms/gemini/base.py +++ b/llama-index-integrations/llms/llama-index-llms-gemini/llama_index/llms/gemini/base.py @@ -1,4 +1,5 @@ """Google's hosted Gemini API.""" + import os import typing from typing import Any, Dict, Optional, Sequence @@ -14,17 +15,16 @@ from llama_index.core.bridge.pydantic import Field, PrivateAttr from llama_index.core.callbacks import CallbackManager from llama_index.core.constants import DEFAULT_NUM_OUTPUTS, DEFAULT_TEMPERATURE -from 
llama_index.core.llms.callbacks import ( - llm_chat_callback, - llm_completion_callback, -) +from llama_index.core.llms.callbacks import llm_chat_callback, llm_completion_callback from llama_index.core.llms.custom import CustomLLM -from llama_index.llms.gemini.utils import ( +from llama_index.core.utilities.gemini_utils import ( ROLES_FROM_GEMINI, + merge_neighboring_same_role_messages, +) +from llama_index.llms.gemini.utils import ( chat_from_gemini_response, chat_message_to_gemini, completion_from_gemini_response, - merge_neighboring_same_role_messages, ) if typing.TYPE_CHECKING: diff --git a/llama-index-integrations/llms/llama-index-llms-gemini/llama_index/llms/gemini/utils.py b/llama-index-integrations/llms/llama-index-llms-gemini/llama_index/llms/gemini/utils.py index 8bc01a53c076b..d7c5ae0ca9026 100644 --- a/llama-index-integrations/llms/llama-index-llms-gemini/llama_index/llms/gemini/utils.py +++ b/llama-index-integrations/llms/llama-index-llms-gemini/llama_index/llms/gemini/utils.py @@ -1,22 +1,15 @@ -from typing import Sequence, Union +from typing import Union import google.ai.generativelanguage as glm import google.generativeai as genai import PIL -from llama_index.core.base.llms.types import MessageRole + from llama_index.core.base.llms.types import ( ChatMessage, ChatResponse, CompletionResponse, ) - -ROLES_TO_GEMINI = { - MessageRole.USER: "user", - MessageRole.ASSISTANT: "model", - ## Gemini only has user and model roles. Put the rest in user role. 
- MessageRole.SYSTEM: "user", -} -ROLES_FROM_GEMINI = {v: k for k, v in ROLES_TO_GEMINI.items()} +from llama_index.core.utilities.gemini_utils import ROLES_FROM_GEMINI, ROLES_TO_GEMINI def _error_if_finished_early(candidate: "glm.Candidate") -> None: # type: ignore[name-defined] # only until release @@ -79,37 +72,3 @@ def chat_message_to_gemini(message: ChatMessage) -> "genai.types.ContentDict": "role": ROLES_TO_GEMINI[message.role], "parts": parts, } - - -def merge_neighboring_same_role_messages( - messages: Sequence[ChatMessage], -) -> Sequence[ChatMessage]: - # Gemini does not support multiple messages of the same role in a row, so we merge them - merged_messages = [] - i = 0 - - while i < len(messages): - current_message = messages[i] - # Initialize merged content with current message content - merged_content = [current_message.content] - - # Check if the next message exists and has the same role - while ( - i + 1 < len(messages) - and ROLES_TO_GEMINI[messages[i + 1].role] - == ROLES_TO_GEMINI[current_message.role] - ): - i += 1 - next_message = messages[i] - merged_content.extend([next_message.content]) - - # Create a new ChatMessage or similar object with merged content - merged_message = ChatMessage( - role=current_message.role, - content="\n".join([str(msg_content) for msg_content in merged_content]), - additional_kwargs=current_message.additional_kwargs, - ) - merged_messages.append(merged_message) - i += 1 - - return merged_messages diff --git a/llama-index-integrations/llms/llama-index-llms-gemini/pyproject.toml b/llama-index-integrations/llms/llama-index-llms-gemini/pyproject.toml index 7e365aa08d381..9d03b89c826c4 100644 --- a/llama-index-integrations/llms/llama-index-llms-gemini/pyproject.toml +++ b/llama-index-integrations/llms/llama-index-llms-gemini/pyproject.toml @@ -27,7 +27,7 @@ exclude = ["**/BUILD"] license = "MIT" name = "llama-index-llms-gemini" readme = "README.md" -version = "0.1.4" +version = "0.1.5" [tool.poetry.dependencies] python = 
">=3.9,<4.0" diff --git a/llama-index-integrations/llms/llama-index-llms-ollama/llama_index/llms/ollama/base.py b/llama-index-integrations/llms/llama-index-llms-ollama/llama_index/llms/ollama/base.py index 562b0c73429d8..78281eb5918fd 100644 --- a/llama-index-integrations/llms/llama-index-llms-ollama/llama_index/llms/ollama/base.py +++ b/llama-index-integrations/llms/llama-index-llms-ollama/llama_index/llms/ollama/base.py @@ -20,7 +20,7 @@ DEFAULT_REQUEST_TIMEOUT = 30.0 -def get_addtional_kwargs( +def get_additional_kwargs( response: Dict[str, Any], exclude: Tuple[str, ...] ) -> Dict[str, Any]: return {k: v for k, v in response.items() if k not in exclude} @@ -109,12 +109,12 @@ def chat(self, messages: Sequence[ChatMessage], **kwargs: Any) -> ChatResponse: message=ChatMessage( content=message.get("content"), role=MessageRole(message.get("role")), - additional_kwargs=get_addtional_kwargs( + additional_kwargs=get_additional_kwargs( message, ("content", "role") ), ), raw=raw, - additional_kwargs=get_addtional_kwargs(raw, ("message",)), + additional_kwargs=get_additional_kwargs(raw, ("message",)), ) @llm_chat_callback() @@ -156,13 +156,15 @@ def stream_chat( message=ChatMessage( content=text, role=MessageRole(message.get("role")), - additional_kwargs=get_addtional_kwargs( + additional_kwargs=get_additional_kwargs( message, ("content", "role") ), ), delta=delta, raw=chunk, - additional_kwargs=get_addtional_kwargs(chunk, ("message",)), + additional_kwargs=get_additional_kwargs( + chunk, ("message",) + ), ) @llm_completion_callback() @@ -188,7 +190,7 @@ def complete( return CompletionResponse( text=text, raw=raw, - additional_kwargs=get_addtional_kwargs(raw, ("response",)), + additional_kwargs=get_additional_kwargs(raw, ("response",)), ) @llm_completion_callback() @@ -220,7 +222,7 @@ def stream_complete( delta=delta, text=text, raw=chunk, - additional_kwargs=get_addtional_kwargs( + additional_kwargs=get_additional_kwargs( chunk, ("response",) ), ) diff --git 
a/llama-index-integrations/llms/llama-index-llms-ollama/tests/test_utils.py b/llama-index-integrations/llms/llama-index-llms-ollama/tests/test_utils.py new file mode 100644 index 0000000000000..0d300048cc47d --- /dev/null +++ b/llama-index-integrations/llms/llama-index-llms-ollama/tests/test_utils.py @@ -0,0 +1,12 @@ +from llama_index.llms.ollama.base import get_additional_kwargs + + +def test_get_additional_kwargs(): + response = {"key1": "value1", "key2": "value2", "exclude_me": "value3"} + exclude = ("exclude_me", "exclude_me_too") + + expected = {"key1": "value1", "key2": "value2"} + + actual = get_additional_kwargs(response, exclude) + + assert actual == expected diff --git a/llama-index-integrations/llms/llama-index-llms-openai/pyproject.toml b/llama-index-integrations/llms/llama-index-llms-openai/pyproject.toml index 1319956ecd567..1b0333b9b8d8d 100644 --- a/llama-index-integrations/llms/llama-index-llms-openai/pyproject.toml +++ b/llama-index-integrations/llms/llama-index-llms-openai/pyproject.toml @@ -23,13 +23,13 @@ ignore_missing_imports = true python_version = "3.8" [tool.poetry] -authors = ["Your Name "] +authors = ["llama-index"] description = "llama-index llms openai integration" exclude = ["**/BUILD"] license = "MIT" name = "llama-index-llms-openai" readme = "README.md" -version = "0.1.6" +version = "0.1.7" [tool.poetry.dependencies] python = ">=3.8.1,<4.0" diff --git a/llama-index-integrations/llms/llama-index-llms-perplexity/llama_index/llms/perplexity/base.py b/llama-index-integrations/llms/llama-index-llms-perplexity/llama_index/llms/perplexity/base.py index e3a574f4d5332..5bab5031a782f 100644 --- a/llama-index-integrations/llms/llama-index-llms-perplexity/llama_index/llms/perplexity/base.py +++ b/llama-index-integrations/llms/llama-index-llms-perplexity/llama_index/llms/perplexity/base.py @@ -109,14 +109,13 @@ def metadata(self) -> LLMMetadata: def _get_context_window(self) -> int: model_context_windows = { + "sonar-small-chat": 16384, + 
"sonar-small-online": 12000, + "sonar-medium-chat": 16384, + "sonar-medium-online": 12000, "codellama-34b-instruct": 16384, - "llama-2-70b-chat": 4096, - "mistral-7b-instruct": 4096, - "mixtral-8x7b-instruct": 4096, - "pplx-7b-chat": 8192, - "pplx-70b-chat": 4096, - "pplx-7b-online": 4096, - "pplx-70b-online": 4096, + "mistral-7b-instruct": 16384, + "mixtral-8x7b-instruct": 16384, } return model_context_windows.get( self.model, 4096 @@ -124,14 +123,12 @@ def _get_context_window(self) -> int: def _is_chat_model(self) -> bool: chat_models = { - "codellama-34b-instruct", - "llama-2-70b-chat", + "sonar-small-chat", + "sonar-small-online", + "sonar-medium-chat", + "sonar-medium-online" "codellama-34b-instruct", "mistral-7b-instruct", "mixtral-8x7b-instruct", - "pplx-7b-chat", - "pplx-70b-chat", - "pplx-7b-online", - "pplx-70b-online", } return self.model in chat_models diff --git a/llama-index-integrations/llms/llama-index-llms-perplexity/pyproject.toml b/llama-index-integrations/llms/llama-index-llms-perplexity/pyproject.toml index 0f1b3e22527b8..824d8a13122e1 100644 --- a/llama-index-integrations/llms/llama-index-llms-perplexity/pyproject.toml +++ b/llama-index-integrations/llms/llama-index-llms-perplexity/pyproject.toml @@ -27,7 +27,7 @@ exclude = ["**/BUILD"] license = "MIT" name = "llama-index-llms-perplexity" readme = "README.md" -version = "0.1.2" +version = "0.1.3" [tool.poetry.dependencies] python = ">=3.8.1,<4.0" diff --git a/llama-index-integrations/llms/llama-index-llms-vertex/llama_index/llms/vertex/base.py b/llama-index-integrations/llms/llama-index-llms-vertex/llama_index/llms/vertex/base.py index 02971bd1833e9..0b21e82975e30 100644 --- a/llama-index-integrations/llms/llama-index-llms-vertex/llama_index/llms/vertex/base.py +++ b/llama-index-integrations/llms/llama-index-llms-vertex/llama_index/llms/vertex/base.py @@ -16,6 +16,7 @@ from llama_index.core.llms.callbacks import llm_chat_callback, llm_completion_callback from llama_index.core.llms.llm import 
LLM from llama_index.core.types import BaseOutputParser, PydanticProgramMode +from llama_index.core.utilities.gemini_utils import merge_neighboring_same_role_messages from llama_index.llms.vertex.gemini_utils import create_gemini_client, is_gemini_model from llama_index.llms.vertex.utils import ( CHAT_MODELS, @@ -130,7 +131,9 @@ def metadata(self) -> LLMMetadata: return LLMMetadata( is_chat_model=self._is_chat_model, model_name=self.model, - system_role=MessageRole.USER, # Vertex does not support the default: MessageRole.SYSTEM + system_role=( + MessageRole.USER if self._is_gemini else MessageRole.SYSTEM + ), # Gemini does not support the default: MessageRole.SYSTEM ) @property @@ -152,8 +155,13 @@ def _get_all_kwargs(self, **kwargs: Any) -> Dict[str, Any]: @llm_chat_callback() def chat(self, messages: Sequence[ChatMessage], **kwargs: Any) -> ChatResponse: - question = _parse_message(messages[-1], self._is_gemini) - chat_history = _parse_chat_history(messages[:-1], self._is_gemini) + merged_messages = ( + merge_neighboring_same_role_messages(messages) + if self._is_gemini + else messages + ) + question = _parse_message(merged_messages[-1], self._is_gemini) + chat_history = _parse_chat_history(merged_messages[:-1], self._is_gemini) chat_params = {**chat_history} kwargs = kwargs if kwargs else {} @@ -209,8 +217,13 @@ def complete( def stream_chat( self, messages: Sequence[ChatMessage], **kwargs: Any ) -> ChatResponseGen: - question = _parse_message(messages[-1], self._is_gemini) - chat_history = _parse_chat_history(messages[:-1], self._is_gemini) + merged_messages = ( + merge_neighboring_same_role_messages(messages) + if self._is_gemini + else messages + ) + question = _parse_message(merged_messages[-1], self._is_gemini) + chat_history = _parse_chat_history(merged_messages[:-1], self._is_gemini) chat_params = {**chat_history} kwargs = kwargs if kwargs else {} params = {**self._model_kwargs, **kwargs} @@ -283,8 +296,13 @@ def gen() -> CompletionResponseGen: async def 
achat( self, messages: Sequence[ChatMessage], **kwargs: Any ) -> ChatResponse: - question = _parse_message(messages[-1], self._is_gemini) - chat_history = _parse_chat_history(messages[:-1], self._is_gemini) + merged_messages = ( + merge_neighboring_same_role_messages(messages) + if self._is_gemini + else messages + ) + question = _parse_message(merged_messages[-1], self._is_gemini) + chat_history = _parse_chat_history(merged_messages[:-1], self._is_gemini) chat_params = {**chat_history} kwargs = kwargs if kwargs else {} params = {**self._model_kwargs, **kwargs} diff --git a/llama-index-integrations/llms/llama-index-llms-vertex/llama_index/llms/vertex/utils.py b/llama-index-integrations/llms/llama-index-llms-vertex/llama_index/llms/vertex/utils.py index c9f7bb2f9e97d..cafdd2977bc0e 100644 --- a/llama-index-integrations/llms/llama-index-llms-vertex/llama_index/llms/vertex/utils.py +++ b/llama-index-integrations/llms/llama-index-llms-vertex/llama_index/llms/vertex/utils.py @@ -6,7 +6,6 @@ import google.api_core import vertexai -from llama_index.core.base.llms.types import ChatMessage, MessageRole from tenacity import ( before_sleep_log, retry, @@ -14,12 +13,10 @@ stop_after_attempt, wait_exponential, ) -from vertexai.language_models import ( - ChatMessage as VertexChatMessage, -) -from vertexai.language_models import ( - InputOutputTextPair, -) +from vertexai.language_models import ChatMessage as VertexChatMessage +from vertexai.language_models import InputOutputTextPair + +from llama_index.core.base.llms.types import ChatMessage, MessageRole CHAT_MODELS = ["chat-bison", "chat-bison-32k", "chat-bison@001"] TEXT_MODELS = ["text-bison", "text-bison-32k", "text-bison@001"] @@ -169,9 +166,13 @@ def _parse_chat_history(history: Any, is_gemini: bool) -> Any: for i, message in enumerate(history): if i == 0 and message.role == MessageRole.SYSTEM: if is_gemini: - raise ValueError("Gemini model don't support system messages") + raise ValueError("Gemini model doesn't support 
system messages") context = message.content - elif message.role == MessageRole.ASSISTANT or message.role == MessageRole.USER: + elif message.role in ( + MessageRole.MODEL, + MessageRole.ASSISTANT, + MessageRole.USER, + ): if is_gemini: from llama_index.llms.vertex.gemini_utils import ( convert_chat_message_to_gemini_content, @@ -185,12 +186,16 @@ def _parse_chat_history(history: Any, is_gemini: bool) -> Any: else: vertex_message = VertexChatMessage( content=message.content, - author="bot" if message.role == MessageRole.ASSISTANT else "user", + author=( + "bot" + if message.role in (MessageRole.ASSISTANT, MessageRole.MODEL) + else MessageRole.USER + ), ) vertex_messages.append(vertex_message) else: raise ValueError( - f"Unexpected message with type {type(message)} at the position {i}." + f"Unexpected message with role {message.role} at the position {i}." ) if len(vertex_messages) % 2 != 0: raise ValueError("total no of messages should be even") diff --git a/llama-index-integrations/llms/llama-index-llms-vertex/pyproject.toml b/llama-index-integrations/llms/llama-index-llms-vertex/pyproject.toml index d1e15c08261df..be582e194b98c 100644 --- a/llama-index-integrations/llms/llama-index-llms-vertex/pyproject.toml +++ b/llama-index-integrations/llms/llama-index-llms-vertex/pyproject.toml @@ -27,7 +27,7 @@ exclude = ["**/BUILD"] license = "MIT" name = "llama-index-llms-vertex" readme = "README.md" -version = "0.1.3" +version = "0.1.4" [tool.poetry.dependencies] python = ">=3.8.1,<4.0" diff --git a/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/.gitignore b/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/.gitignore new file mode 100644 index 0000000000000..990c18de22908 --- /dev/null +++ b/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/.gitignore @@ -0,0 +1,153 @@ +llama_index/_static +.DS_Store +# Byte-compiled / optimized / DLL files +__pycache__/ +*.py[cod] +*$py.class + 
+# C extensions +*.so + +# Distribution / packaging +.Python +bin/ +build/ +develop-eggs/ +dist/ +downloads/ +eggs/ +.eggs/ +etc/ +include/ +lib/ +lib64/ +parts/ +sdist/ +share/ +var/ +wheels/ +pip-wheel-metadata/ +share/python-wheels/ +*.egg-info/ +.installed.cfg +*.egg +MANIFEST + +# PyInstaller +# Usually these files are written by a python script from a template +# before PyInstaller builds the exe, so as to inject date/other infos into it. +*.manifest +*.spec + +# Installer logs +pip-log.txt +pip-delete-this-directory.txt + +# Unit test / coverage reports +htmlcov/ +.tox/ +.nox/ +.coverage +.coverage.* +.cache +nosetests.xml +coverage.xml +*.cover +*.py,cover +.hypothesis/ +.pytest_cache/ +.ruff_cache + +# Translations +*.mo +*.pot + +# Django stuff: +*.log +local_settings.py +db.sqlite3 +db.sqlite3-journal + +# Flask stuff: +instance/ +.webassets-cache + +# Scrapy stuff: +.scrapy + +# Sphinx documentation +docs/_build/ + +# PyBuilder +target/ + +# Jupyter Notebook +.ipynb_checkpoints +notebooks/ + +# IPython +profile_default/ +ipython_config.py + +# pyenv +.python-version + +# pipenv +# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control. +# However, in case of collaboration, if having platform-specific dependencies or dependencies +# having no cross-platform support, pipenv may install dependencies that don't work, or not +# install all needed dependencies. +#Pipfile.lock + +# PEP 582; used by e.g. 
github.com/David-OConnor/pyflow +__pypackages__/ + +# Celery stuff +celerybeat-schedule +celerybeat.pid + +# SageMath parsed files +*.sage.py + +# Environments +.env +.venv +env/ +venv/ +ENV/ +env.bak/ +venv.bak/ +pyvenv.cfg + +# Spyder project settings +.spyderproject +.spyproject + +# Rope project settings +.ropeproject + +# mkdocs documentation +/site + +# mypy +.mypy_cache/ +.dmypy.json +dmypy.json + +# Pyre type checker +.pyre/ + +# Jetbrains +.idea +modules/ +*.swp + +# VsCode +.vscode + +# pipenv +Pipfile +Pipfile.lock + +# pyright +pyrightconfig.json diff --git a/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/BUILD b/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/BUILD new file mode 100644 index 0000000000000..0896ca890d8bf --- /dev/null +++ b/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/BUILD @@ -0,0 +1,3 @@ +poetry_requirements( + name="poetry", +) diff --git a/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/Makefile b/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/Makefile new file mode 100644 index 0000000000000..b9eab05aa3706 --- /dev/null +++ b/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/Makefile @@ -0,0 +1,17 @@ +GIT_ROOT ?= $(shell git rev-parse --show-toplevel) + +help: ## Show all Makefile targets. + @grep -E '^[a-zA-Z_-]+:.*?## .*$$' $(MAKEFILE_LIST) | awk 'BEGIN {FS = ":.*?## "}; {printf "\033[33m%-30s\033[0m %s\n", $$1, $$2}' + +format: ## Run code autoformatters (black). + pre-commit install + git ls-files | xargs pre-commit run black --files + +lint: ## Run linters: pre-commit (black, ruff, codespell) and mypy + pre-commit install && git ls-files | xargs pre-commit run --show-diff-on-failure --files + +test: ## Run tests via pytest. + pytest tests + +watch-docs: ## Build and watch documentation. 
+ sphinx-autobuild docs/ docs/_build/html --open-browser --watch $(GIT_ROOT)/llama_index/ diff --git a/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/README.md b/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/README.md new file mode 100644 index 0000000000000..2c0efcc4faa28 --- /dev/null +++ b/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/README.md @@ -0,0 +1 @@ +# LlamaIndex Multi-Modal-Llms Integration: Anthropic diff --git a/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/llama_index/multi_modal_llms/anthropic/BUILD b/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/llama_index/multi_modal_llms/anthropic/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/llama_index/multi_modal_llms/anthropic/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/llama_index/multi_modal_llms/anthropic/__init__.py b/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/llama_index/multi_modal_llms/anthropic/__init__.py new file mode 100644 index 0000000000000..f6bbe497845f1 --- /dev/null +++ b/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/llama_index/multi_modal_llms/anthropic/__init__.py @@ -0,0 +1,3 @@ +from llama_index.multi_modal_llms.anthropic.base import AnthropicMultiModal + +__all__ = ["AnthropicMultiModal"] diff --git a/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/llama_index/multi_modal_llms/anthropic/base.py b/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/llama_index/multi_modal_llms/anthropic/base.py new file mode 100644 index 0000000000000..d9a3168c3dc9c --- /dev/null +++ 
class AnthropicMultiModal(MultiModalLLM):
    """Multi-modal (text + image) completion wrapper around the Anthropic SDK.

    Only the completion endpoints (`complete`, `stream_complete` and their
    async counterparts) are implemented; every chat endpoint raises
    `NotImplementedError`.
    """

    model: str = Field(description="The Multi-Modal model to use from Anthropic.")
    temperature: float = Field(description="The temperature to use for sampling.")
    max_tokens: Optional[int] = Field(
        description=" The maximum numbers of tokens to generate, ignoring the number of tokens in the prompt",
        gt=0,
    )
    context_window: Optional[int] = Field(
        description="The maximum number of context tokens for the model.",
        gt=0,
    )
    # `ge` is pydantic's "greater than or equal" constraint; the previous
    # `gte` keyword is not a constraint and was never enforced.
    max_retries: int = Field(
        default=3,
        description="Maximum number of retries.",
        ge=0,
    )
    timeout: float = Field(
        default=60.0,
        description="The timeout, in seconds, for API requests.",
        ge=0,
    )
    api_key: str = Field(
        default=None, description="The Anthropic API key.", exclude=True
    )
    system_prompt: str = Field(default="", description="System Prompt.")
    api_base: str = Field(default=None, description="The base URL for Anthropic API.")
    api_version: str = Field(description="The API version for Anthropic API.")
    additional_kwargs: Dict[str, Any] = Field(
        default_factory=dict, description="Additional kwargs for the Anthropic API."
    )
    default_headers: Dict[str, str] = Field(
        default=None, description="The default headers for API requests."
    )

    _messages_to_prompt: Callable = PrivateAttr()
    _completion_to_prompt: Callable = PrivateAttr()
    _client: Anthropic = PrivateAttr()
    _aclient: AsyncAnthropic = PrivateAttr()
    _http_client: Optional[httpx.Client] = PrivateAttr()

    def __init__(
        self,
        model: str = "claude-3-opus-20240229",
        temperature: float = DEFAULT_TEMPERATURE,
        max_tokens: Optional[int] = 300,
        additional_kwargs: Optional[Dict[str, Any]] = None,
        context_window: Optional[int] = DEFAULT_CONTEXT_WINDOW,
        max_retries: int = 3,
        timeout: float = 60.0,
        api_key: Optional[str] = None,
        api_base: Optional[str] = None,
        api_version: Optional[str] = None,
        messages_to_prompt: Optional[Callable] = None,
        completion_to_prompt: Optional[Callable] = None,
        callback_manager: Optional[CallbackManager] = None,
        default_headers: Optional[Dict[str, str]] = None,
        http_client: Optional[httpx.Client] = None,
        system_prompt: Optional[str] = "",
        **kwargs: Any,
    ) -> None:
        """Validate the configuration and build the sync/async SDK clients.

        Args:
            model: Anthropic model identifier.
            temperature: Sampling temperature.
            max_tokens: Upper bound on generated tokens.
            additional_kwargs: Extra keyword arguments merged into every
                `messages.create` call.
            context_window: Maximum number of context tokens for the model.
            max_retries: Retry count handed to the SDK clients.
            timeout: Request timeout in seconds handed to the SDK clients.
            api_key: API key; resolved through
                `resolve_anthropic_credentials` when omitted.
            api_base: Base URL; resolved the same way.
            api_version: API version; resolved the same way.
            messages_to_prompt: Optional message-to-prompt formatter.
            completion_to_prompt: Optional completion-prompt formatter.
            callback_manager: Forwarded to the base class.
            default_headers: Extra headers sent with every request.
            http_client: Custom `httpx.Client` used by the synchronous client.
            system_prompt: System prompt sent with every request.
            **kwargs: Forwarded to the base-class initializer.
        """
        api_key, api_base, api_version = resolve_anthropic_credentials(
            api_key=api_key,
            api_base=api_base,
            api_version=api_version,
        )

        super().__init__(
            model=model,
            temperature=temperature,
            max_tokens=max_tokens,
            additional_kwargs=additional_kwargs or {},
            context_window=context_window,
            max_retries=max_retries,
            timeout=timeout,
            api_key=api_key,
            api_base=api_base,
            api_version=api_version,
            callback_manager=callback_manager,
            default_headers=default_headers,
            # Previously misspelled as `system_promt`, so the caller's system
            # prompt never reached the `system_prompt` field.
            system_prompt=system_prompt or "",
            **kwargs,
        )

        # Private attributes are assigned only after the model is initialized.
        self._messages_to_prompt = messages_to_prompt or generic_messages_to_prompt
        self._completion_to_prompt = completion_to_prompt or (lambda x: x)
        self._http_client = http_client
        self._client, self._aclient = self._get_clients(**kwargs)

    def _get_clients(self, **kwargs: Any) -> Tuple[Anthropic, AsyncAnthropic]:
        """Create the synchronous and asynchronous Anthropic clients.

        The custom HTTP client is typed as a synchronous `httpx.Client`, so it
        is handed to the synchronous SDK client only.
        """
        credential_kwargs = self._get_credential_kwargs()
        client = Anthropic(http_client=self._http_client, **credential_kwargs)
        aclient = AsyncAnthropic(**credential_kwargs)
        return client, aclient

    @classmethod
    def class_name(cls) -> str:
        """Return the identifier used for this class."""
        return "anthropic_multi_modal_llm"

    @property
    def metadata(self) -> MultiModalLLMMetadata:
        """Multi Modal LLM metadata."""
        return MultiModalLLMMetadata(
            num_output=self.max_tokens or DEFAULT_NUM_OUTPUTS,
            model_name=self.model,
        )

    def _get_credential_kwargs(self, **kwargs: Any) -> Dict[str, Any]:
        """Return the constructor arguments shared by both SDK clients.

        Entries in `kwargs` override the configured values.
        """
        return {
            "api_key": self.api_key,
            "base_url": self.api_base,
            "max_retries": self.max_retries,
            "timeout": self.timeout,
            "default_headers": self.default_headers,
            **kwargs,
        }

    def _get_multi_modal_chat_messages(
        self,
        prompt: str,
        role: str,
        image_documents: Sequence[ImageDocument],
        **kwargs: Any,
    ) -> List[Dict]:
        """Build the `messages` payload for one prompt plus its images."""
        return generate_anthropic_multi_modal_chat_message(
            prompt=prompt,
            role=role,
            image_documents=image_documents,
        )

    # Model Params for Anthropic Multi Modal model.
    def _get_model_kwargs(self, **kwargs: Any) -> Dict[str, Any]:
        """Assemble the keyword arguments for `messages.create`.

        Precedence, lowest to highest: model/temperature, per-call `kwargs`,
        the configured `max_tokens`, then `additional_kwargs`.

        Raises:
            ValueError: If `self.model` is not a known multi-modal model.
        """
        if self.model not in ANTHROPIC_MULTI_MODAL_MODELS:
            raise ValueError(
                f"Invalid model {self.model}. "
                f"Available models are: {list(ANTHROPIC_MULTI_MODAL_MODELS.keys())}"
            )
        base_kwargs = {"model": self.model, "temperature": self.temperature, **kwargs}
        if self.max_tokens is not None:
            base_kwargs["max_tokens"] = self.max_tokens
        return {**base_kwargs, **self.additional_kwargs}

    def _get_response_token_counts(self, raw_response: Any) -> dict:
        """Get the token usage reported by the response.

        Plain dict responses are read exactly as before. Any other response is
        treated as an SDK object: its `usage` attribute, when present, is read
        through `input_tokens` / `output_tokens`. Responses without usage
        (for example streaming delta events) yield an empty dict.
        """
        if isinstance(raw_response, dict):
            usage = raw_response.get("usage", {})
            # NOTE: other model providers that use the Anthropic client may not report usage
            if usage is None:
                return {}
            return {
                "prompt_tokens": usage.get("prompt_tokens", 0),
                "completion_tokens": usage.get("completion_tokens", 0),
                "total_tokens": usage.get("total_tokens", 0),
            }

        usage = getattr(raw_response, "usage", None)
        if usage is None:
            return {}

        prompt_tokens = getattr(usage, "input_tokens", 0) or 0
        completion_tokens = getattr(usage, "output_tokens", 0) or 0
        return {
            "prompt_tokens": prompt_tokens,
            "completion_tokens": completion_tokens,
            "total_tokens": prompt_tokens + completion_tokens,
        }

    def _complete(
        self, prompt: str, image_documents: Sequence[ImageDocument], **kwargs: Any
    ) -> CompletionResponse:
        """Run one blocking completion and wrap the first content block."""
        all_kwargs = self._get_model_kwargs(**kwargs)
        message_dict = self._get_multi_modal_chat_messages(
            prompt=prompt, role=MessageRole.USER, image_documents=image_documents
        )

        response = self._client.messages.create(
            messages=message_dict,
            system=self.system_prompt,
            stream=False,
            **all_kwargs,
        )

        return CompletionResponse(
            text=response.content[0].text,
            raw=response,
            additional_kwargs=self._get_response_token_counts(response),
        )

    def _stream_complete(
        self, prompt: str, image_documents: Sequence[ImageDocument], **kwargs: Any
    ) -> CompletionResponseGen:
        """Return a generator yielding the accumulated text after each delta."""
        all_kwargs = self._get_model_kwargs(**kwargs)
        message_dict = self._get_multi_modal_chat_messages(
            prompt=prompt, role=MessageRole.USER, image_documents=image_documents
        )

        def gen() -> CompletionResponseGen:
            text = ""

            for response in self._client.messages.create(
                messages=message_dict,
                stream=True,
                system=self.system_prompt,
                **all_kwargs,
            ):
                # Only content-block deltas carry text; other events are skipped.
                if isinstance(response, ContentBlockDeltaEvent):
                    # update using deltas
                    content_delta = response.delta.text or ""
                    text += content_delta

                    yield CompletionResponse(
                        delta=content_delta,
                        text=text,
                        raw=response,
                        additional_kwargs=self._get_response_token_counts(response),
                    )

        return gen()

    def complete(
        self, prompt: str, image_documents: Sequence[ImageDocument], **kwargs: Any
    ) -> CompletionResponse:
        """Complete `prompt` using the given images as context."""
        return self._complete(prompt, image_documents, **kwargs)

    def stream_complete(
        self, prompt: str, image_documents: Sequence[ImageDocument], **kwargs: Any
    ) -> CompletionResponseGen:
        """Stream the completion of `prompt` using the given images."""
        return self._stream_complete(prompt, image_documents, **kwargs)

    def chat(
        self,
        **kwargs: Any,
    ) -> Any:
        """Not implemented for this integration."""
        raise NotImplementedError("This function is not yet implemented.")

    def stream_chat(
        self,
        **kwargs: Any,
    ) -> Any:
        """Not implemented for this integration."""
        raise NotImplementedError("This function is not yet implemented.")

    # ===== Async Endpoints =====

    async def _acomplete(
        self, prompt: str, image_documents: Sequence[ImageDocument], **kwargs: Any
    ) -> CompletionResponse:
        """Async counterpart of `_complete`."""
        all_kwargs = self._get_model_kwargs(**kwargs)
        message_dict = self._get_multi_modal_chat_messages(
            prompt=prompt, role=MessageRole.USER, image_documents=image_documents
        )
        response = await self._aclient.messages.create(
            messages=message_dict,
            stream=False,
            system=self.system_prompt,
            **all_kwargs,
        )

        return CompletionResponse(
            text=response.content[0].text,
            raw=response,
            additional_kwargs=self._get_response_token_counts(response),
        )

    async def acomplete(
        self, prompt: str, image_documents: Sequence[ImageDocument], **kwargs: Any
    ) -> CompletionResponse:
        """Asynchronously complete `prompt` using the given images."""
        return await self._acomplete(prompt, image_documents, **kwargs)

    async def _astream_complete(
        self, prompt: str, image_documents: Sequence[ImageDocument], **kwargs: Any
    ) -> CompletionResponseAsyncGen:
        """Async counterpart of `_stream_complete`; returns an async generator."""
        all_kwargs = self._get_model_kwargs(**kwargs)
        message_dict = self._get_multi_modal_chat_messages(
            prompt=prompt, role=MessageRole.USER, image_documents=image_documents
        )

        async def gen() -> CompletionResponseAsyncGen:
            text = ""

            async for response in await self._aclient.messages.create(
                messages=message_dict,
                stream=True,
                system=self.system_prompt,
                **all_kwargs,
            ):
                # Only content-block deltas carry text; other events are skipped.
                if isinstance(response, ContentBlockDeltaEvent):
                    # update using deltas
                    content_delta = response.delta.text or ""
                    text += content_delta

                    yield CompletionResponse(
                        delta=content_delta,
                        text=text,
                        raw=response,
                        additional_kwargs=self._get_response_token_counts(response),
                    )

        return gen()

    async def astream_complete(
        self, prompt: str, image_documents: Sequence[ImageDocument], **kwargs: Any
    ) -> CompletionResponseAsyncGen:
        """Asynchronously stream the completion of `prompt`."""
        return await self._astream_complete(prompt, image_documents, **kwargs)

    async def achat(self, **kwargs: Any) -> Any:
        """Not implemented for this integration."""
        raise NotImplementedError("This function is not yet implemented.")

    async def astream_chat(self, **kwargs: Any) -> Any:
        """Not implemented for this integration."""
        raise NotImplementedError("This function is not yet implemented.")
def generate_anthropic_multi_modal_chat_message(
    prompt: str,
    role: str,
    image_documents: Optional[Sequence[ImageDocument]] = None,
) -> List[Dict[str, Any]]:
    """Build the ``messages`` payload for a single Anthropic multi-modal turn.

    Args:
        prompt: Text of the message.
        role: Role placed on the message (for example ``"user"``).
        image_documents: Images to attach. ``None`` produces a text-only
            message whose ``content`` is the bare prompt string; a sequence
            (even an empty one) produces a list of content blocks ending with
            the text block.

    Returns:
        A one-element list holding the message dict.

    Raises:
        ValueError: If an image document has no ``image_path``, no
            ``metadata["file_path"]`` and no ``image_url``. Such documents
            used to be sent as an empty ``{}`` content block.
        httpx.HTTPStatusError: If downloading an ``image_url`` returns an
            error status, instead of base64-encoding the error body as if it
            were image data.
    """
    # if image_documents is empty, return text only chat message
    if image_documents is None:
        return [{"role": role, "content": prompt}]

    # if image_documents is not empty, return text with images chat message
    completion_content: List[Dict[str, Any]] = []
    for image_document in image_documents:
        # Source precedence: explicit image path, then the metadata file path,
        # then the remote URL.
        local_path = image_document.image_path or image_document.metadata.get(
            "file_path"
        )
        if local_path:
            media_source = local_path
            base64_image = encode_image(local_path)
        elif image_document.image_url:
            media_source = image_document.image_url
            response = httpx.get(media_source)
            response.raise_for_status()
            base64_image = base64.b64encode(response.content).decode("utf-8")
        else:
            raise ValueError(
                "ImageDocument has no image_path, metadata['file_path'] or "
                "image_url to load image data from."
            )

        completion_content.append(
            {
                "type": "image",
                "source": {
                    "type": "base64",
                    "media_type": infer_image_mimetype(media_source),
                    "data": base64_image,
                },
            }
        )

    completion_content.append({"type": "text", "text": prompt})

    return [{"role": role, "content": completion_content}]
default + """ + # resolve from param or env + api_key = get_from_param_or_env("api_key", api_key, "ANTHROPIC_API_KEY", "") + api_base = get_from_param_or_env("api_base", api_base, "ANTHROPIC_API_BASE", "") + api_version = get_from_param_or_env( + "api_version", api_version, "ANTHROPIC_API_VERSION", "" + ) + + # resolve from Anthropic module or default + final_api_key = api_key or "" + final_api_base = api_base or DEFAULT_ANTHROPIC_API_BASE + final_api_version = api_version or DEFAULT_ANTHROPIC_API_VERSION + + return final_api_key, str(final_api_base), final_api_version diff --git a/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/pyproject.toml b/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/pyproject.toml new file mode 100644 index 0000000000000..50bee985a72cb --- /dev/null +++ b/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-anthropic/pyproject.toml @@ -0,0 +1,63 @@ +[build-system] +build-backend = "poetry.core.masonry.api" +requires = ["poetry-core"] + +[tool.codespell] +check-filenames = true +check-hidden = true +skip = "*.csv,*.html,*.json,*.jsonl,*.pdf,*.txt,*.ipynb" + +[tool.llamahub] +contains_example = false +import_path = "llama_index.multi_modal_llms.anthropic" + +[tool.llamahub.class_authors] +AnthropicMultiModal = "llama-index" + +[tool.mypy] +disallow_untyped_defs = true +exclude = ["_static", "build", "examples", "notebooks", "venv"] +ignore_missing_imports = true +python_version = "3.8" + +[tool.poetry] +authors = ["Your Name "] +description = "llama-index multi-modal-llms anthropic integration" +exclude = ["**/BUILD"] +license = "MIT" +name = "llama-index-multi-modal-llms-anthropic" +readme = "README.md" +version = "0.1.2" + +[tool.poetry.dependencies] +python = ">=3.8.1,<4.0" +llama-index-core = "^0.10.1" +anthropic = "0.17.0" + +[tool.poetry.group.dev.dependencies] +ipython = "8.10.0" +jupyter = "^1.0.0" +mypy = "0.991" +pre-commit = "3.2.0" +pylint = 
def test_embedding_class():
    """AnthropicMultiModal must have MultiModalLLM somewhere in its MRO."""
    expected_base = MultiModalLLM.__name__
    mro_names = []
    for klass in AnthropicMultiModal.__mro__:
        mro_names.append(klass.__name__)
    assert expected_base in mro_names
a/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-ollama/llama_index/multi_modal_llms/ollama/base.py b/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-ollama/llama_index/multi_modal_llms/ollama/base.py index a1cd409edc75a..c4e44dca3e769 100644 --- a/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-ollama/llama_index/multi_modal_llms/ollama/base.py +++ b/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-ollama/llama_index/multi_modal_llms/ollama/base.py @@ -1,4 +1,6 @@ -from typing import Any, Dict, Sequence, Tuple +from typing import Any, Dict, Optional, Sequence, Tuple + +from ollama import Client from llama_index.core.base.llms.types import ( ChatMessage, @@ -10,7 +12,7 @@ CompletionResponseGen, MessageRole, ) -from llama_index.core.bridge.pydantic import Field +from llama_index.core.bridge.pydantic import Field, PrivateAttr from llama_index.core.constants import DEFAULT_CONTEXT_WINDOW, DEFAULT_NUM_OUTPUTS from llama_index.core.multi_modal_llms import ( MultiModalLLM, @@ -48,6 +50,10 @@ def _messages_to_dicts(messages: Sequence[ChatMessage]) -> Sequence[Dict[str, An class OllamaMultiModal(MultiModalLLM): + base_url: str = Field( + default="http://localhost:11434", + description="Base url the model is hosted under.", + ) model: str = Field(description="The MultiModal Ollama model to use.") temperature: float = Field( default=0.75, @@ -60,21 +66,19 @@ class OllamaMultiModal(MultiModalLLM): description="The maximum number of context tokens for the model.", gt=0, ) + request_timeout: Optional[float] = Field( + description="The timeout for making http request to Ollama API server", + ) additional_kwargs: Dict[str, Any] = Field( default_factory=dict, description="Additional model parameters for the Ollama API.", ) + _client: Client = PrivateAttr() def __init__(self, **kwargs: Any) -> None: - """Init params.""" - # make sure that ollama is installed - try: - import ollama # noqa: 
F401 - except ImportError: - raise ImportError( - "Ollama is not installed. Please install it using `pip install ollama`." - ) + """Init params and ollama client.""" super().__init__(**kwargs) + self._client = Client(host=self.base_url, timeout=self.request_timeout) @classmethod def class_name(cls) -> str: @@ -103,10 +107,8 @@ def _model_kwargs(self) -> Dict[str, Any]: def chat(self, messages: Sequence[ChatMessage], **kwargs: Any) -> ChatResponse: """Chat.""" - import ollama - ollama_messages = _messages_to_dicts(messages) - response = ollama.chat( + response = self._client.chat( model=self.model, messages=ollama_messages, stream=False, **kwargs ) return ChatResponse( @@ -123,10 +125,8 @@ def stream_chat( self, messages: Sequence[ChatMessage], **kwargs: Any ) -> ChatResponseGen: """Stream chat.""" - import ollama - ollama_messages = _messages_to_dicts(messages) - response = ollama.chat( + response = self._client.chat( model=self.model, messages=ollama_messages, stream=True, **kwargs ) text = "" @@ -157,9 +157,7 @@ def complete( **kwargs: Any, ) -> CompletionResponse: """Complete.""" - import ollama - - response = ollama.generate( + response = self._client.generate( model=self.model, prompt=prompt, images=image_documents_to_base64(image_documents), @@ -181,9 +179,7 @@ def stream_complete( **kwargs: Any, ) -> CompletionResponseGen: """Stream complete.""" - import ollama - - response = ollama.generate( + response = self._client.generate( model=self.model, prompt=prompt, images=image_documents_to_base64(image_documents), diff --git a/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-ollama/pyproject.toml b/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-ollama/pyproject.toml index 8100f24534041..65a021d3cc80b 100644 --- a/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-ollama/pyproject.toml +++ b/llama-index-integrations/multi_modal_llms/llama-index-multi-modal-llms-ollama/pyproject.toml @@ -27,7 +27,7 
@@ exclude = ["**/BUILD"] license = "MIT" name = "llama-index-multi-modal-llms-ollama" readme = "README.md" -version = "0.1.2" +version = "0.1.3" [tool.poetry.dependencies] python = ">=3.8.1,<4.0" diff --git a/llama-index-integrations/readers/README.md b/llama-index-integrations/readers/README.md index 28086dbb4d088..cd6aa2c93d911 100644 --- a/llama-index-integrations/readers/README.md +++ b/llama-index-integrations/readers/README.md @@ -1,15 +1,16 @@ # Readers (Loaders) -## Reader Usage (Use `download_loader` from LlamaIndex) +Readers can be installed directly as packages: -You can also use the loaders with `download_loader` from LlamaIndex in a single line of code. +```bash +pip install llama-index-readers-google +``` For example, see the code snippets below using the Google Docs Loader. ```python from llama_index.core import VectorStoreIndex, download_loader - -GoogleDocsReader = download_loader("GoogleDocsReader") +from llama_index.readers.google import GoogleDocsReader gdoc_ids = ["1wf-y2pd9C878Oh-FmLH7Q_BQkljdm6TQal-c1pUfrec"] loader = GoogleDocsReader() diff --git a/llama-index-integrations/readers/llama-index-readers-agent-search/README.md b/llama-index-integrations/readers/llama-index-readers-agent-search/README.md index 3d7f9ad282186..d67611bceac0a 100644 --- a/llama-index-integrations/readers/llama-index-readers-agent-search/README.md +++ b/llama-index-integrations/readers/llama-index-readers-agent-search/README.md @@ -1,5 +1,9 @@ # AgentSearch Loader +```bash +pip install llama-index-readers-agent-search +``` + This framework facilitates seamless integration with the AgentSearch dataset or hosted search APIs (e.g. Search Engines) and with RAG-specialized LLM's (e.g. Search Agents). During query-time, the user passes in the query string, search provider (`bing`, `agent-search`), and RAG provider model (`SciPhi/Sensei-7B-V1`). @@ -15,9 +19,7 @@ Here's an example usage of the AgentSearchReader. # import os # os.environ["SCIPHI_API_KEY"] = "..." 
-from llama_index import download_loader - -AgentSearch = download_loader("AgentSearchReader") +from llama_index.readers.agent_search import AgentSearchReader -reader = AgentSearch() +reader = AgentSearchReader() diff --git a/llama-index-integrations/readers/llama-index-readers-airbyte-cdk/README.md b/llama-index-integrations/readers/llama-index-readers-airbyte-cdk/README.md index 534cdab3b27df..bf621cf2a45d4 100644 --- a/llama-index-integrations/readers/llama-index-readers-airbyte-cdk/README.md +++ b/llama-index-integrations/readers/llama-index-readers-airbyte-cdk/README.md @@ -1,10 +1,14 @@ # Airbyte CDK Loader +```bash +pip install llama-index-readers-airbyte-cdk +``` + The Airbyte CDK Loader is a shim for sources created using the [Airbyte Python CDK](https://docs.airbyte.com/connector-development/cdk-python/). It allows you to load data from any Airbyte source into LlamaIndex. ## Installation -- Install llama_hub: `pip install llama_hub` +- Install llama-index reader: `pip install llama-index-readers-airbyte-cdk` - Install airbyte-cdk: `pip install airbyte-cdk` - Install a source via git (or implement your own): `pip install git+https://github.com/airbytehq/airbyte.git@master#egg=source_github&subdirectory=airbyte-integrations/connectors/source-github` @@ -15,8 +19,7 @@ Implement and import your own source. You can find lots of resources for how to Here's an example usage of the AirbyteCdkReader. 
```python -from llama_index import download_loader -from llama_hub.airbyte_cdk import AirbyteCDKReader +from llama_index.readers.airbyte_cdk import AirbyteCDKReader from source_github.source import ( SourceGithub, ) # this is just an example, you can use any source here - this one is loaded from the Airbyte Github repo via pip install git+https://github.com/airbytehq/airbyte.git@master#egg=source_github&subdirectory=airbyte-integrations/connectors/source-github` diff --git a/llama-index-integrations/readers/llama-index-readers-airbyte-gong/README.md b/llama-index-integrations/readers/llama-index-readers-airbyte-gong/README.md index 94a7c3f130e30..20b46ee18e075 100644 --- a/llama-index-integrations/readers/llama-index-readers-airbyte-gong/README.md +++ b/llama-index-integrations/readers/llama-index-readers-airbyte-gong/README.md @@ -1,18 +1,17 @@ # Airbyte Gong Loader -The Airbyte Gong Loader allows you to access different Gong objects. - -## Installation +```bash +pip install llama-index-readers-airbyte-gong +``` -- Install llama_hub: `pip install llama_hub` -- Install the gong source: `pip install airbyte-source-gong` +The Airbyte Gong Loader allows you to access different Gong objects. ## Usage Here's an example usage of the AirbyteGongReader. ```python -from llama_hub.airbyte_gong import AirbyteGongReader +from llama_index.readers.airbyte_gong import AirbyteGongReader gong_config = { # ... diff --git a/llama-index-integrations/readers/llama-index-readers-airbyte-hubspot/README.md b/llama-index-integrations/readers/llama-index-readers-airbyte-hubspot/README.md index 34fca9a7318d5..29eef93781030 100644 --- a/llama-index-integrations/readers/llama-index-readers-airbyte-hubspot/README.md +++ b/llama-index-integrations/readers/llama-index-readers-airbyte-hubspot/README.md @@ -1,18 +1,17 @@ # Airbyte Hubspot Loader -The Airbyte Hubspot Loader allows you to access different Hubspot objects. 
- -## Installation +```bash +pip install llama-index-readers-airbyte-hubspot +``` -- Install llama_hub: `pip install llama_hub` -- Install the hubspot source: `pip install airbyte-source-hubspot` +The Airbyte Hubspot Loader allows you to access different Hubspot objects. ## Usage Here's an example usage of the AirbyteHubspotReader. ```python -from llama_hub.airbyte_hubspot import AirbyteHubspotReader +from llama_index.readers.airbyte_hubspot import AirbyteHubspotReader hubspot_config = { # ... diff --git a/llama-index-integrations/readers/llama-index-readers-airbyte-salesforce/README.md b/llama-index-integrations/readers/llama-index-readers-airbyte-salesforce/README.md index 375ea08282eea..7b03d4492a998 100644 --- a/llama-index-integrations/readers/llama-index-readers-airbyte-salesforce/README.md +++ b/llama-index-integrations/readers/llama-index-readers-airbyte-salesforce/README.md @@ -1,18 +1,17 @@ # Airbyte Salesforce Loader -The Airbyte Salesforce Loader allows you to access different Salesforce objects. - -## Installation +```bash +pip install llama-index-readers-airbyte-salesforce +``` -- Install llama_hub: `pip install llama_hub` -- Install the salesforce source: `pip install airbyte-source-salesforce` +The Airbyte Salesforce Loader allows you to access different Salesforce objects. ## Usage Here's an example usage of the AirbyteSalesforceReader. ```python -from llama_hub.airbyte_salesforce import AirbyteSalesforceReader +from llama_index.readers.airbyte_salesforce import AirbyteSalesforceReader salesforce_config = { # ... 
diff --git a/llama-index-integrations/readers/llama-index-readers-airbyte-shopify/README.md b/llama-index-integrations/readers/llama-index-readers-airbyte-shopify/README.md index 8802120283d4f..c2c250b5521e9 100644 --- a/llama-index-integrations/readers/llama-index-readers-airbyte-shopify/README.md +++ b/llama-index-integrations/readers/llama-index-readers-airbyte-shopify/README.md @@ -1,18 +1,17 @@ # Airbyte Shopify Loader -The Airbyte Shopify Loader allows you to access different Shopify objects. - -## Installation +```bash +pip install llama-index-readers-airbyte-shopify +``` -- Install llama_hub: `pip install llama_hub` -- Install the shopify source: `pip install airbyte-source-shopify` +The Airbyte Shopify Loader allows you to access different Shopify objects. ## Usage Here's an example usage of the AirbyteShopifyReader. ```python -from llama_hub.airbyte_shopify import AirbyteShopifyReader +from llama_index.readers.airbyte_shopify import AirbyteShopifyReader shopify_config = { # ... diff --git a/llama-index-integrations/readers/llama-index-readers-airbyte-stripe/README.md b/llama-index-integrations/readers/llama-index-readers-airbyte-stripe/README.md index 094255a574969..96b9dfe3de793 100644 --- a/llama-index-integrations/readers/llama-index-readers-airbyte-stripe/README.md +++ b/llama-index-integrations/readers/llama-index-readers-airbyte-stripe/README.md @@ -1,18 +1,17 @@ # Airbyte Stripe Loader -The Airbyte Stripe Loader allows you to access different Stripe objects. - -## Installation +```bash +pip install llama-index-readers-airbyte-stripe +``` -- Install llama_hub: `pip install llama_hub` -- Install the stripe source: `pip install airbyte-source-stripe` +The Airbyte Stripe Loader allows you to access different Stripe objects. ## Usage Here's an example usage of the AirbyteStripeReader. ```python -from llama_hub.airbyte_stripe import AirbyteStripeReader +from llama_index.readers.airbyte_stripe import AirbyteStripeReader stripe_config = { # ... 
diff --git a/llama-index-integrations/readers/llama-index-readers-airbyte-typeform/README.md b/llama-index-integrations/readers/llama-index-readers-airbyte-typeform/README.md index bb9338d260ad3..a4f7ee9760142 100644 --- a/llama-index-integrations/readers/llama-index-readers-airbyte-typeform/README.md +++ b/llama-index-integrations/readers/llama-index-readers-airbyte-typeform/README.md @@ -1,18 +1,17 @@ # Airbyte Typeform Loader -The Airbyte Typeform Loader allows you to access different Typeform objects. - -## Installation +```bash +pip install llama-index-readers-airbyte-typeform +``` -- Install llama_hub: `pip install llama_hub` -- Install the typeform source: `pip install airbyte-source-typeform` +The Airbyte Typeform Loader allows you to access different Typeform objects. ## Usage Here's an example usage of the AirbyteTypeformReader. ```python -from llama_hub.airbyte_typeform import AirbyteTypeformReader +from llama_index.readers.airbyte_typeform import AirbyteTypeformReader typeform_config = { # ... diff --git a/llama-index-integrations/readers/llama-index-readers-airbyte-zendesk-support/README.md b/llama-index-integrations/readers/llama-index-readers-airbyte-zendesk-support/README.md index 8e9359053e2a9..72aa30eb1cce0 100644 --- a/llama-index-integrations/readers/llama-index-readers-airbyte-zendesk-support/README.md +++ b/llama-index-integrations/readers/llama-index-readers-airbyte-zendesk-support/README.md @@ -1,18 +1,19 @@ # Airbyte ZendeskSupport Loader -The Airbyte ZendeskSupport Loader allows you to access different ZendeskSupport objects. - -## Installation +```bash +pip install llama-index-readers-airbyte-zendesk-support +``` -- Install llama_hub: `pip install llama_hub` -- Install the zendesk_support source: `pip install airbyte-source-zendesk-support` +The Airbyte ZendeskSupport Loader allows you to access different ZendeskSupport objects. ## Usage Here's an example usage of the AirbyteZendeskSupportReader. 
```python -from llama_hub.airbyte_zendesk_support import AirbyteZendeskSupportReader +from llama_index.readers.airbyte_zendesk_support import ( + AirbyteZendeskSupportReader, +) zendesk_support_config = { # ... diff --git a/llama-index-integrations/readers/llama-index-readers-airtable/README.md b/llama-index-integrations/readers/llama-index-readers-airtable/README.md index 64197e51dbcb4..ab47b7c07de38 100644 --- a/llama-index-integrations/readers/llama-index-readers-airtable/README.md +++ b/llama-index-integrations/readers/llama-index-readers-airtable/README.md @@ -1,5 +1,9 @@ # Airtable Loader +```bash +pip install llama-index-readers-airtable +``` + This loader loads documents from Airtable. The user specifies an API token to initialize the AirtableReader. They then specify a `table_id` and a `base_id` to load in the corresponding Document objects. ## Usage @@ -7,10 +11,9 @@ This loader loads documents from Airtable. The user specifies an API token to in Here's an example usage of the AirtableReader. ```python -from llama_index import download_loader import os -AirtableReader = download_loader("AirtableReader") +from llama_index.readers.airtable import AirtableReader reader = AirtableReader("") documents = reader.load_data(table_id="", base_id="") diff --git a/llama-index-integrations/readers/llama-index-readers-apify/README.md b/llama-index-integrations/readers/llama-index-readers-apify/README.md index e752e540db716..a52ae9787dc5e 100644 --- a/llama-index-integrations/readers/llama-index-readers-apify/README.md +++ b/llama-index-integrations/readers/llama-index-readers-apify/README.md @@ -1,5 +1,9 @@ # Apify Loaders +```bash +pip install llama-index-readers-apify +``` + ## Apify Actor Loader [Apify](https://apify.com/) is a cloud platform for web scraping and data extraction, @@ -20,8 +24,7 @@ To use this loader, you need to have a (free) Apify account and set your [Apify API token](https://console.apify.com/account/integrations) in the code. 
```python -from llama_index import download_loader -from llama_index.readers.schema import Document +from llama_index.core import Document # Converts a single record from the Actor's resulting dataset to the LlamaIndex format @@ -34,7 +37,7 @@ def tranform_dataset_item(item): ) -ApifyActor = download_loader("ApifyActor") +from llama_index.readers.apify import ApifyActor reader = ApifyActor("") documents = reader.load_data( @@ -72,8 +75,7 @@ To use this loader, you need to have a (free) Apify account and set your [Apify API token](https://console.apify.com/account/integrations) in the code. ```python -from llama_index import download_loader -from llama_index.readers.schema import Document +from llama_index.core import Document # Converts a single record from the Apify dataset to the LlamaIndex format @@ -86,7 +88,7 @@ def tranform_dataset_item(item): ) -ApifyDataset = download_loader("ApifyDataset") +from llama_index.readers.apify import ApifyDataset reader = ApifyDataset("") documents = reader.load_data( diff --git a/llama-index-integrations/readers/llama-index-readers-arango-db/README.md b/llama-index-integrations/readers/llama-index-readers-arango-db/README.md index e31489ee1ec9c..d8fef88eb1f98 100644 --- a/llama-index-integrations/readers/llama-index-readers-arango-db/README.md +++ b/llama-index-integrations/readers/llama-index-readers-arango-db/README.md @@ -1,5 +1,9 @@ # LlamaIndex Readers Integration: Arango Db +```bash +pip install llama-index-readers-arango-db +``` + This loader loads documents from ArangoDB. The user specifies a ArangoDB instance to initialize the reader. They then specify the collection name and query params to fetch the relevant docs. @@ -9,10 +13,9 @@ fetch the relevant docs. Here's an example usage of the SimpleArangoDBReader. 
```python -from llama_index.core.readers import download_loader import os -SimpleArangoDBReader = download_loader("SimpleArangoDBReader") +from llama_index.readers.arango_db import SimpleArangoDBReader host = "" db_name = "" @@ -32,4 +35,4 @@ documents = reader.load_data( ) ``` -This loader is designed to be used as a way to load data into [LlamaIndex](https://github.com/run-llama/llama_index/tree/main/llama_index) and/or subsequently used as a Tool in a [LangChain](https://github.com/hwchase17/langchain) Agent. See [here](https://github.com/run-llama/llama-hub/tree/main/llama_hub) for examples. +This loader is designed to be used as a way to load data into [LlamaIndex](https://github.com/run-llama/llama_index/tree/main/llama_index) and/or subsequently used as a Tool in a [LangChain](https://github.com/hwchase17/langchain) Agent. diff --git a/llama-index-integrations/readers/llama-index-readers-asana/README.md b/llama-index-integrations/readers/llama-index-readers-asana/README.md index 2bd439c33e365..cbfe43f829009 100644 --- a/llama-index-integrations/readers/llama-index-readers-asana/README.md +++ b/llama-index-integrations/readers/llama-index-readers-asana/README.md @@ -1,5 +1,9 @@ # Asana Loader +```bash +pip install llama-index-readers-asana +``` + This loader loads documents from Asana. The user specifies an API token to initialize the AsanaReader. They then specify a `workspace_id` OR a `project_id` to load in the corresponding Document objects. ## Usage @@ -7,10 +11,9 @@ This loader loads documents from Asana. The user specifies an API token to initi Here's an example usage of the AsanaReader. 
```python -from llama_index import download_loader import os -AsanaReader = download_loader("AsanaReader") +from llama_index.readers.asana import AsanaReader reader = AsanaReader("") diff --git a/llama-index-integrations/readers/llama-index-readers-assemblyai/README.md b/llama-index-integrations/readers/llama-index-readers-assemblyai/README.md index e0e7d14cfef64..36fdd1c65800e 100644 --- a/llama-index-integrations/readers/llama-index-readers-assemblyai/README.md +++ b/llama-index-integrations/readers/llama-index-readers-assemblyai/README.md @@ -1,5 +1,9 @@ # AssemblyAI Audio Transcript Loader +```bash +pip install llama-index-readers-assemblyai +``` + The AssemblyAI Audio Transcript Loader allows to transcribe audio files with the [AssemblyAI API](https://www.assemblyai.com/) and loads the transcribed text into documents. To use it, you should have the `assemblyai` python package installed, and the environment variable `ASSEMBLYAI_API_KEY` set with your API key. Alternatively, the API key can also be passed as an argument. @@ -10,40 +14,12 @@ More info about AssemblyAI: - [Get a Free API key](https://www.assemblyai.com/dashboard/signup) - [AssemblyAI API Docs](https://www.assemblyai.com/docs) -## Installation - -First, you need to install the `assemblyai` python package. - -You can find more info about it inside the [assemblyai-python-sdk GitHub repo](https://github.com/AssemblyAI/assemblyai-python-sdk). - -```bash -pip install assemblyai -``` - -Optionally: You can install the AssemblyAI integration yourself with: - -```bash -pip install llama-index-readers-assemblyai -``` - -Then you can import it with: - -```python -from llama_index.readers.assemblyai import AssemblyAIAudioTranscriptReader -``` - -As an alternative, you can also use the `download_loader()` to install and use this integration (see next section). - ## Usage The `AssemblyAIAudioTranscriptReader` needs at least the `file_path` argument. Audio files can be specified as an URL or a local file path. 
```python -from llama_index.core import download_loader - -AssemblyAIAudioTranscriptReader = download_loader( - "AssemblyAIAudioTranscriptReader" -) +from llama_index.readers.assemblyai import AssemblyAIAudioTranscriptReader audio_file = "https://storage.googleapis.com/aai-docs-samples/nbc.mp3" # or a local file path: audio_file = "./nbc.mp3" diff --git a/llama-index-integrations/readers/llama-index-readers-astra-db/README.md b/llama-index-integrations/readers/llama-index-readers-astra-db/README.md index bd7b4e7cdeff2..eda6a64ad4ef4 100644 --- a/llama-index-integrations/readers/llama-index-readers-astra-db/README.md +++ b/llama-index-integrations/readers/llama-index-readers-astra-db/README.md @@ -1,5 +1,9 @@ # Astra DB Loader +```bash +pip install llama-index-readers-astra-db +``` + The Astra DB Loader returns a set of documents retrieved from Astra DB. The user initializes the loader with an Astra DB index. They then pass in a vector. @@ -10,8 +14,6 @@ Here's an example usage of the AstraDBReader. ```python from openai import OpenAI -from llama_index import download_loader - # Get the credentials for Astra DB api_endpoint = "https://324<...>f1c.astra.datastax.com" @@ -29,7 +31,7 @@ response = client.embeddings.create( query_vector = response.data[0].embedding # Initialize the Reader object -AstraDBReader = download_loader("AstraDBReader") +from llama_index.readers.astra_db import AstraDBReader # Your Astra DB Account will provide you with the endpoint URL and Token reader = AstraDBReader( diff --git a/llama-index-integrations/readers/llama-index-readers-athena/README.md b/llama-index-integrations/readers/llama-index-readers-athena/README.md index afff8d84f5c64..082e2ca83c151 100644 --- a/llama-index-integrations/readers/llama-index-readers-athena/README.md +++ b/llama-index-integrations/readers/llama-index-readers-athena/README.md @@ -1,5 +1,11 @@ # Athena reader. 
+```bash +pip install llama-index-readers-athena + +pip install llama-index-llms-openai +``` + Athena reader allow execute SQL with AWS Athena. We using SQLAlchemy and PyAthena under the hood. ## Permissions @@ -13,10 +19,10 @@ Here's an example usage of the AthenaReader. ``` import os import dotenv -from llama_index import SQLDatabase,ServiceContext -from llama_index.indices.struct_store import NLSQLTableQueryEngine -from llama_index.llms import OpenAI -from llama_hub.athena import AthenaReader +from llama_index.core import SQLDatabase,ServiceContext +from llama_index.core.query_engine import NLSQLTableQueryEngine +from llama_index.llms.openai import OpenAI +from llama_index.readers.athena import AthenaReader dotenv.load_dotenv() diff --git a/llama-index-integrations/readers/llama-index-readers-azcognitive-search/README.md b/llama-index-integrations/readers/llama-index-readers-azcognitive-search/README.md index 953bef038c961..9891527c4abde 100644 --- a/llama-index-integrations/readers/llama-index-readers-azcognitive-search/README.md +++ b/llama-index-integrations/readers/llama-index-readers-azcognitive-search/README.md @@ -1,5 +1,9 @@ # Azure Cognitive Search Loader +```bash +pip install llama-index-readers-azcognitive-search +``` + The AzCognitiveSearchReader Loader returns a set of texts corresponding to documents retrieved from specific index of Azure Cognitive Search. The user initializes the loader with credentials (service name and key) and the index name. @@ -8,9 +12,7 @@ The user initializes the loader with credentials (service name and key) and the Here's an example usage of the AzCognitiveSearchReader. 
```python -from llama_index import download_loader - -AzCognitiveSearchReader = download_loader("AzCognitiveSearchReader") +from llama_index.readers.azcognitive_search import AzCognitiveSearchReader reader = AzCognitiveSearchReader( "", @@ -30,11 +32,11 @@ documents = reader.load_data( ## Usage in combination with langchain ```python -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex, download_loader from langchain.chains.conversation.memory import ConversationBufferMemory from langchain.agents import Tool, AgentExecutor, load_tools, initialize_agent -AzCognitiveSearchReader = download_loader("AzCognitiveSearchReader") +from llama_index.readers.azcognitive_search import AzCognitiveSearchReader az_loader = AzCognitiveSearchReader( COGNITIVE_SEARCH_SERVICE_NAME, COGNITIVE_SEARCH_KEY, INDEX_NAME diff --git a/llama-index-integrations/readers/llama-index-readers-azstorage-blob/README.md b/llama-index-integrations/readers/llama-index-readers-azstorage-blob/README.md index 306aec783686a..e4c1adcbfb2c1 100644 --- a/llama-index-integrations/readers/llama-index-readers-azstorage-blob/README.md +++ b/llama-index-integrations/readers/llama-index-readers-azstorage-blob/README.md @@ -1,5 +1,9 @@ # Azure Storage Blob Loader +```bash +pip install llama-index-readers-azstorage-blob +``` + This loader parses any file stored as an Azure Storage blob or the entire container (with an optional prefix / attribute filter) if no particular file is specified. When initializing `AzStorageBlobReader`, you may pass in your account url with a SAS token or crdentials to authenticate. All files are temporarily downloaded locally and subsequently parsed with `SimpleDirectoryReader`. Hence, you may also specify a custom `file_extractor`, relying on any of the loaders in this library (or your own)! If you need a clue on finding the file extractor object because you'd like to use your own file extractor, follow this sample. 
@@ -20,9 +24,7 @@ To use this loader, you need to pass in the name of your Azure Storage Container ### Using a Storage Account SAS URL ```python -from llama_index import download_loader - -AzStorageBlobReader = download_loader("AzStorageBlobReader") +from llama_index.readers.azstorage_blob import AzStorageBlobReader loader = AzStorageBlobReader( container="scrabble-dictionary", @@ -38,9 +40,7 @@ documents = loader.load_data() The sample below will download all files in a container, by only specifying the storage account's connection string and the container name. ```python -from llama_index import download_loader - -AzStorageBlobReader = download_loader("AzStorageBlobReader") +from llama_index.readers.azstorage_blob import AzStorageBlobReader loader = AzStorageBlobReader( container_name="", @@ -57,12 +57,11 @@ Ensure the Azure Identity library is available `pip install azure-identity` The sample below downloads all files in the container using the default credential, alternative credential options are available such as a service principal `ClientSecretCredential` ```python -from llama_index import download_loader from azure.identity import DefaultAzureCredential default_credential = DefaultAzureCredential() -AzStorageBlobReader = download_loader("AzStorageBlobReader") +from llama_index.readers.azstorage_blob import AzStorageBlobReader loader = AzStorageBlobReader( container_name="scrabble-dictionary", diff --git a/llama-index-integrations/readers/llama-index-readers-bilibili/README.md b/llama-index-integrations/readers/llama-index-readers-bilibili/README.md index 36bc3b949e0fd..66e93880f7716 100644 --- a/llama-index-integrations/readers/llama-index-readers-bilibili/README.md +++ b/llama-index-integrations/readers/llama-index-readers-bilibili/README.md @@ -1,5 +1,9 @@ # Bilibili Transcript Loader +```bash +pip install llama-index-readers-bilibili +``` + This loader utilizes the `bilibili_api` to fetch the text transcript from Bilibili, one of the most beloved 
long-form video sites in China. With this BilibiliTranscriptReader, users can easily obtain the transcript of their desired video content on the platform. @@ -9,9 +13,8 @@ With this BilibiliTranscriptReader, users can easily obtain the transcript of th To use this loader, you need to pass in an array of Bilibili video links. ```python -from llama_index import download_loader +from llama_index.readers.bilibili import BilibiliTranscriptReader -BilibiliTranscriptReader = download_loader("BilibiliTranscriptReader") loader = BilibiliTranscriptReader() documents = loader.load_data( video_urls=["https://www.bilibili.com/video/BV1yx411L73B/"] diff --git a/llama-index-integrations/readers/llama-index-readers-bitbucket/README.md b/llama-index-integrations/readers/llama-index-readers-bitbucket/README.md index a5f4c506593c0..2edc08dadefc4 100644 --- a/llama-index-integrations/readers/llama-index-readers-bitbucket/README.md +++ b/llama-index-integrations/readers/llama-index-readers-bitbucket/README.md @@ -1,5 +1,9 @@ # Bitbucket Loader +```bash +pip install llama-index-readers-bitbucket +``` + This loader utilizes the Bitbucket API to load the files inside a Bitbucket repository as Documents in an index. 
## Usage @@ -8,7 +12,7 @@ To use this loader, you need to provide as environment variables the `BITBUCKET_ ```python import os -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex, download_loader os.environ["BITBUCKET_USERNAME"] = "myusername" os.environ["BITBUCKET_API_KEY"] = "myapikey" @@ -16,7 +20,7 @@ os.environ["BITBUCKET_API_KEY"] = "myapikey" base_url = "https://myserver/bitbucket" project_key = "mykey" -BitbucketReader = download_loader("BitbucketReader") +from llama_index.readers.bitbucket import BitbucketReader loader = BitbucketReader( base_url=base_url, diff --git a/llama-index-integrations/readers/llama-index-readers-boarddocs/README.md b/llama-index-integrations/readers/llama-index-readers-boarddocs/README.md index d10393b5c8722..ce037d0cc14b1 100644 --- a/llama-index-integrations/readers/llama-index-readers-boarddocs/README.md +++ b/llama-index-integrations/readers/llama-index-readers-boarddocs/README.md @@ -1,5 +1,9 @@ # BoardDocs Loader +```bash +pip install llama-index-readers-boarddocs +``` + This loader retrieves an agenda and associated material from a BoardDocs site. This loader is not endorsed by, developed by, supported by, or in any way formally affiliated with Diligent Corporation. @@ -10,9 +14,7 @@ To use this loader, you'll need to specify which BoardDocs site you want to load as well as the committee on the site you want to scrape. 
```python -from llama_index import download_loader - -BoardDocsReader = download_loader("BoardDocsReader") +from llama_index.readers.boarddocs import BoardDocsReader # For a site URL https://go.boarddocs.com/ca/redwood/Board.nsf/Public # your site should be set to 'ca/redwood' diff --git a/llama-index-integrations/readers/llama-index-readers-confluence/README.md b/llama-index-integrations/readers/llama-index-readers-confluence/README.md index e1cf202d4a724..4b55e6c1d6d52 100644 --- a/llama-index-integrations/readers/llama-index-readers-confluence/README.md +++ b/llama-index-integrations/readers/llama-index-readers-confluence/README.md @@ -1,5 +1,9 @@ # Confluence Loader +```bash +pip install llama-index-readers-confluence +``` + This loader loads pages from a given Confluence cloud instance. The user needs to specify the base URL for a Confluence instance to initialize the ConfluenceReader - base URL needs to end with `/wiki`. The user can optionally specify OAuth 2.0 credentials to authenticate with the Confluence instance. If no credentials are specified, the loader will @@ -42,7 +46,7 @@ Here's an example usage of the ConfluenceReader. 
```python # Example that reads the pages with the `page_ids` -from llama_hub.confluence import ConfluenceReader +from llama_index.readers.confluence import ConfluenceReader token = {"access_token": "", "token_type": ""} oauth2_dict = {"client_id": "", "token": token} @@ -65,7 +69,7 @@ documents.extend( ```python # Example that fetches the first 5, then the next 5 pages from a space -from llama_hub.confluence import ConfluenceReader +from llama_index.readers.confluence import ConfluenceReader token = {"access_token": "", "token_type": ""} oauth2_dict = {"client_id": "", "token": token} @@ -95,7 +99,7 @@ documents.extend( ```python # Example that fetches the first 5 results froma cql query, the uses the cursor to pick up on the next element -from llama_hub.confluence import ConfluenceReader +from llama_index.readers.confluence import ConfluenceReader token = {"access_token": "", "token_type": ""} oauth2_dict = {"client_id": "", "token": token} diff --git a/llama-index-integrations/readers/llama-index-readers-couchbase/README.md b/llama-index-integrations/readers/llama-index-readers-couchbase/README.md index 574ba00b2a61b..f30013bf7a3ff 100644 --- a/llama-index-integrations/readers/llama-index-readers-couchbase/README.md +++ b/llama-index-integrations/readers/llama-index-readers-couchbase/README.md @@ -1,5 +1,9 @@ # LlamaIndex Readers Integration: Couchbase +```bash +pip install llama-index-readers-couchbase +``` + This loader loads documents from Couchbase cluster. The user specifies a Couchbase client or credentials to initialize the reader. They can specify the SQL++ query to fetch the relevant docs. @@ -9,10 +13,9 @@ fetch the relevant docs. Here's an example usage of the CouchbaseReader. 
```python -from llama_index.core.readers import download_loader import os -CouchbaseLoader = download_loader("CouchbaseReader") +from llama_index.readers.couchbase import CouchbaseReader connection_string = ( "couchbase://localhost" # valid Couchbase connection string diff --git a/llama-index-integrations/readers/llama-index-readers-couchdb/README.md b/llama-index-integrations/readers/llama-index-readers-couchdb/README.md index d738eb39b9ef9..cd3b51286c6c8 100644 --- a/llama-index-integrations/readers/llama-index-readers-couchdb/README.md +++ b/llama-index-integrations/readers/llama-index-readers-couchdb/README.md @@ -1,5 +1,9 @@ # CouchDB Loader +```bash +pip install llama-index-readers-couchdb +``` + This loader loads documents from CouchDB. The loader currently supports CouchDB 3.x using the CouchDB3 python wrapper from https://github.com/n-vlahovic/couchdb3 The user specifies a CouchDB instance to initialize the reader. They then specify @@ -10,10 +14,9 @@ the database name and query params to fetch the relevant docs. Here's an example usage of the SimpleCouchDBReader. ```python -from llama_index import download_loader import os -SimpleCouchDBReader = download_loader("SimpleCouchDBReader") +from llama_index.readers.couchdb import SimpleCouchDBReader host = "" port = "" diff --git a/llama-index-integrations/readers/llama-index-readers-dad-jokes/README.md b/llama-index-integrations/readers/llama-index-readers-dad-jokes/README.md index f786ca3b513a3..6e07eeffcbda4 100644 --- a/llama-index-integrations/readers/llama-index-readers-dad-jokes/README.md +++ b/llama-index-integrations/readers/llama-index-readers-dad-jokes/README.md @@ -1,5 +1,9 @@ # DadJoke Loader +```bash +pip install llama-index-readers-dad-jokes +``` + This loader fetches a joke from icanhazdadjoke. ## Usage @@ -7,9 +11,7 @@ This loader fetches a joke from icanhazdadjoke. To use this loader, load it. 
```python -from llama_index import download_loader - -DadJokesReader = download_loader("DadJokesReader") +from llama_index.readers.dad_jokes import DadJokesReader loader = DadJokesReader() documents = loader.load_data() diff --git a/llama-index-integrations/readers/llama-index-readers-discord/README.md b/llama-index-integrations/readers/llama-index-readers-discord/README.md index 522c28c3a63f1..c925cf9539d2a 100644 --- a/llama-index-integrations/readers/llama-index-readers-discord/README.md +++ b/llama-index-integrations/readers/llama-index-readers-discord/README.md @@ -1,5 +1,9 @@ # Discord Loader +```bash +pip install llama-index-readers-discord +``` + This loader loads conversations from Discord. The user specifies `channel_ids` and we fetch conversations from those `channel_ids`. @@ -8,10 +12,9 @@ those `channel_ids`. Here's an example usage of the DiscordReader. ```python -from llama_index import download_loader import os -DiscordReader = download_loader("DiscordReader") +from llama_index.readers.discord import DiscordReader discord_token = os.getenv("DISCORD_TOKEN") channel_ids = [1057178784895348746] # Replace with your channel_id diff --git a/llama-index-integrations/readers/llama-index-readers-docugami/README.md b/llama-index-integrations/readers/llama-index-readers-docugami/README.md index 764a6b603800d..e31a22c9eef45 100644 --- a/llama-index-integrations/readers/llama-index-readers-docugami/README.md +++ b/llama-index-integrations/readers/llama-index-readers-docugami/README.md @@ -1,5 +1,9 @@ # Docugami Loader +```bash +pip install llama-index-readers-docugami +``` + This loader takes in IDs of PDF, DOCX or DOC files processed by [Docugami](https://docugami.com) and returns nodes in a Document XML Knowledge Graph for each document. This is a rich representation that includes the semantic and structural characteristics of various chunks in the document as an XML tree. Entire sets of documents are processed, resulting in forests of XML semantic trees. 
## Pre-requisites @@ -14,9 +18,7 @@ This loader takes in IDs of PDF, DOCX or DOC files processed by [Docugami](https To use this loader, you simply need to pass in a Docugami Doc Set ID, and optionally an array of Document IDs (by default, all documents in the Doc Set are loaded). ```python -from llama_index.core import download_loader - -DocugamiReader = download_loader("DocugamiReader") +from llama_index.readers.docugami import DocugamiReader docset_id = "tjwrr2ekqkc3" document_ids = ["ui7pkriyckwi", "1be3o7ch10iy"] diff --git a/llama-index-integrations/readers/llama-index-readers-earnings-call-transcript/README.md b/llama-index-integrations/readers/llama-index-readers-earnings-call-transcript/README.md index 1eb7b9f24708f..bd5e23b64f52d 100644 --- a/llama-index-integrations/readers/llama-index-readers-earnings-call-transcript/README.md +++ b/llama-index-integrations/readers/llama-index-readers-earnings-call-transcript/README.md @@ -1,5 +1,9 @@ # EARNING CALL TRANSCRIPTS LOADER +```bash +pip install llama-index-readers-earnings-call-transcript +``` + This loader fetches the earning call transcripts of US based companies from the website [discountingcashflows.com](https://discountingcashflows.com/). 
It is not available for commercial purposes Install the required dependencies @@ -17,9 +21,7 @@ The Earning call transcripts takes in three arguments ## Usage ```python -from llama_index import download_loader - -EarningsCallTranscript = download_loader("EarningsCallTranscript") +from llama_index.readers.earnings_call_transcript import EarningsCallTranscript loader = EarningsCallTranscript(2023, "AAPL", "Q3") docs = loader.load_data() @@ -37,10 +39,9 @@ The metadata of the transcripts are the following #### Llama Index ```python -from llama_index import download_loader -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex, download_loader -EarningsCallTranscript = download_loader("EarningsCallTranscript") +from llama_index.readers.earnings_call_transcript import EarningsCallTranscript loader = EarningsCallTranscript(2023, "AAPL", "Q3") docs = loader.load_data() @@ -57,13 +58,12 @@ print(response) #### Langchain ```python -from llama_index import download_loader from langchain.agents import Tool from langchain.agents import initialize_agent from langchain.chat_models import ChatOpenAI from langchain.llms import OpenAI -EarningsCallTranscript = download_loader("EarningsCallTranscript") +from llama_index.readers.earnings_call_transcript import EarningsCallTranscript loader = EarningsCallTranscript(2023, "AAPL", "Q3") docs = loader.load_data() diff --git a/llama-index-integrations/readers/llama-index-readers-feedly-rss/README.md b/llama-index-integrations/readers/llama-index-readers-feedly-rss/README.md index fa201e53b933f..3072a55fe6b9c 100644 --- a/llama-index-integrations/readers/llama-index-readers-feedly-rss/README.md +++ b/llama-index-integrations/readers/llama-index-readers-feedly-rss/README.md @@ -1,13 +1,15 @@ # Feedly Loader +```bash +pip install llama-index-readers-feedly-rss +``` + This loader fetches the entries from a list of RSS feeds subscribed in [Feedly](https://feedly.com). 
You must initialize the loader with your [Feedly API token](https://developer.feedly.com), and then pass the category name which you want to extract. ## Usage ```python -from llama_index import download_loader - -feedlyRssReader = download_loader("FeedlyRssReader") +from llama_index.readers.feedly_rss import FeedlyRssReader -loader = feedlyRssReader(bearer_token="[YOUR_TOKEN]") +loader = FeedlyRssReader(bearer_token="[YOUR_TOKEN]") documents = loader.load_data(category_name="news", max_count=100) diff --git a/llama-index-integrations/readers/llama-index-readers-feishu-docs/README.md b/llama-index-integrations/readers/llama-index-readers-feishu-docs/README.md index b28f90cfd6302..2c378943de1ee 100644 --- a/llama-index-integrations/readers/llama-index-readers-feishu-docs/README.md +++ b/llama-index-integrations/readers/llama-index-readers-feishu-docs/README.md @@ -1,5 +1,9 @@ # Feishu Doc Loader +```bash +pip install llama-index-readers-feishu-docs +``` + This loader takes in IDs of Feishu Docs and parses their text into `documents`. You can extract a Feishu Doc's ID directly from its URL. For example, the ID of `https://test-csl481dfkgqf.feishu.cn/docx/HIH2dHv21ox9kVxjRuwc1W0jnkf` is `HIH2dHv21ox9kVxjRuwc1W0jnkf`. As a prerequisite, you will need to register with Feishu and build an custom app. See [here](https://open.feishu.cn/document/home/introduction-to-custom-app-development/self-built-application-development-process) for instructions. ## Usage @@ -7,12 +11,11 @@ This loader takes in IDs of Feishu Docs and parses their text into `documents`. To use this loader, you simply need to pass in an array of Feishu Doc IDs. The default API endpoints are for Feishu, in order to switch to Lark, we should use `set_lark_domain`.
```python -from llama_index import download_loader - app_id = "cli_slkdjalasdkjasd" app_secret = "dskLLdkasdjlasdKK" doc_ids = ["HIH2dHv21ox9kVxjRuwc1W0jnkf"] -FeishuDocsReader = download_loader("FeishuDocsReader") +from llama_index.readers.feishu_docs import FeishuDocsReader + loader = FeishuDocsReader(app_id, app_secret) documents = loader.load_data(document_ids=doc_ids) ``` diff --git a/llama-index-integrations/readers/llama-index-readers-feishu-wiki/.gitignore b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/.gitignore new file mode 100644 index 0000000000000..990c18de22908 --- /dev/null +++ b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/.gitignore @@ -0,0 +1,153 @@ +llama_index/_static +.DS_Store +# Byte-compiled / optimized / DLL files +__pycache__/ +*.py[cod] +*$py.class + +# C extensions +*.so + +# Distribution / packaging +.Python +bin/ +build/ +develop-eggs/ +dist/ +downloads/ +eggs/ +.eggs/ +etc/ +include/ +lib/ +lib64/ +parts/ +sdist/ +share/ +var/ +wheels/ +pip-wheel-metadata/ +share/python-wheels/ +*.egg-info/ +.installed.cfg +*.egg +MANIFEST + +# PyInstaller +# Usually these files are written by a python script from a template +# before PyInstaller builds the exe, so as to inject date/other infos into it. 
+*.manifest +*.spec + +# Installer logs +pip-log.txt +pip-delete-this-directory.txt + +# Unit test / coverage reports +htmlcov/ +.tox/ +.nox/ +.coverage +.coverage.* +.cache +nosetests.xml +coverage.xml +*.cover +*.py,cover +.hypothesis/ +.pytest_cache/ +.ruff_cache + +# Translations +*.mo +*.pot + +# Django stuff: +*.log +local_settings.py +db.sqlite3 +db.sqlite3-journal + +# Flask stuff: +instance/ +.webassets-cache + +# Scrapy stuff: +.scrapy + +# Sphinx documentation +docs/_build/ + +# PyBuilder +target/ + +# Jupyter Notebook +.ipynb_checkpoints +notebooks/ + +# IPython +profile_default/ +ipython_config.py + +# pyenv +.python-version + +# pipenv +# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control. +# However, in case of collaboration, if having platform-specific dependencies or dependencies +# having no cross-platform support, pipenv may install dependencies that don't work, or not +# install all needed dependencies. +#Pipfile.lock + +# PEP 582; used by e.g. 
github.com/David-OConnor/pyflow +__pypackages__/ + +# Celery stuff +celerybeat-schedule +celerybeat.pid + +# SageMath parsed files +*.sage.py + +# Environments +.env +.venv +env/ +venv/ +ENV/ +env.bak/ +venv.bak/ +pyvenv.cfg + +# Spyder project settings +.spyderproject +.spyproject + +# Rope project settings +.ropeproject + +# mkdocs documentation +/site + +# mypy +.mypy_cache/ +.dmypy.json +dmypy.json + +# Pyre type checker +.pyre/ + +# Jetbrains +.idea +modules/ +*.swp + +# VsCode +.vscode + +# pipenv +Pipfile +Pipfile.lock + +# pyright +pyrightconfig.json diff --git a/llama-index-integrations/readers/llama-index-readers-feishu-wiki/BUILD b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/BUILD new file mode 100644 index 0000000000000..0896ca890d8bf --- /dev/null +++ b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/BUILD @@ -0,0 +1,3 @@ +poetry_requirements( + name="poetry", +) diff --git a/llama-index-integrations/readers/llama-index-readers-feishu-wiki/CHANGELOG.md b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/CHANGELOG.md new file mode 100644 index 0000000000000..36bff877abcbe --- /dev/null +++ b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/CHANGELOG.md @@ -0,0 +1,5 @@ +# CHANGELOG + +## [0.1.2] - 2024-02-13 + +- Add maintainers and keywords from library.json (llamahub) diff --git a/llama-index-integrations/readers/llama-index-readers-feishu-wiki/Makefile b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/Makefile new file mode 100644 index 0000000000000..b9eab05aa3706 --- /dev/null +++ b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/Makefile @@ -0,0 +1,17 @@ +GIT_ROOT ?= $(shell git rev-parse --show-toplevel) + +help: ## Show all Makefile targets. + @grep -E '^[a-zA-Z_-]+:.*?## .*$$' $(MAKEFILE_LIST) | awk 'BEGIN {FS = ":.*?## "}; {printf "\033[33m%-30s\033[0m %s\n", $$1, $$2}' + +format: ## Run code autoformatters (black). 
+ pre-commit install + git ls-files | xargs pre-commit run black --files + +lint: ## Run linters: pre-commit (black, ruff, codespell) and mypy + pre-commit install && git ls-files | xargs pre-commit run --show-diff-on-failure --files + +test: ## Run tests via pytest. + pytest tests + +watch-docs: ## Build and watch documentation. + sphinx-autobuild docs/ docs/_build/html --open-browser --watch $(GIT_ROOT)/llama_index/ diff --git a/llama-index-integrations/readers/llama-index-readers-feishu-wiki/README.md b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/README.md new file mode 100644 index 0000000000000..1f1b384ba6847 --- /dev/null +++ b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/README.md @@ -0,0 +1,22 @@ +# Feishu Wiki Loader + +This loader can traverse all feishu documents under the feishu space. + +## Usage + +To use this loader, you need to: + +1. apply the permission(`wiki:wiki:readonly`) of the feishu app +2. add the feishu app as the admin of your feishu space, see [here](https://open.feishu.cn/document/server-docs/docs/wiki-v2/wiki-qa#b5da330b) for more help +3. finally, pass your feishu space id to this loader + +```python +app_id = "xxx" +app_secret = "xxx" +space_id = "xxx" +from llama_index.readers.feishu_wiki import FeishuWikiReader +loader = FeishuWikiReader(app_id, app_secret) +documents = loader.load_data(space_id=space_id) +``` + +This loader is designed to be used as a way to load data into [LlamaIndex](https://github.com/run-llama/llama_index/tree/main/llama_index) and/or subsequently used as a Tool in a [LangChain](https://github.com/hwchase17/langchain) Agent. See [here](https://github.com/emptycrown/llama-hub/tree/main) for examples. 
diff --git a/llama-index-integrations/readers/llama-index-readers-feishu-wiki/llama_index/readers/feishu_wiki/BUILD b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/llama_index/readers/feishu_wiki/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/llama_index/readers/feishu_wiki/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-index-integrations/readers/llama-index-readers-feishu-wiki/llama_index/readers/feishu_wiki/__init__.py b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/llama_index/readers/feishu_wiki/__init__.py new file mode 100644 index 0000000000000..3a4f56d259dcc --- /dev/null +++ b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/llama_index/readers/feishu_wiki/__init__.py @@ -0,0 +1,3 @@ +from llama_index.readers.feishu_wiki.base import FeishuWikiReader + +__all__ = ["FeishuWikiReader"] diff --git a/llama-index-integrations/readers/llama-index-readers-feishu-wiki/llama_index/readers/feishu_wiki/base.py b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/llama_index/readers/feishu_wiki/base.py new file mode 100644 index 0000000000000..e4f6e003c87db --- /dev/null +++ b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/llama_index/readers/feishu_wiki/base.py @@ -0,0 +1,150 @@ +"""Feishu wiki reader.""" +import json +import os +import time +from typing import List + +import requests +from llama_index.core.readers.base import BaseReader +from llama_index.core.schema import Document + +# Copyright (2023) Bytedance Ltd. and/or its affiliates +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

from typing import Optional


class FeishuWikiReader(BaseReader):
    """Feishu Wiki reader.

    Walks the node tree of a Feishu wiki space and loads the raw text of the
    documents it finds.

    The class attributes hold the API host and URL path templates. ``host``
    can be overridden per instance with :meth:`set_lark_domain`.
    """

    host = "https://open.feishu.cn"
    wiki_nodes_url_path = "/open-apis/wiki/v2/spaces/{}/nodes"
    documents_raw_content_url_path = "/open-apis/docx/v1/documents/{}/raw_content"
    tenant_access_token_internal_url_path = (
        "/open-apis/auth/v3/tenant_access_token/internal"
    )

    def __init__(self, app_id: str, app_secret: str) -> None:
        """Create a reader bound to one Feishu application.

        Args:
            app_id: The unique identifier of the application, obtained after
                the application is created.
            app_secret: Application key, obtained after creating the
                application.
        """
        super().__init__()
        self.app_id = app_id
        self.app_secret = app_secret

        # Token state is filled in lazily by `_update_tenant_access_token`
        # the first time an authenticated request is made.
        self.tenant_access_token = ""
        self.expire = 0

    def load_data(
        self, space_id: str, parent_node_token: Optional[str] = None
    ) -> List[Document]:
        """Load the documents found under a wiki space.

        Args:
            space_id (str): a space id.
            parent_node_token (Optional[str]): a parent node token of the
                space; when given, only nodes below it are traversed.

        Returns:
            One ``Document`` per distinct document id whose content could be
            fetched. The id is passed along as ``extra_info["document_id"]``.

        Raises:
            ValueError: if ``space_id`` is None.
        """
        if space_id is None:
            raise ValueError('Must specify a "space_id" in `load_kwargs`.')

        document_ids = self._load_space(space_id, parent_node_token=parent_node_token)
        # De-duplicate while keeping first-seen order, so the output order is
        # deterministic (a plain `set` would shuffle it between runs).
        document_ids = list(dict.fromkeys(document_ids))

        results = []
        for document_id in document_ids:
            doc = self._load_doc(document_id)
            if doc is None:
                # `_load_doc` returns None when the content could not be
                # fetched; skip it instead of building a Document with no text.
                continue
            results.append(Document(text=doc, extra_info={"document_id": document_id}))
        return results

    def _auth_headers(self) -> dict:
        """Return request headers, refreshing the tenant token if it is missing or expired."""
        if self.tenant_access_token == "" or self.expire < time.time():
            self._update_tenant_access_token()
        return {
            "Authorization": f"Bearer {self.tenant_access_token}",
            "Content-Type": "application/json; charset=utf-8",
        }

    def _load_space(
        self, space_id: str, parent_node_token: Optional[str] = None
    ) -> List[str]:
        """Collect the ``obj_token`` of every node below a space or parent node.

        Child nodes (``has_child``) are traversed recursively.

        Args:
            space_id: the wiki space id.
            parent_node_token: when given, list the children of this node
                instead of the top level of the space.

        Returns:
            The collected ``obj_token`` values, parents before their children.
            Empty when the first request fails or the response has no ``data``.
        """
        url = self.host + self.wiki_nodes_url_path.format(space_id)
        params = {}
        if parent_node_token:
            params["parent_node_token"] = parent_node_token

        obj_token_list: List[str] = []
        while True:
            # Resolved outside the try block so that a failing token refresh
            # still propagates to the caller instead of being swallowed.
            headers = self._auth_headers()
            try:
                response = requests.get(url, headers=headers, params=params)
                result = response.json()
            except Exception:
                # Best effort: on a transport or decode failure, stop and
                # return whatever has been collected so far.
                break
            data = result.get("data")
            if not data:
                break

            for item in data.get("items") or []:
                obj_token_list.append(item["obj_token"])
                if item["has_child"]:
                    obj_token_list.extend(
                        self._load_space(
                            space_id=space_id, parent_node_token=item["node_token"]
                        )
                    )

            # The listing is paginated (`has_more` / `page_token`, per the
            # Feishu API reference); follow it so results past the first
            # page are not dropped.
            next_page_token = data.get("page_token")
            if not data.get("has_more") or not next_page_token:
                break
            params["page_token"] = next_page_token
        return obj_token_list

    def _load_doc(self, document_id: str) -> Optional[str]:
        """Load a document from Feishu Docs.

        Args:
            document_id: the document id.

        Returns:
            The document text, or None when the request fails or the response
            carries no ``data``.
        """
        url = self.host + self.documents_raw_content_url_path.format(document_id)
        headers = self._auth_headers()
        try:
            response = requests.get(url, headers=headers)
            result = response.json()
        except Exception:
            # Best effort: a single unreadable document must not abort the load.
            return None
        if not result.get("data"):
            return None
        return result["data"]["content"]

    def _update_tenant_access_token(self) -> None:
        """Fetch a new tenant access token and record when it expires."""
        url = self.host + self.tenant_access_token_internal_url_path
        headers = {"Content-Type": "application/json; charset=utf-8"}
        data = {"app_id": self.app_id, "app_secret": self.app_secret}
        response = requests.post(url, data=json.dumps(data), headers=headers)
        payload = response.json()  # parse the body once, reuse for both fields
        self.tenant_access_token = payload["tenant_access_token"]
        # "expire" is added to the current time, i.e. treated as a
        # lifetime in seconds.
        self.expire = time.time() + payload["expire"]

    def set_lark_domain(self, host: str) -> None:
        """Set lark domain (overrides the API host for this instance)."""
        self.host = host


if __name__ == "__main__":
    app_id = os.environ.get("FEISHU_APP_ID")
    app_secret = os.environ.get("FEISHU_APP_SECRET")
    reader = FeishuWikiReader(app_id, app_secret)
    print(
        reader.load_data(
            space_id=os.environ.get("FEISHU_SPACE_ID"),
            parent_node_token=os.environ.get("FEISHU_PARENT_NODE_TOKEN"),
        )
    )
false +import_path = "llama_index.readers.feishu_wiki" + +[tool.llamahub.class_authors] +FeishuWikiReader = "zhourunlai" + +[tool.mypy] +disallow_untyped_defs = true +exclude = ["_static", "build", "examples", "notebooks", "venv"] +ignore_missing_imports = true +python_version = "3.8" + +[tool.poetry] +authors = ["Your Name "] +description = "llama-index readers feishu_wiki integration" +exclude = ["**/BUILD"] +license = "MIT" +maintainers = ["zhourunlai"] +name = "llama-index-readers-feishu-wiki" +readme = "README.md" +version = "0.1.0" + +[tool.poetry.dependencies] +python = ">=3.8.1,<4.0" +llama-index-core = "^0.10.1" +requests = "^2.31.0" + +[tool.poetry.group.dev.dependencies] +ipython = "8.10.0" +jupyter = "^1.0.0" +mypy = "0.991" +pre-commit = "3.2.0" +pylint = "2.15.10" +pytest = "7.2.1" +pytest-mock = "3.11.1" +ruff = "0.0.292" +tree-sitter-languages = "^1.8.0" +types-Deprecated = ">=0.1.0" +types-PyYAML = "^6.0.12.12" +types-protobuf = "^4.24.0.4" +types-redis = "4.5.5.0" +types-requests = "2.28.11.8" +types-setuptools = "67.1.0.0" + +[tool.poetry.group.dev.dependencies.black] +extras = ["jupyter"] +version = "<=23.9.1,>=23.7.0" + +[tool.poetry.group.dev.dependencies.codespell] +extras = ["toml"] +version = ">=v2.2.6" + +[[tool.poetry.packages]] +include = "llama_index/" diff --git a/llama-index-integrations/readers/llama-index-readers-feishu-wiki/tests/BUILD b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/tests/BUILD new file mode 100644 index 0000000000000..dabf212d7e716 --- /dev/null +++ b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/tests/BUILD @@ -0,0 +1 @@ +python_tests() diff --git a/llama-index-integrations/readers/llama-index-readers-feishu-wiki/tests/__init__.py b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/tests/__init__.py new file mode 100644 index 0000000000000..e69de29bb2d1d diff --git 
a/llama-index-integrations/readers/llama-index-readers-feishu-wiki/tests/test_readers_feishu_wiki.py b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/tests/test_readers_feishu_wiki.py new file mode 100644 index 0000000000000..2fef634282e38 --- /dev/null +++ b/llama-index-integrations/readers/llama-index-readers-feishu-wiki/tests/test_readers_feishu_wiki.py @@ -0,0 +1,7 @@ +from llama_index.core.readers.base import BaseReader +from llama_index.readers.feishu_wiki import FeishuWikiReader + + +def test_class(): + names_of_base_classes = [b.__name__ for b in FeishuWikiReader.__mro__] + assert BaseReader.__name__ in names_of_base_classes diff --git a/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/image_deplot/README.md b/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/image_deplot/README.md index 05ba4fe82d25e..c4869ab48d24e 100644 --- a/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/image_deplot/README.md +++ b/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/image_deplot/README.md @@ -1,5 +1,9 @@ # Image Tabular Chart Loader (Deplot) +```bash +pip install llama-index-readers-file +``` + This loader captions an image file containing a tabular chart (bar chart, line charts) using deplot. ## Usage @@ -8,7 +12,7 @@ To use this loader, you need to pass in a `Path` to a local file. 
```python from pathlib import Path -from llama_hub.file.image_deplot import ImageTabularChartReader +from llama_index.readers.file import ImageTabularChartReader loader = ImageTabularChartReader() documents = loader.load_data(file=Path("./image.png")) diff --git a/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/paged_csv/README.md b/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/paged_csv/README.md index e46a6d4c9a1d8..a5a0eae2e09e7 100644 --- a/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/paged_csv/README.md +++ b/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/paged_csv/README.md @@ -1,5 +1,9 @@ # Paged CSV Loader +```bash +pip install llama-index-readers-file +``` + This loader extracts the text from a local .csv file by formatting each row in an LLM-friendly way and inserting it into a separate Document. A single local file is passed in each time you call `load_data`. For example, a Document might look like: ``` @@ -15,9 +19,8 @@ To use this loader, you need to pass in a `Path` to a local file. 
```python from pathlib import Path -from llama_index.core.readers import download_loader -PagedCSVReader = download_loader("PagedCSVReader") +from llama_index.readers.file import PagedCSVReader loader = PagedCSVReader(encoding="utf-8") documents = loader.load_data(file=Path("./transactions.csv")) diff --git a/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/pymu_pdf/README.md b/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/pymu_pdf/README.md index 9abd1e99e3d66..cfde1701d6e3a 100644 --- a/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/pymu_pdf/README.md +++ b/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/pymu_pdf/README.md @@ -1,6 +1,10 @@ # PyMuPDF Loader -This loader extracts text from a local PDF file using the `PyMuPDF` Python library. This is the fastest among all other PDF parsing options available in `llama_hub`. If `metadata` is passed as True while calling `load` function; extracted documents will include basic metadata such as page numbers, file path and total number of pages in pdf. +```bash +pip install llama-index-readers-file +``` + +This loader extracts text from a local PDF file using the `PyMuPDF` Python library. If `metadata` is passed as True while calling `load` function; extracted documents will include basic metadata such as page numbers, file path and total number of pages in pdf. 
## Usage @@ -8,9 +12,8 @@ To use this loader, you need to pass file path of the local file as string or `P ```python from pathlib import Path -from llama_index import download_loader -PyMuPDFReader = download_loader("PyMuPDFReader") +from llama_index.readers.file import PyMuPDFReader loader = PyMuPDFReader() documents = loader.load_data(file_path=Path("./article.pdf"), metadata=True) diff --git a/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/tabular/base.py b/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/tabular/base.py index 9b1bc097b1ac8..02008b258f816 100644 --- a/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/tabular/base.py +++ b/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/tabular/base.py @@ -46,10 +46,15 @@ def load_data( csv_reader = csv.reader(fp) for row in csv_reader: text_list.append(", ".join(row)) + + metadata = {"filename": file.name, "extension": file.suffix} + if extra_info: + metadata = {**metadata, **extra_info} + if self._concat_rows: - return [Document(text="\n".join(text_list), metadata=extra_info)] + return [Document(text="\n".join(text_list), metadata=metadata)] else: - return [Document(text=text, metadata=extra_info) for text in text_list] + return [Document(text=text, metadata=metadata) for text in text_list] class PandasCSVReader(BaseReader): diff --git a/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/unstructured/README.md b/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/unstructured/README.md index 5a59f69ab6a87..a08ad57e71009 100644 --- a/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/unstructured/README.md +++ b/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/unstructured/README.md @@ -1,5 +1,9 @@ # Unstructured.io File Loader +```bash +pip install 
llama-index-readers-file +``` + This loader extracts the text from a variety of unstructured text files using [Unstructured.io](https://github.com/Unstructured-IO/unstructured). Currently, the file extensions that are supported are `.txt`, `.docx`, `.pptx`, `.jpg`, `.png`, `.eml`, `.html`, and `.pdf` documents. A single local file is passed in each time you call `load_data`. Check out their documentation to see more details, but notably, this enables you to parse the unstructured data of many use-cases. For example, you can download the 10-K SEC filings of public companies (e.g. [Coinbase](https://www.sec.gov/ix?doc=/Archives/edgar/data/0001679788/000167978822000031/coin-20211231.htm)), and feed it directly into this loader without worrying about cleaning up the formatting or HTML tags. @@ -10,7 +14,7 @@ To use this loader, you need to pass in a `Path` to a local file. Optionally, yo ```python from pathlib import Path -from llama_hub.file.unstructured import UnstructuredReader +from llama_index.readers.file import UnstructuredReader loader = UnstructuredReader() documents = loader.load_data(file=Path("./10k_filing.html")) @@ -20,10 +24,9 @@ You can also easily use this loader in conjunction with `SimpleDirectoryReader` ```python from pathlib import Path -from llama_index import download_loader -from llama_index import SimpleDirectoryReader +from llama_index.core import SimpleDirectoryReader -UnstructuredReader = download_loader("UnstructuredReader") +from llama_index.readers.file import UnstructuredReader dir_reader = SimpleDirectoryReader( "./data", diff --git a/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/xml/README.md b/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/xml/README.md index c7860ddc0e0ee..1fa813908046d 100644 --- a/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/xml/README.md +++ 
b/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/xml/README.md @@ -1,5 +1,9 @@ # XML Loader +```bash +pip install llama-index-readers-file +``` + This loader extracts the text from a local XML file. A single local file is passed in each time you call `load_data`. ## Usage @@ -8,12 +12,11 @@ To use this loader, you need to pass in a `Path` to a local file. ```python from pathlib import Path -from llama_index import download_loader -XMLReader = download_loader("XMLReader") +from llama_index.readers.file import XMLReader loader = XMLReader() documents = loader.load_data(file=Path("../example.xml")) ``` -This loader is designed to be used as a way to load data into [LlamaIndex](https://github.com/run-llama/llama_index/tree/main/llama_index) and/or subsequently used as a Tool in a [LangChain](https://github.com/hwchase17/langchain) Agent. See [here](https://github.com/run-llama/llama-hub/tree/main/llama_hub) for examples. +This loader is designed to be used as a way to load data into [LlamaIndex](https://github.com/run-llama/llama_index/tree/main/llama_index) and/or subsequently used as a Tool in a [LangChain](https://github.com/hwchase17/langchain) Agent. 
diff --git a/llama-index-integrations/readers/llama-index-readers-file/pyproject.toml b/llama-index-integrations/readers/llama-index-readers-file/pyproject.toml index d1ad309d6cb52..ea3cca17bf187 100644 --- a/llama-index-integrations/readers/llama-index-readers-file/pyproject.toml +++ b/llama-index-integrations/readers/llama-index-readers-file/pyproject.toml @@ -49,7 +49,7 @@ license = "MIT" maintainers = ["FarisHijazi", "Haowjy", "ephe-meral", "hursh-desai", "iamarunbrahma", "jon-chuang", "mmaatouk", "ravi03071991", "sangwongenip", "thejessezhang"] name = "llama-index-readers-file" readme = "README.md" -version = "0.1.6" +version = "0.1.7" [tool.poetry.dependencies] python = ">=3.8.1,<4.0" diff --git a/llama-index-integrations/readers/llama-index-readers-firebase-realtimedb/README.md b/llama-index-integrations/readers/llama-index-readers-firebase-realtimedb/README.md index ad5ea2f6e4e40..0894b91d8a622 100644 --- a/llama-index-integrations/readers/llama-index-readers-firebase-realtimedb/README.md +++ b/llama-index-integrations/readers/llama-index-readers-firebase-realtimedb/README.md @@ -1,5 +1,9 @@ # Firebase Realtime Database Loader +```bash +pip install llama-index-readers-firebase-realtimedb +``` + This loader retrieves documents from Firebase Realtime Database. The user specifies the Firebase Realtime Database URL and, optionally, the path to a service account key file for authentication. ## Usage @@ -7,10 +11,8 @@ This loader retrieves documents from Firebase Realtime Database. The user specif Here's an example usage of the FirebaseRealtimeDatabaseReader. 
```python -from llama_index import download_loader - -FirebaseRealtimeDatabaseReader = download_loader( - "FirebaseRealtimeDatabaseReader" +from llama_index.readers.firebase_realtimedb import ( + FirebaseRealtimeDatabaseReader, ) database_url = "" @@ -20,4 +22,4 @@ reader = FirebaseRealtimeDatabaseReader(database_url, service_account_key_path) documents = reader.load_data(path) ``` -This loader is designed to be used as a way to load data into [LlamaIndex](https://github.com/run-llama/llama_index/tree/main/llama_index) and/or subsequently used as a Tool in a [LangChain](https://github.com/hwchase17/langchain) Agent. See [here](https://github.com/emptycrown/llama-hub/tree/main) for examples. +This loader is designed to be used as a way to load data into [LlamaIndex](https://github.com/run-llama/llama_index/tree/main/llama_index) and/or subsequently used as a Tool in a [LangChain](https://github.com/hwchase17/langchain) Agent. diff --git a/llama-index-integrations/readers/llama-index-readers-firestore/README.md b/llama-index-integrations/readers/llama-index-readers-firestore/README.md index fb3d9b3329018..05cad520aeaee 100644 --- a/llama-index-integrations/readers/llama-index-readers-firestore/README.md +++ b/llama-index-integrations/readers/llama-index-readers-firestore/README.md @@ -1,5 +1,9 @@ # Firestore Loader +```bash +pip install llama-index-readers-firestore +``` + This loader loads from a Firestore collection or a specific document from Firestore. The loader assumes your project already has the google cloud credentials loaded. To find out how to set up credentials, [see here](https://cloud.google.com/docs/authentication/provide-credentials-adc). ## Usage @@ -9,9 +13,8 @@ To initialize the loader, provide the project-id of the google cloud project. 
## Initializing the reader ```python -from llama_index import download_loader +from llama_index.readers.firestore import FirestoreReader -FirestoreReader = download_loader("FirestoreReader") reader = FirestoreReader(project_id="") ``` diff --git a/llama-index-integrations/readers/llama-index-readers-genius/README.md b/llama-index-integrations/readers/llama-index-readers-genius/README.md index cce1ff910532e..5ebf06cc78645 100644 --- a/llama-index-integrations/readers/llama-index-readers-genius/README.md +++ b/llama-index-integrations/readers/llama-index-readers-genius/README.md @@ -1,5 +1,9 @@ # LlamaIndex Readers Integration: Genius +```bash +pip install llama-index-readers-genius +``` + This loader connects to the Genius API and loads lyrics, metadata, and album art into `Documents`. As a prerequisite, you will need to register with [Genius API](https://genius.com/api-clients) and create an app in order to get a `client_id` and a `client_secret`. You should then set a `redirect_uri` for the app. The `redirect_uri` does not need to be functional. You should then generate an access token as an instantiator for the GeniusReader. @@ -60,9 +64,7 @@ Here's an example usage of the GeniusReader. It will retrieve songs that match s - **Returns**: List of `Document` objects with song lyrics. 
```python -from llama_index.core.readers import download_loader - -GeniusReader = download_loader("GeniusReader") +from llama_index.readers.genius import GeniusReader access_token = "your_generated_access_token" @@ -79,7 +81,7 @@ This loader is designed to be used as a way to load data into [LlamaIndex](https ```python from llama_index.core import VectorStoreIndex, download_loader -GeniusReader = download_loader("GeniusReader") +from llama_index.readers.genius import GeniusReader access_token = "your_generated_access_token" diff --git a/llama-index-integrations/readers/llama-index-readers-gpt-repo/README.md b/llama-index-integrations/readers/llama-index-readers-gpt-repo/README.md index 286383911b739..2609090e89be8 100644 --- a/llama-index-integrations/readers/llama-index-readers-gpt-repo/README.md +++ b/llama-index-integrations/readers/llama-index-readers-gpt-repo/README.md @@ -1,5 +1,9 @@ # GPT Repository Loader +```bash +pip install llama-index-readers-gpt-repo +``` + This loader is an adaptation of https://github.com/mpoon/gpt-repository-loader to LlamaHub. Full credit goes to mpoon for coming up with this! @@ -8,9 +12,7 @@ to LlamaHub. Full credit goes to mpoon for coming up with this! 
To use this loader, you need to pass in a path to a local Git repository ```python -from llama_index import download_loader - -GPTRepoReader = download_loader("GPTRepoReader") +from llama_index.readers.gpt_repo import GPTRepoReader loader = GPTRepoReader() documents = loader.load_data( diff --git a/llama-index-integrations/readers/llama-index-readers-graphdb-cypher/README.md b/llama-index-integrations/readers/llama-index-readers-graphdb-cypher/README.md index e39cf1bfcf9b4..ee59f64a200d3 100644 --- a/llama-index-integrations/readers/llama-index-readers-graphdb-cypher/README.md +++ b/llama-index-integrations/readers/llama-index-readers-graphdb-cypher/README.md @@ -1,5 +1,9 @@ # Graph Database Cypher Loader +```bash +pip install llama-index-readers-graphdb-cypher +``` + This loader populates documents from results of Cypher queries from a Graph database endpoint. The user specifies a GraphDB endpoint URL with optional credentials to initialize the reader. By declaring the Cypher query and optional parameters the loader can fetch the nested result docs. @@ -14,10 +18,9 @@ Here's an example usage of the `GraphDBCypherReader`. 
You can test out queries directly with the Neo4j labs demo server: demo.neo4jlabs.com or with a free instance https://neo4j.com/aura ```python -from llama_index import download_loader import os -GraphDBCypherReader = download_loader("GraphDBCypherReader") +from llama_index.readers.graphdb_cypher import GraphDBCypherReader uri = "neo4j+s://demo.neo4jlabs.com" username = "stackoverflow" diff --git a/llama-index-integrations/readers/llama-index-readers-graphql/README.md b/llama-index-integrations/readers/llama-index-readers-graphql/README.md index 4d779719226a0..adc08fb338d64 100644 --- a/llama-index-integrations/readers/llama-index-readers-graphql/README.md +++ b/llama-index-integrations/readers/llama-index-readers-graphql/README.md @@ -1,5 +1,9 @@ # GraphQL Loader +```bash +pip install llama-index-readers-graphql +``` + This loader loads documents via GraphQL queries from a GraphQL endpoint. The user specifies a GraphQL endpoint URL with optional credentials to initialize the reader. By declaring the GraphQL query and optional variables (parameters) the loader can fetch the nested result docs. @@ -10,10 +14,9 @@ Here's an example usage of the GraphQLReader. You can test out queries directly [on the site](https://countries.trevorblades.com/) ```python -from llama_index import download_loader import os -GraphQLReader = download_loader("GraphQLReader") +from llama_index.readers.graphql import GraphQLReader uri = "https://countries.trevorblades.com/" headers = {} diff --git a/llama-index-integrations/readers/llama-index-readers-guru/README.md b/llama-index-integrations/readers/llama-index-readers-guru/README.md index 147a5ef9e6911..d580cc60322fa 100644 --- a/llama-index-integrations/readers/llama-index-readers-guru/README.md +++ b/llama-index-integrations/readers/llama-index-readers-guru/README.md @@ -1,5 +1,9 @@ # Guru Loader +```bash +pip install llama-index-readers-guru +``` + This loader loads documents from [Guru](https://www.getguru.com/). 
The user specifies a username and api key to initialize the GuruReader. Note this is not your password. You need to create a new api key in the admin tab of the portal. @@ -9,9 +13,7 @@ Note this is not your password. You need to create a new api key in the admin ta Here's an example usage of the GuruReader. ```python -from llama_index import download_loader - -GuruReader = download_loader("GuruReader") +from llama_index.readers.guru import GuruReader reader = GuruReader(username="", api_key="") diff --git a/llama-index-integrations/readers/llama-index-readers-hatena-blog/README.md b/llama-index-integrations/readers/llama-index-readers-hatena-blog/README.md index 777749cb6004c..ef17a2892f64c 100644 --- a/llama-index-integrations/readers/llama-index-readers-hatena-blog/README.md +++ b/llama-index-integrations/readers/llama-index-readers-hatena-blog/README.md @@ -1,5 +1,9 @@ # Hatena Blog Loader +```bash +pip install llama-index-readers-hatena-blog +``` + This loader fetches article from your own [Hatena Blog](https://hatenablog.com/) blog posts using the AtomPub API. You can get AtomPub info from the admin page after logging into Hatena Blog. @@ -9,10 +13,9 @@ You can get AtomPub info from the admin page after logging into Hatena Blog. Here's an example usage of the HatenaBlogReader. 
```python -from llama_index import download_loader import os -HatenaBlogReader = download_loader("HatenaBlogReader") +from llama_index.readers.hatena_blog import HatenaBlogReader root_endpoint = os.getenv("ATOM_PUB_ROOT_ENDPOINT") api_key = os.getenv("ATOM_PUB_API_KEY") diff --git a/llama-index-integrations/readers/llama-index-readers-hive/README.md b/llama-index-integrations/readers/llama-index-readers-hive/README.md index 39e721c1c02d7..dd9be6afe87d5 100644 --- a/llama-index-integrations/readers/llama-index-readers-hive/README.md +++ b/llama-index-integrations/readers/llama-index-readers-hive/README.md @@ -1,5 +1,9 @@ # Hive Loader +```bash +pip install llama-index-readers-hive +``` + The Hive Loader returns a set of texts corresponding to documents from Hive based on the customized query. The user initializes the loader with Hive connection args and then using query to fetch data from Hive. @@ -8,9 +12,7 @@ The user initializes the loader with Hive connection args and then using query t Here's an example usage of the hiveReader to load 100 documents. ```python -from llama_index import download_loader - -HiveReader = download_loader("HiveReader") +from llama_index.readers.hive import HiveReader reader = HiveReader( host="localhost", @@ -24,4 +26,4 @@ query = "SELECT * FROM p1 LIMIT 100" documents = reader.load_data(query=query) ``` -This loader is designed to be used as a way to load data into [LlamaIndex](https://github.com/run-llama/llama_index/tree/main/llama_index) and/or subsequently used as a Tool in a [LangChain](https://github.com/hwchase17/langchain) Agent. See [here](https://github.com/run-llama/llama-hub/tree/main/llama_hub) for examples. +This loader is designed to be used as a way to load data into [LlamaIndex](https://github.com/run-llama/llama_index/tree/main/llama_index) and/or subsequently used as a Tool in a [LangChain](https://github.com/hwchase17/langchain) Agent. 
diff --git a/llama-index-integrations/readers/llama-index-readers-hubspot/README.md b/llama-index-integrations/readers/llama-index-readers-hubspot/README.md index d7682e2437a9b..0660c3369fc8d 100644 --- a/llama-index-integrations/readers/llama-index-readers-hubspot/README.md +++ b/llama-index-integrations/readers/llama-index-readers-hubspot/README.md @@ -1,5 +1,9 @@ # Hubspot Loader +```bash +pip install llama-index-readers-hubspot +``` + This loader loads documents from Hubspot. The user specifies an access token to initialize the HubspotReader. At the moment, this loader only supports access token authentication. To obtain an access token, you will need to create a private app by following instructions [here](https://developers.hubspot.com/docs/api/private-apps). @@ -9,10 +13,9 @@ At the moment, this loader only supports access token authentication. To obtain Here's an example usage of the HubspotReader. ```python -from llama_index import download_loader import os -HubspotReader = download_loader("HubspotReader") +from llama_index.readers.hubspot import HubspotReader reader = HubspotReader("") documents = reader.load_data() diff --git a/llama-index-integrations/readers/llama-index-readers-huggingface-fs/README.md b/llama-index-integrations/readers/llama-index-readers-huggingface-fs/README.md index bcfc874039b24..ebc6ece29e457 100644 --- a/llama-index-integrations/readers/llama-index-readers-huggingface-fs/README.md +++ b/llama-index-integrations/readers/llama-index-readers-huggingface-fs/README.md @@ -1,5 +1,9 @@ # Hugging Face FS Loader +```bash +pip install llama-index-readers-huggingface-fs +``` + This loader uses Hugging Face Hub's Filesystem API (> 0.14) to load datasets. @@ -12,9 +16,8 @@ To use this loader, you need to pass in a path to a Hugging Face dataset. 
```python from pathlib import Path -from llama_index import download_loader -HuggingFaceFSReader = download_loader("HuggingFaceFSReader") +from llama_index.readers.huggingface_fs import HuggingFaceFSReader # load documents loader = HuggingFaceFSReader() diff --git a/llama-index-integrations/readers/llama-index-readers-hwp/README.md b/llama-index-integrations/readers/llama-index-readers-hwp/README.md index 0f45d30d0103b..a330901c19d5e 100644 --- a/llama-index-integrations/readers/llama-index-readers-hwp/README.md +++ b/llama-index-integrations/readers/llama-index-readers-hwp/README.md @@ -1,5 +1,9 @@ # HWP Loader +```bash +pip install llama-index-readers-file +``` + This loader reads the HWP file, which is the format of many official documents in South Korea. ## Usage @@ -7,7 +11,7 @@ This loader reads the HWP file, which is the format of many official documents i To use this loader, you need to pass in a file name. It's fine whether the file is compressed or not. ```python -from llama_hub.hangeul import HWPReader +from llama_index.readers.file import HWPReader from pathlib import Path hwp_path = Path("/path/to/hwp") diff --git a/llama-index-integrations/readers/llama-index-readers-imdb-review/README.md b/llama-index-integrations/readers/llama-index-readers-imdb-review/README.md index 844e67ced77db..20d8daf2668a4 100644 --- a/llama-index-integrations/readers/llama-index-readers-imdb-review/README.md +++ b/llama-index-integrations/readers/llama-index-readers-imdb-review/README.md @@ -1,5 +1,9 @@ ## IMDB MOVIE REVIEWS LOADER +```bash +pip install llama-index-readers-imdb-review +``` + This loader fetches all the reviews of a movie or a TV-series from IMDB official site. This loader is working on Windows machine and it requires further debug on Linux. 
Fixes are on the way Install the required dependencies @@ -18,9 +22,7 @@ The IMDB downloader takes in two attributes ## Usage ```python -from llama_index import download_loader - -IMDBReviewsloader = download_loader("IMDBReviews") +from llama_index.readers.imdb_review import IMDBReviews loader = IMDBReviews( movie_name_year="The Social Network 2010", webdriver_engine="edge" @@ -47,10 +49,10 @@ This loader can be used with both Langchain and LlamaIndex. ### LlamaIndex ```python -from llama_index import VectorStoreIndex, download_loader -from llama_index import VectorStoreIndex +from llama_index.core import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex -IMDBReviewsloader = download_loader("IMDBReviews") +from llama_index.readers.imdb_review import IMDBReviews as IMDBReviewsloader loader = IMDBReviewsloader( movie_name_year="The Social Network 2010", @@ -72,7 +74,6 @@ print(response) ### Langchain ```python -from llama_index import download_loader from langchain.llms import OpenAI from langchain.agents.agent_toolkits.pandas import ( create_pandas_dataframe_agent, @@ -81,7 +82,7 @@ from langchain.agents import Tool from langchain.agents import initialize_agent from langchain.chat_models import ChatOpenAI -IMDBReviewsloader = download_loader("IMDBReviews") +from llama_index.readers.imdb_review import IMDBReviews as IMDBReviewsloader loader = IMDBReviewsloader( movie_name_year="The Social Network 2010", diff --git a/llama-index-integrations/readers/llama-index-readers-intercom/README.md b/llama-index-integrations/readers/llama-index-readers-intercom/README.md index 7c6c7163198a9..f15265703a64e 100644 --- a/llama-index-integrations/readers/llama-index-readers-intercom/README.md +++ b/llama-index-integrations/readers/llama-index-readers-intercom/README.md @@ -1,5 +1,9 @@ # Intercom Loader +```bash +pip install llama-index-readers-intercom +``` + This loader fetches the text from Intercom help articles using the Intercom API.
It also uses the BeautifulSoup library to parse the HTML and extract the text from the articles. ## Usage @@ -7,9 +11,7 @@ This loader fetches the text from Intercom help articles using the Intercom API. To use this loader, you need to pass in an Intercom account access token. ```python -from llama_index import download_loader - -IntercomReader = download_loader("IntercomReader") +from llama_index.readers.intercom import IntercomReader loader = IntercomReader(intercom_access_token="my_access_token") documents = loader.load_data() diff --git a/llama-index-integrations/readers/llama-index-readers-jira/README.md b/llama-index-integrations/readers/llama-index-readers-jira/README.md index a36d63872b7b6..2e76552ba9317 100644 --- a/llama-index-integrations/readers/llama-index-readers-jira/README.md +++ b/llama-index-integrations/readers/llama-index-readers-jira/README.md @@ -1,5 +1,9 @@ # JIRA Reader +```bash +pip install llama-index-readers-jira +``` + The Jira loader returns a set of issues based on the query provided to the dataloader. 
We can follow two methods to initialize the loader- 1- basic_auth -> this takes a dict with the following keys @@ -21,7 +25,7 @@ You can follow this link for more information regarding Oauth2 -> https://develo Here's an example of how to use it ```python -from llama_hub.jira import JiraReader +from llama_index.readers.jira import JiraReader reader = JiraReader( email=email, api_token=api_token, server_url="your-jira-server.com" @@ -32,9 +36,7 @@ documents = reader.load_data(query="project = ") Alternately, you can also use download_loader from llama_index ```python -from llama_index import download_loader - -JiraReader = download_loader("JiraReader") +from llama_index.readers.jira import JiraReader reader = JiraReader( email=email, api_token=api_token, server_url="your-jira-server.com" diff --git a/llama-index-integrations/readers/llama-index-readers-joplin/README.md b/llama-index-integrations/readers/llama-index-readers-joplin/README.md index bcd7afb5855cf..c8a14e07fd25b 100644 --- a/llama-index-integrations/readers/llama-index-readers-joplin/README.md +++ b/llama-index-integrations/readers/llama-index-readers-joplin/README.md @@ -1,5 +1,9 @@ # Joplin (Markdown) Loader +```bash +pip install llama-index-readers-joplin +``` + > [Joplin](https://joplinapp.org/) is an open source note-taking app. Capture your thoughts and securely access them from any device. This readme covers how to load documents from a `Joplin` database. @@ -20,10 +24,10 @@ An alternative to this approach is to export the `Joplin`'s note database to Mar Here's an example usage of the JoplinReader. 
```python -from llama_index import download_loader import os -JoplinReader = download_loader("JoplinReader") +from llama_index.readers.joplin import JoplinReader + documents = JoplinReader( access_token="" ).load_data() # Returns list of documents diff --git a/llama-index-integrations/readers/llama-index-readers-kaltura/README.md b/llama-index-integrations/readers/llama-index-readers-kaltura/README.md index 6aba072088d86..1d5fae146e88d 100644 --- a/llama-index-integrations/readers/llama-index-readers-kaltura/README.md +++ b/llama-index-integrations/readers/llama-index-readers-kaltura/README.md @@ -1,5 +1,9 @@ # Kaltura eSearch Loader +```bash +pip install llama-index-readers-kaltura-esearch +``` + This loader reads Kaltura Entries from [Kaltura](https://corp.kaltura.com) based on a Kaltura eSearch API call. Search queries can be passed as a pre-defined object of KalturaESearchEntryParams, or through a simple free text query. The result is a list of documents containing the Kaltura Entries and Captions json. 
@@ -64,9 +68,7 @@ Each dictionary in the response represents a Kaltura media entry, where the keys First, instantiate the KalturaReader (aka Kaltura Loader) with your Kaltura configuration credentials: ```python -from llama_index import download_loader - -KalturaESearchReader = download_loader("KalturaESearchReader") +from llama_index.readers.kaltura_esearch import KalturaESearchReader loader = KalturaESearchReader( partnerId="INSERT_YOUR_PARTNER_ID", diff --git a/llama-index-integrations/readers/llama-index-readers-kibela/README.md b/llama-index-integrations/readers/llama-index-readers-kibela/README.md index 97323863e872c..d4a39b1a455d4 100644 --- a/llama-index-integrations/readers/llama-index-readers-kibela/README.md +++ b/llama-index-integrations/readers/llama-index-readers-kibela/README.md @@ -1,5 +1,9 @@ # Kibela Reader +```bash +pip install llama-index-readers-kibela +``` + This reader fetches article from your [Kibela](https://kibe.la/) notes using the GraphQL API. # Usage @@ -8,7 +12,7 @@ Here's an example of how to use it. 
You can get your access token from [here](ht ```python import os -from llama_hub.kibela import KibelaReader +from llama_index.readers.kibela import KibelaReader team = os.environ["KIBELA_TEAM"] token = os.environ["KIBELA_TOKEN"] @@ -21,9 +25,8 @@ Alternately, you can also use download_loader from llama_index ```python import os -from llama_index import download_loader -KibelaReader = download_loader("KibelaReader") +from llama_index.readers.kibela import KibelaReader team = os.environ["KIBELA_TEAM"] token = os.environ["KIBELA_TOKEN"] diff --git a/llama-index-integrations/readers/llama-index-readers-lilac/README.md b/llama-index-integrations/readers/llama-index-readers-lilac/README.md index 0a396b701a2c7..210d23f6bbfce 100644 --- a/llama-index-integrations/readers/llama-index-readers-lilac/README.md +++ b/llama-index-integrations/readers/llama-index-readers-lilac/README.md @@ -1,5 +1,11 @@ # Lilac reader +```bash +pip install llama-index-readers-papers + +pip install llama-index-readers-lilac +``` + [Lilac](https://lilacml.com/) is an open-source product that helps you analyze, enrich, and clean unstructured data with AI. It can be used to analyze, clean, structure, and label data that can be used in downstream LlamaIndex and LangChain applications. @@ -17,11 +23,10 @@ You can use any LlamaIndex loader to load data into Lilac, clean data, and then See [this notebook](https://github.com/lilacai/lilac/blob/main/notebooks/LlamaIndexLoader.ipynb) for getting data into Lilac from LlamaHub. 
```python -from llama_index import download_loader import lilac as ll # See: https://llamahub.ai/l/papers-arxiv -ArxivReader = download_loader("ArxivReader") +from llama_index.readers.papers import ArxivReader loader = ArxivReader() documents = loader.load_data(search_query="au:Karpathy") @@ -49,9 +54,9 @@ ll.start_server(project_dir="./data") ### Lilac => LlamaIndex Documents ```python -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex, download_loader -LilacReader = download_loader("LilacReader") +from llama_index.readers.lilac import LilacReader loader = LilacReader() documents = loader.load_data( diff --git a/llama-index-integrations/readers/llama-index-readers-linear/README.md b/llama-index-integrations/readers/llama-index-readers-linear/README.md index 59e14cdc7184a..3c3a0f97ccafe 100644 --- a/llama-index-integrations/readers/llama-index-readers-linear/README.md +++ b/llama-index-integrations/readers/llama-index-readers-linear/README.md @@ -1,5 +1,9 @@ # Linear Reader +```bash +pip install llama-index-readers-linear +``` + The Linear loader returns issue based on the query. ## Usage @@ -7,7 +11,7 @@ The Linear loader returns issue based on the query. 
Here's an example of how to use it ```python -from llama_hub.linear import LinearReader +from llama_index.readers.linear import LinearReader reader = LinearReader(api_key=api_key) query = """ @@ -38,9 +42,7 @@ documents = reader.load_data(query=query) Alternately, you can also use download_loader from llama_index ```python -from llama_index import download_loader - -LinearReader = download_loader("LinearReader") +from llama_index.readers.linear import LinearReader reader = LinearReader(api_key=api_key) query = """ diff --git a/llama-index-integrations/readers/llama-index-readers-macrometa-gdn/README.md b/llama-index-integrations/readers/llama-index-readers-macrometa-gdn/README.md index e2fd8a41bef7b..a9fae3033bdcb 100644 --- a/llama-index-integrations/readers/llama-index-readers-macrometa-gdn/README.md +++ b/llama-index-integrations/readers/llama-index-readers-macrometa-gdn/README.md @@ -1,5 +1,9 @@ # Macrometa GDN Loader +```bash +pip install llama-index-readers-macrometa-gdn +``` + This loader takes in a Macrometa federation URL, API key, and collection name and returns a list of vectors. ## Usage @@ -7,9 +11,7 @@ This loader takes in a Macrometa federation URL, API key, and collection name an To use this loader, you need to pass the URL and API key through the class constructor, and then load the data using an array of collection names. 
```python -from llama_index import download_loader - -MacrometaGDNReader = download_loader("MacrometaGDNReader") +from llama_index.readers.macrometa_gdn import MacrometaGDNReader collections = ["test_collection"] loader = MacrometaGDNReader(url="https://api-macrometa.io", apikey="test") diff --git a/llama-index-integrations/readers/llama-index-readers-mangadex/README.md b/llama-index-integrations/readers/llama-index-readers-mangadex/README.md index 685c59af9f735..893aadd634106 100644 --- a/llama-index-integrations/readers/llama-index-readers-mangadex/README.md +++ b/llama-index-integrations/readers/llama-index-readers-mangadex/README.md @@ -1,13 +1,15 @@ # MangaDex Loader +```bash +pip install llama-index-readers-mangadex +``` + This loader fetches information from the MangaDex API, by manga title. ## Usage ```python -from llama_index import download_loader - -MangaDexReader = download_loader("MangaDexReader") +from llama_index.readers.mangadex import MangaDexReader loader = MangaDexReader() documents = loader.load_data( diff --git a/llama-index-integrations/readers/llama-index-readers-mangoapps-guides/README.md b/llama-index-integrations/readers/llama-index-readers-mangoapps-guides/README.md index 87e03688c8104..51f392bd8c660 100644 --- a/llama-index-integrations/readers/llama-index-readers-mangoapps-guides/README.md +++ b/llama-index-integrations/readers/llama-index-readers-mangoapps-guides/README.md @@ -1,5 +1,9 @@ # MangoppsGuides Loader +```bash +pip install llama-index-readers-mangoapps-guides +``` + This loader fetches the text from Mangopps Guides. ## Usage @@ -7,9 +11,7 @@ This loader fetches the text from Mangopps Guides. To use this loader, you need to pass base url of the MangoppsGuides installation (e.g. `https://guides.mangoapps.com/`) and the limit , i.e. 
max number of links it should crawl ```python -from llama_index import download_loader - -MangoppsGuidesReader = download_loader("MangoppsGuidesReader") +from llama_index.readers.mangoapps_guides import MangoppsGuidesReader loader = MangoppsGuidesReader() documents = loader.load_data( diff --git a/llama-index-integrations/readers/llama-index-readers-maps/README.md b/llama-index-integrations/readers/llama-index-readers-maps/README.md index 920dfdd45fd0c..47f318eb75077 100644 --- a/llama-index-integrations/readers/llama-index-readers-maps/README.md +++ b/llama-index-integrations/readers/llama-index-readers-maps/README.md @@ -1,5 +1,9 @@ # **_Osmmap Loader_** +```bash +pip install llama-index-readers-maps +``` + The Osmmap Loader will fetch map data from the [Overpass](https://wiki.openstreetmap.org/wiki/Main_Page) api for a certain place or area. Version **Overpass API 0.7.60** is used by this loader. The api will provide you with all the **nodes, relations, and ways** for the particular region when you request data for a region or location. 
@@ -27,9 +31,7 @@ She requires all the nodes, routes, and relations within a five-kilometer radius ### And the code snippet looks like ```python -from llama_index import download_loader - -MapReader = download_loader("OpenMap") +from llama_index.readers.maps import OpenMap as MapReader loader = MapReader() documents = loader.load_data( @@ -46,9 +48,7 @@ documents = loader.load_data( - so she search for hospital tag in the [Taginfo](https://taginfo.openstreetmap.org/tags) and she got ```python -from llama_index import download_loader - -MapReader = download_loader("OpenMap") +from llama_index.readers.maps import OpenMap as MapReader loader = MapReader() documents = loader.load_data( diff --git a/llama-index-integrations/readers/llama-index-readers-memos/README.md b/llama-index-integrations/readers/llama-index-readers-memos/README.md index 85dfd31c08430..849e4dd1fedcb 100644 --- a/llama-index-integrations/readers/llama-index-readers-memos/README.md +++ b/llama-index-integrations/readers/llama-index-readers-memos/README.md @@ -1,5 +1,9 @@ # Memos Loader +```bash +pip install llama-index-readers-memos +``` + This loader fetches text from self-hosted [memos](https://github.com/usememos/memos). ## Usage @@ -7,9 +11,8 @@ This loader fetches text from self-hosted [memos](https://github.com/usememos/me To use this loader, you need to specify the host where memos is deployed. If you need to filter, pass the [corresponding parameter](https://github.com/usememos/memos/blob/4fe8476169ecd2fc4b164a25611aae6861e36812/api/memo.go#L76) in `load_data`.
```python -from llama_index import download_loader +from llama_index.readers.memos import MemosReader -MemosReader = download_loader("MemosReader") loader = MemosReader("https://demo.usememos.com/") documents = loader.load_data({"creatorId": 101}) ``` diff --git a/llama-index-integrations/readers/llama-index-readers-microsoft-onedrive/README.md b/llama-index-integrations/readers/llama-index-readers-microsoft-onedrive/README.md index e2df15698bcaa..05a43f3de03d4 100644 --- a/llama-index-integrations/readers/llama-index-readers-microsoft-onedrive/README.md +++ b/llama-index-integrations/readers/llama-index-readers-microsoft-onedrive/README.md @@ -1,5 +1,9 @@ # Microsoft OneDrive Loader +```bash +pip install llama-index-readers-microsoft-onedrive +``` + This loader reads files from: - Microsoft OneDrive Personal [(https://onedrive.live.com/)](https://onedrive.live.com/) and @@ -61,9 +65,7 @@ For example, the file_id of `https://onedrive.live.com/?cid=0B5AF52BE769DFDE4&id #### OneDrive Personal Example Usage: ```python -from llama_index import download_loader - -OneDriveReader = download_loader("OneDriveReader") +from llama_index.readers.microsoft_onedrive import OneDriveReader # User Authentication flow: Replace client id with your own id loader = OneDriveReader(client_id="82ee706e-2439-47fa-877a-95048ead9318") @@ -108,9 +110,7 @@ For example, the path of file "demo_doc.docx" within test subfolder from previou #### OneDrive For Business Example Usage: ```python -from llama_index import download_loader - -OneDriveReader = download_loader("OneDriveReader") +from llama_index.readers.microsoft_onedrive import OneDriveReader loader = OneDriveReader( client_id="82ee706e-2439-47fa-877a-95048ead9318", diff --git a/llama-index-integrations/readers/llama-index-readers-microsoft-outlook/README.md b/llama-index-integrations/readers/llama-index-readers-microsoft-outlook/README.md index 3869c7a6cd386..c2f556fb67155 100644 --- 
a/llama-index-integrations/readers/llama-index-readers-microsoft-outlook/README.md +++ b/llama-index-integrations/readers/llama-index-readers-microsoft-outlook/README.md @@ -1,5 +1,9 @@ # Outlook Local Calendar Loader +```bash +pip install llama-index-readers-microsoft-outlook +``` + This loader reads your past and upcoming Calendar events from your local Outlook .ost or .pst and parses the relevant info into `Documents`. It runs on Windows only and has only been tested with Windows 11. It has been designed to have a supoerset of the functionality of the Google Calendar reader. @@ -11,9 +15,7 @@ Here's an example usage of the OutlookCalendar Reader. It will retrieve up to 10 It always returns Start, End, Subject, Location, and Organizer attributes and optionally returns additional attributes specified in the `more_attributes` parameter, which, if specified, must be a list of strings eg. ['Body','someotherattribute',...]. Attributes which don't exist in a calendar entry are ignored without warning. 
```python -from llama_index import download_loader - -OutlookCalendarReader = download_loader("OutlookLocalCalendarReader") +from llama_index.readers.microsoft_outlook import OutlookLocalCalendarReader as OutlookCalendarReader loader = OutlookCalendarReader() documents = loader.load_data() @@ -26,9 +28,9 @@ This loader is designed to be used as a way to load data into [LlamaIndex](https ### LlamaIndex ```python -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex, download_loader -OutlookCalendarReader = download_loader("OutlookLocalCalendarReader") +from llama_index.readers.microsoft_outlook import OutlookLocalCalendarReader as OutlookCalendarReader loader = OutlookCalendarReader( start_date="2022-01-01", number_of_documents=1000 diff --git a/llama-index-integrations/readers/llama-index-readers-microsoft-sharepoint/README.md b/llama-index-integrations/readers/llama-index-readers-microsoft-sharepoint/README.md index e382b0f013194..9ea404eae410f 100644 --- a/llama-index-integrations/readers/llama-index-readers-microsoft-sharepoint/README.md +++ b/llama-index-integrations/readers/llama-index-readers-microsoft-sharepoint/README.md @@ -1,5 +1,9 @@ # Microsoft SharePoint Reader +```bash +pip install llama-index-readers-microsoft-sharepoint +``` + The loader loads the files from a folder in sharepoint site. It also supports traversing recursively through the sub-folders.
@@ -27,9 +31,7 @@ If the files are present in the `Test` folder in SharePoint Site under `root` di ![FilePath](file_path_info.png) ```python -from llama_index import download_loader - -SharePointLoader = download_loader("SharePointReader") +from llama_index.readers.microsoft_sharepoint import SharePointReader as SharePointLoader loader = SharePointLoader( client_id="", diff --git a/llama-index-integrations/readers/llama-index-readers-minio/README.md b/llama-index-integrations/readers/llama-index-readers-minio/README.md index d0bb5d20dd2d1..6fa3d65e706ce 100644 --- a/llama-index-integrations/readers/llama-index-readers-minio/README.md +++ b/llama-index-integrations/readers/llama-index-readers-minio/README.md @@ -6,4 +6,4 @@ ## Import -`from llama_index.readers.minio import MinioReader, BotoMinioReader` +`from llama_index.readers.minio import MinioReader, BotoMinioReader` diff --git a/llama-index-integrations/readers/llama-index-readers-minio/llama_index/README.md b/llama-index-integrations/readers/llama-index-readers-minio/llama_index/README.md index e17e81f4d6bcc..3ae38a238236b 100644 --- a/llama-index-integrations/readers/llama-index-readers-minio/llama_index/README.md +++ b/llama-index-integrations/readers/llama-index-readers-minio/llama_index/README.md @@ -13,8 +13,6 @@ To use this loader, you need to pass in the name of your Minio Bucket. After tha Otherwise, you may specify a prefix if you only want to parse certain files in the Bucket, or a subdirectory. ```python -from llama_index import download_loader - MinioReader = download_loader("BotoMinioReader") loader = MinioReader( bucket="documents", @@ -40,8 +38,6 @@ Otherwise, you may specify a prefix if you only want to parse certain files in t You can now use the client with a TLS-secured MinIO instance (`minio_secure=True`), even if server's certificate isn't trusted (`minio_cert_check=False`).
```python -from llama_index import download_loader - MinioReader = download_loader("MinioReader") loader = MinioReader( bucket="documents", diff --git a/llama-index-integrations/readers/llama-index-readers-mondaydotcom/README.md b/llama-index-integrations/readers/llama-index-readers-mondaydotcom/README.md index 47e4b14b946e7..fd9d1f696fa5d 100644 --- a/llama-index-integrations/readers/llama-index-readers-mondaydotcom/README.md +++ b/llama-index-integrations/readers/llama-index-readers-mondaydotcom/README.md @@ -1,5 +1,9 @@ # Monday Loader +```bash +pip install llama-index-readers-mondaydotcom +``` + This loader loads data from monday.com. The user specifies an API token to initialize the MondayReader. They then specify a monday.com board id to load in the corresponding Document objects. ## Usage @@ -7,9 +11,7 @@ This loader loads data from monday.com. The user specifies an API token to initi Here's an example usage of the MondayReader. ```python -from llama_index import download_loader - -MondayReader = download_loader("MondayReader") +from llama_index.readers.mondaydotcom import MondayReader reader = MondayReader("") documents = reader.load_data("") diff --git a/llama-index-integrations/readers/llama-index-readers-nougat-ocr/README.md b/llama-index-integrations/readers/llama-index-readers-nougat-ocr/README.md index d38c41f7a01ad..56b3285ae302d 100644 --- a/llama-index-integrations/readers/llama-index-readers-nougat-ocr/README.md +++ b/llama-index-integrations/readers/llama-index-readers-nougat-ocr/README.md @@ -1,5 +1,9 @@ # Nougat OCR loader +```bash +pip install llama-index-readers-nougat-ocr +``` + This loader reads the equations, symbols, and tables included in the PDF. Users can input the path of the academic PDF document `file` which they want to parse. This OCR understands LaTeX math and tables. @@ -9,7 +13,7 @@ Users can input the path of the academic PDF document `file` which they want to Here's an example usage of the PDFNougatOCR. 
```python -from llama_hub.nougat_ocr import PDFNougatOCR +from llama_index.readers.nougat_ocr import PDFNougatOCR reader = PDFNougatOCR() diff --git a/llama-index-integrations/readers/llama-index-readers-openalex/README.md b/llama-index-integrations/readers/llama-index-readers-openalex/README.md index a171d0697be41..3ba2fb3b3bc11 100644 --- a/llama-index-integrations/readers/llama-index-readers-openalex/README.md +++ b/llama-index-integrations/readers/llama-index-readers-openalex/README.md @@ -1,11 +1,15 @@ # OpenAlex Reader +```bash +pip install llama-index-readers-openalex +``` + This loader will search for papers in OpenAlex and load them in llama-index. The main advantage of using OpenAlex is that you can search the full-text for Open Access papers as well. ## Usage ```python -from llama_hub.openalex_loader import OpenAlexReader +from llama_index.readers.openalex import OpenAlexReader openalex_reader = OpenAlexReader(email="shauryr@gmail.com") query = "biases in large language models" diff --git a/llama-index-integrations/readers/llama-index-readers-opendal/README.md b/llama-index-integrations/readers/llama-index-readers-opendal/README.md index 86cf7176efcb8..8890a2cc0aa78 100644 --- a/llama-index-integrations/readers/llama-index-readers-opendal/README.md +++ b/llama-index-integrations/readers/llama-index-readers-opendal/README.md @@ -1,5 +1,9 @@ # OpenDAL Loaders +```bash +pip install llama-index-readers-opendal +``` + ## Base OpendalReader This loader parses any file via [Apache OpenDAL](https://github.com/apache/incubator-opendal). @@ -11,9 +15,7 @@ All files are temporarily downloaded locally and subsequently parsed with `Simpl `OpendalReader` can read data from any supported storage services including `s3`, `azblob`, `gcs` and so on. 
```python -from llama_index import download_loader - -OpendalReader = download_loader("OpendalReader") +from llama_index.readers.opendal import OpendalReader loader = OpendalReader( scheme="s3", @@ -40,9 +42,7 @@ All files are temporarily downloaded locally and subsequently parsed with `Simpl ### Usage ```python -from llama_index import download_loader - -OpendalAzblobReader = download_loader("OpendalAzblobReader") +from llama_index.readers.opendal import OpendalAzblobReader loader = OpendalAzblobReader( container="container", @@ -69,9 +69,7 @@ All files are temporarily downloaded locally and subsequently parsed with `Simpl ### Usage ```python -from llama_index import download_loader - -OpendalGcsReader = download_loader("OpendalGcsReader") +from llama_index.readers.opendal import OpendalGcsReader loader = OpendalGcsReader( bucket="bucket", @@ -99,10 +97,6 @@ All files are temporarily downloaded locally and subsequently parsed with `Simpl ### Usage ```python -from llama_index import download_loader - -OpendalS3Reader = download_loader("OpendalS3Reader") - loader = OpendalS3Reader( bucket="bucket", path="path/to/data/", diff --git a/llama-index-integrations/readers/llama-index-readers-opensearch/README.md b/llama-index-integrations/readers/llama-index-readers-opensearch/README.md index 2af8cd6372232..b9a172008b24f 100644 --- a/llama-index-integrations/readers/llama-index-readers-opensearch/README.md +++ b/llama-index-integrations/readers/llama-index-readers-opensearch/README.md @@ -1,5 +1,9 @@ # Opensearch Loader +```bash +pip install llama-index-readers-opensearch +``` + The Opensearch Loader returns a set of texts corresponding to documents retrieved from an Opensearch index. The user initializes the loader with an Opensearch index. They then pass in a field, and optionally a JSON query DSL object to fetch the fields they want. @@ -8,9 +12,7 @@ The user initializes the loader with an Opensearch index. 
They then pass in a fi Here's an example usage of the OpensearchReader to load 100 documents. ```python -from llama_index import download_loader - -OpensearchReader = download_loader("OpensearchReader") +from llama_index.readers.opensearch import OpensearchReader reader = OpensearchReader( host="localhost", diff --git a/llama-index-integrations/readers/llama-index-readers-pandas-ai/README.md b/llama-index-integrations/readers/llama-index-readers-pandas-ai/README.md index 7c5dc5d16c2a2..15124e6e2f9ec 100644 --- a/llama-index-integrations/readers/llama-index-readers-pandas-ai/README.md +++ b/llama-index-integrations/readers/llama-index-readers-pandas-ai/README.md @@ -1,5 +1,9 @@ # Pandas AI Loader +```bash +pip install llama-index-readers-pandas-ai +``` + This loader is a light wrapper around the `PandasAI` Python package. See here: https://github.com/gventuri/pandas-ai. @@ -10,7 +14,6 @@ you can choose to load in `Document` objects via `load_data`. ## Usage ```python -from llama_index import download_loader from pandasai.llm.openai import OpenAI import pandas as pd @@ -47,7 +50,7 @@ df = pd.DataFrame( llm = OpenAI() -PandasAIReader = download_loader("PandasAIReader") +from llama_index.readers.pandas_ai import PandasAIReader # use run_pandas_ai directly # set is_conversational_answer=False to get parsed output diff --git a/llama-index-integrations/readers/llama-index-readers-papers/README.md b/llama-index-integrations/readers/llama-index-readers-papers/README.md index 54d66b6bc3da6..7dbebcfb7499b 100644 --- a/llama-index-integrations/readers/llama-index-readers-papers/README.md +++ b/llama-index-integrations/readers/llama-index-readers-papers/README.md @@ -1,5 +1,9 @@ # Papers Loaders +```bash +pip install llama-index-readers-papers +``` + ## Arxiv Papers Loader This loader fetches the text from the most relevant scientific papers on Arxiv specified by a search query (e.g. "Artificial Intelligence"). 
For each paper, the abstract is extracted and put in a separate document. The search query may be any string, Arxiv paper id, or a general Arxiv query string (see the full list of capabilities [here](https://info.arxiv.org/help/api/user-manual.html#query_details)). @@ -9,9 +13,7 @@ This loader fetches the text from the most relevant scientific papers on Arxiv s To use this loader, you need to pass in the search query. You may also optionally specify a local directory to temporarily store the paper PDFs (they are deleted automatically) and the maximum number of papers you want to parse for your search query (default is 10). ```python -from llama_index import download_loader - -ArxivReader = download_loader("ArxivReader") +from llama_index.readers.papers import ArxivReader loader = ArxivReader() documents = loader.load_data(search_query="au:Karpathy") @@ -20,9 +22,7 @@ documents = loader.load_data(search_query="au:Karpathy") Alternatively, if you would like to load papers and abstracts separately: ```python -from llama_index import download_loader - -ArxivReader = download_loader("ArxivReader") +from llama_index.readers.papers import ArxivReader loader = ArxivReader() documents, abstracts = loader.load_papers_and_abstracts( @@ -41,9 +41,7 @@ This loader fetches the text from the most relevant scientific papers on Pubmed To use this loader, you need to pass in the search query. You may also optionally specify the maximum number of papers you want to parse for your search query (default is 10). 
```python -from llama_index import download_loader - -PubmedReader = download_loader("PubmedReader") +from llama_index.readers.papers import PubmedReader loader = PubmedReader() documents = loader.load_data(search_query="amyloidosis") diff --git a/llama-index-integrations/readers/llama-index-readers-patentsview/README.md b/llama-index-integrations/readers/llama-index-readers-patentsview/README.md index 127d653495ab3..c283ffa887e4e 100644 --- a/llama-index-integrations/readers/llama-index-readers-patentsview/README.md +++ b/llama-index-integrations/readers/llama-index-readers-patentsview/README.md @@ -1,5 +1,9 @@ # Patentsview Loader +```bash +pip install llama-index-readers-patentsview +``` + This loader loads patent abstract from `a list of patent numbers` with API provided by [Patentsview](https://patentsview.org/). ## Usage @@ -7,9 +11,8 @@ This loader loads patent abstract from `a list of patent numbers` with API provi Here'a an example usage of PatentsviewReader. ```python -from llama_index import download_loader +from llama_index.readers.patentsview import PatentsviewReader -PatentsviewReader = download_loader("PatentsviewReader") loader = PatentsviewReader() patents = ["8848839", "10452978"] abstracts = loader.load_data(patents) diff --git a/llama-index-integrations/readers/llama-index-readers-pdb/README.md b/llama-index-integrations/readers/llama-index-readers-pdb/README.md index 9997c20ac48ec..b82f352b14e29 100644 --- a/llama-index-integrations/readers/llama-index-readers-pdb/README.md +++ b/llama-index-integrations/readers/llama-index-readers-pdb/README.md @@ -1,5 +1,9 @@ # Protein Data Bank (PDB) publication Loader +```bash +pip install llama-index-readers-pdb +``` + This loader fetches the abstract of PDB entries using the RCSB (Research Collaboratory for Structural Bioinformatics) or EBI (European Bioinformatics Institute) REST api. 
## Usage @@ -7,7 +11,7 @@ This loader fetches the abstract of PDB entries using the RCSB (Research Collabo To use this loader, simply pass an array of PDB ids into `load_data`: ```python -from llama_hub.pdb import PdbAbstractReader +from llama_index.readers.pdb import PdbAbstractReader loader = PdbAbstractReader() documents = loader.load_data(pdb_id=["1cbs"]) diff --git a/llama-index-integrations/readers/llama-index-readers-pdf-table/README.md b/llama-index-integrations/readers/llama-index-readers-pdf-table/README.md index bfe9e0271a333..5036097ec1e85 100644 --- a/llama-index-integrations/readers/llama-index-readers-pdf-table/README.md +++ b/llama-index-integrations/readers/llama-index-readers-pdf-table/README.md @@ -1,5 +1,9 @@ # PDF Table Loader +```bash +pip install llama-index-readers-pdf-table +``` + This loader reads the tables included in the PDF. Users can input the PDF `file` and the `pages` from which they want to extract tables, and they can read the tables included on those pages. @@ -10,7 +14,7 @@ Here's an example usage of the PDFTableReader. `pages` parameter is the same as camelot's `pages`. Therefore, you can use patterns such as `all`, `1,2,3`, `10-20`, and so on. ```python -from llama_hub.pdf_table import PDFTableReader +from llama_index.readers.pdf_table import PDFTableReader from pathlib import Path reader = PDFTableReader() diff --git a/llama-index-integrations/readers/llama-index-readers-preprocess/README.md b/llama-index-integrations/readers/llama-index-readers-preprocess/README.md index ae514fbdf4893..ebd34f3fdea04 100644 --- a/llama-index-integrations/readers/llama-index-readers-preprocess/README.md +++ b/llama-index-integrations/readers/llama-index-readers-preprocess/README.md @@ -1,5 +1,9 @@ # Preprocess Loader +```bash +pip install llama-index-readers-preprocess +``` + [Preprocess](https://preprocess.co) is an API service that splits any kind of document into optimal chunks of text for use in language model tasks. 
Given documents in input `Preprocess` splits them into chunks of text that respect the layout and semantics of the original document. We split the content by taking into account sections, paragraphs, lists, images, data tables, text tables, and slides, and following the content semantics for long texts. @@ -26,10 +30,9 @@ To chunk a file pass a valid filepath and the reader will start converting and c If you want to handle the nodes directly: ```python -from llama_index import VectorStoreIndex -from llama_index import download_loader +from llama_index.core import VectorStoreIndex -PreprocessReader = download_loader("PreprocessReader") +from llama_index.readers.preprocess import PreprocessReader # pass a filepath and get the chunks as nodes loader = PreprocessReader( @@ -45,10 +48,9 @@ query_engine = index.as_query_engine() By default load_data() returns a document for each chunk, remember to not apply any splitting to these documents ```python -from llama_index import VectorStoreIndex -from llama_index import download_loader +from llama_index.core import VectorStoreIndex -PreprocessReader = download_loader("PreprocessReader") +from llama_index.readers.preprocess import PreprocessReader # pass a filepath and get the chunks as nodes loader = PreprocessReader( diff --git a/llama-index-integrations/readers/llama-index-readers-rayyan/README.md b/llama-index-integrations/readers/llama-index-readers-rayyan/README.md index d5dae921eac7c..05c589fa43c8e 100644 --- a/llama-index-integrations/readers/llama-index-readers-rayyan/README.md +++ b/llama-index-integrations/readers/llama-index-readers-rayyan/README.md @@ -1,5 +1,9 @@ # Rayyan Loader +```bash +pip install llama-index-readers-rayyan +``` + This loader fetches review articles from [Rayyan](https://www.rayyan.ai/) using the [Rayyan SDK](https://github.com/rayyansys/rayyan-python-sdk). All articles for a given review are fetched by default unless a filter is specified. 
@@ -11,9 +15,8 @@ and optionally the API server URL if different from the default. More details about these parameters can be found in the official Rayyan SDK repository. ```python -from llama_index import download_loader +from llama_index.readers.rayyan import RayyanReader -RayyanReader = download_loader("RayyanReader") loader = RayyanReader(credentials_path="path/to/rayyan-creds.json") ``` diff --git a/llama-index-integrations/readers/llama-index-readers-readwise/README.md b/llama-index-integrations/readers/llama-index-readers-readwise/README.md index 525cfe8b25917..9aa461c5822f3 100644 --- a/llama-index-integrations/readers/llama-index-readers-readwise/README.md +++ b/llama-index-integrations/readers/llama-index-readers-readwise/README.md @@ -1,5 +1,9 @@ # Readwise Reader +```bash +pip install llama-index-readers-readwise +``` + Use Readwise's export API to fetch your highlights from web articles, epubs, pdfs, Kindle, YouTube, and load the resulting text into LLMs. ## Setup @@ -12,9 +16,10 @@ Here is an example usage of the Readwise Reader: ```python import os -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex + +from llama_index.readers.readwise import ReadwiseReader -ReadwiseReader = download_loader("ReadwiseReader") token = os.getenv("READWISE_API_KEY") loader = ReadwiseReader(api_key=token) documents = loader.load_data() @@ -28,9 +33,10 @@ You can also query for highlights that have been created after a certain time: ```python import os import datetime -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex + +from llama_index.readers.readwise import ReadwiseReader -ReadwiseReader = download_loader("ReadwiseReader") token = os.getenv("READWISE_API_KEY") loader = ReadwiseReader(api_key=token) seven_days_ago = datetime.datetime.now() - datetime.timedelta(days=7) diff --git
a/llama-index-integrations/readers/llama-index-readers-reddit/README.md b/llama-index-integrations/readers/llama-index-readers-reddit/README.md index 7153d344f6d81..ea964afc453eb 100644 --- a/llama-index-integrations/readers/llama-index-readers-reddit/README.md +++ b/llama-index-integrations/readers/llama-index-readers-reddit/README.md @@ -1,5 +1,9 @@ # Reddit Reader +```bash +pip install llama-index-readers-reddit +``` + For any subreddit(s) you're interested in, search for relevant posts using keyword(s) and load the resulting text in the post and and top-level comments into LLMs/ LangChains. ## Get your Reddit credentials ready @@ -15,9 +19,9 @@ For any subreddit(s) you're interested in, search for relevant posts using keywo ### LlamaIndex ```python -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex -RedditReader = download_loader("RedditReader") +from llama_index.readers.reddit import RedditReader subreddits = ["MachineLearning"] search_keys = ["PyTorch", "deploy"] @@ -35,13 +39,13 @@ index.query("What are the pain points of PyTorch users?") ### LangChain ```python -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex from langchain.agents import initialize_agent, Tool from langchain.llms import OpenAI from langchain.chains.conversation.memory import ConversationBufferMemory -RedditReader = download_loader("RedditReader") +from llama_index.readers.reddit import RedditReader subreddits = ["MachineLearning"] search_keys = ["PyTorch", "deploy"] diff --git a/llama-index-integrations/readers/llama-index-readers-remote-depth/README.md b/llama-index-integrations/readers/llama-index-readers-remote-depth/README.md index 48ba8b0ab8159..886acec8ddeb0 100644 --- a/llama-index-integrations/readers/llama-index-readers-remote-depth/README.md +++ b/llama-index-integrations/readers/llama-index-readers-remote-depth/README.md @@ -1,5 +1,9 @@
# Remote Page/File Loader +```bash +pip install llama-index-readers-remote-depth +``` + This loader makes it easy to extract the text from the links available in a webpage URL, and extract the links presents in the page. It's based on `RemoteReader` (reading single page), that is based on `SimpleDirectoryReader` (parsing the document if file is a pdf, etc). It is an all-in-one tool for (almost) any group of urls. You can try with this MIT lecture link, it will be able to extract the syllabus, the PDFs, etc: @@ -10,9 +14,7 @@ You can try with this MIT lecture link, it will be able to extract the syllabus, You need to specify the parameter `depth` to specify how many levels of links you want to extract. For example, if you want to extract the links in the page, and the links in the links in the page, you need to specify `depth=2`. ```python -from llama_index import download_loader - -RemoteDepthReader = download_loader("RemoteDepthReader") +from llama_index.readers.remote_depth import RemoteDepthReader loader = RemoteDepthReader() documents = loader.load_data( diff --git a/llama-index-integrations/readers/llama-index-readers-remote/README.md b/llama-index-integrations/readers/llama-index-readers-remote/README.md index f9ff15c271201..c4f8e64a1c8f0 100644 --- a/llama-index-integrations/readers/llama-index-readers-remote/README.md +++ b/llama-index-integrations/readers/llama-index-readers-remote/README.md @@ -1,5 +1,9 @@ # Remote Page/File Loader +```bash +pip install llama-index-readers-remote +``` + This loader makes it easy to extract the text from any remote page or file using just its url. If there's a file at the url, this loader will download it temporarily and parse it using `SimpleDirectoryReader`. It is an all-in-one tool for (almost) any url. As a result, any page or type of file is supported. For instance, if a `.txt` url such as a [Project Gutenberg book](https://www.gutenberg.org/cache/epub/69994/pg69994.txt) is passed in, the text will be parsed as is. 
On the other hand, if a hosted .mp3 url is passed in, it will be downloaded and parsed using `AudioTranscriber`. @@ -9,9 +13,7 @@ As a result, any page or type of file is supported. For instance, if a `.txt` ur To use this loader, you need to pass in a `Path` to a local file. Optionally, you may specify a `file_extractor` for the `SimpleDirectoryReader` to use, other than the default one. ```python -from llama_index import download_loader - -RemoteReader = download_loader("RemoteReader") +from llama_index.readers.remote import RemoteReader loader = RemoteReader() documents = loader.load_data( diff --git a/llama-index-integrations/readers/llama-index-readers-s3/README.md b/llama-index-integrations/readers/llama-index-readers-s3/README.md index f4413b0f5a2ae..96c3ed4d95f27 100644 --- a/llama-index-integrations/readers/llama-index-readers-s3/README.md +++ b/llama-index-integrations/readers/llama-index-readers-s3/README.md @@ -11,10 +11,6 @@ To use this loader, you need to pass in the name of your S3 Bucket. After that, Otherwise, you may specify a prefix if you only want to parse certain files in the Bucket, or a subdirectory. AWS Access Key credentials may either be passed in during initialization or stored locally (see above). 
```python -from llama_index import download_loader - -S3Reader = download_loader("S3Reader") - loader = S3Reader( bucket="scrabble-dictionary", key="dictionary.txt", diff --git a/llama-index-integrations/readers/llama-index-readers-sec-filings/README.md b/llama-index-integrations/readers/llama-index-readers-sec-filings/README.md index 15d0155f31f04..4a2e0a33abd02 100644 --- a/llama-index-integrations/readers/llama-index-readers-sec-filings/README.md +++ b/llama-index-integrations/readers/llama-index-readers-sec-filings/README.md @@ -1,5 +1,9 @@ # SEC DATA DOWNLOADER +```bash +pip install llama-index-readers-sec-filings +``` + Please checkout this repo that I am building on SEC Question Answering Agent [SEC-QA](https://github.com/Athe-kunal/SEC-QA-Agent) This repository downloads all the texts from SEC documents (10-K and 10-Q). Currently, it is not supporting documents that are amended, but that will be added in the near futures. @@ -21,9 +25,7 @@ The SEC Downloader expects 5 attributes ## Usage ```python -from llama_index import download_loader - -SECFilingsLoader = download_loader("SECFilingsLoader") +from llama_index.readers.sec_filings import SECFilingsLoader loader = SECFilingsLoader(tickers=["TSLA"], amount=3, filing_type="10-K") loader.load_data() @@ -95,10 +97,10 @@ This loader is can be used with both Langchain and LlamaIndex. 
### LlamaIndex ```python -from llama_index import VectorStoreIndex, download_loader -from llama_index import SimpleDirectoryReader +from llama_index.core import VectorStoreIndex +from llama_index.core import SimpleDirectoryReader -SECFilingsLoader = download_loader("SECFilingsLoader") +from llama_index.readers.sec_filings import SECFilingsLoader loader = SECFilingsLoader(tickers=["TSLA"], amount=3, filing_type="10-K") loader.load_data() @@ -111,13 +113,12 @@ index.query("What are the risk factors of Tesla for the year 2022?") ### Langchain ```python -from llama_index import download_loader from langchain.llms import OpenAI from langchain.chains import RetrievalQA from langchain.document_loaders import DirectoryLoader from langchain.indexes import VectorstoreIndexCreator -SECFilingsLoader = download_loader("SECFilingsLoader") +from llama_index.readers.sec_filings import SECFilingsLoader loader = SECFilingsLoader(tickers=["TSLA"], amount=3, filing_type="10-K") loader.load_data() diff --git a/llama-index-integrations/readers/llama-index-readers-semanticscholar/README.md b/llama-index-integrations/readers/llama-index-readers-semanticscholar/README.md index 0242f63cd6e20..08b6a486f6053 100644 --- a/llama-index-integrations/readers/llama-index-readers-semanticscholar/README.md +++ b/llama-index-integrations/readers/llama-index-readers-semanticscholar/README.md @@ -1,5 +1,11 @@ # Semantic Scholar Loader +```bash +pip install llama-index-readers-semanticscholar + +pip install llama-index-llms-openai +``` + Welcome to Semantic Scholar Loader. This module serves as a crucial utility for researchers and professionals looking to get scholarly articles and publications from the Semantic Scholar database. For any research topic you are interested in, this loader reads relevant papers from a search result in Semantic Scholar into `Documents`.
@@ -27,13 +33,10 @@ Here is an example of how to use this loader in `llama_index` and get citations ### LlamaIndex ```python -from llama_index.llms import OpenAI -from llama_index.query_engine import CitationQueryEngine -from llama_index import ( - VectorStoreIndex, - ServiceContext, -) -from llama_hub.semanticscholar import SemanticScholarReader +from llama_index.llms.openai import OpenAI +from llama_index.core.query_engine import CitationQueryEngine +from llama_index.core import VectorStoreIndex, ServiceContext +from llama_index.readers.semanticscholar import SemanticScholarReader s2reader = SemanticScholarReader() diff --git a/llama-index-integrations/readers/llama-index-readers-singlestore/README.md b/llama-index-integrations/readers/llama-index-readers-singlestore/README.md index 5ab20d4d6c46f..1b98a72969891 100644 --- a/llama-index-integrations/readers/llama-index-readers-singlestore/README.md +++ b/llama-index-integrations/readers/llama-index-readers-singlestore/README.md @@ -1,5 +1,9 @@ # SingleStore Loader +```bash +pip install llama-index-readers-singlestore +``` + The SingleStore Loader retrieves a set of documents from a specified table in a SingleStore database. The user initializes the loader with database information and then provides a search embedding for retrieving similar documents. 
## Usage @@ -7,7 +11,7 @@ The SingleStore Loader retrieves a set of documents from a specified table in a Here's an example usage of the SingleStoreReader: ```python -from llama_hub.singlestore import SingleStoreReader +from llama_index.readers.singlestore import SingleStoreReader # Initialize the reader with your SingleStore database credentials and other relevant details reader = SingleStoreReader( diff --git a/llama-index-integrations/readers/llama-index-readers-smart-pdf-loader/README.md b/llama-index-integrations/readers/llama-index-readers-smart-pdf-loader/README.md index ceccf5377e664..1184ce086a6a6 100644 --- a/llama-index-integrations/readers/llama-index-readers-smart-pdf-loader/README.md +++ b/llama-index-integrations/readers/llama-index-readers-smart-pdf-loader/README.md @@ -1,5 +1,9 @@ # Smart PDF Loader +```bash +pip install llama-index-readers-smart-pdf-loader +``` + SmartPDFLoader is a super fast PDF reader that understands the layout structure of PDFs such as nested sections, nested lists, paragraphs and tables. It uses layout information to smartly chunk PDFs into optimal short contexts for LLMs. @@ -16,7 +20,7 @@ pip install llmsherpa Here's an example usage of the SmartPDFLoader: ```python -from llama_hub.smart_pdf_loader import SmartPDFLoader +from llama_index.readers.smart_pdf_loader import SmartPDFLoader llmsherpa_api_url = "https://readers.llmsherpa.com/api/document/developer/parseDocument?renderFormat=all" pdf_url = "https://arxiv.org/pdf/1910.13461.pdf" # also allowed is a file path e.g. /home/downloads/xyz.pdf @@ -27,7 +31,7 @@ documents = pdf_loader.load_data(pdf_url) Now you can use the documents with other LlamaIndex components. 
For example, for retrieval augmented generation, try this: ```python -from llama_index import VectorStoreIndex +from llama_index.core import VectorStoreIndex index = VectorStoreIndex.from_documents(documents) query_engine = index.as_query_engine() diff --git a/llama-index-integrations/readers/llama-index-readers-snowflake/README.md b/llama-index-integrations/readers/llama-index-readers-snowflake/README.md index d0302f8343088..c6c0daec2cf5b 100644 --- a/llama-index-integrations/readers/llama-index-readers-snowflake/README.md +++ b/llama-index-integrations/readers/llama-index-readers-snowflake/README.md @@ -1,5 +1,9 @@ # Snowflake Loader +```bash +pip install llama-index-readers-snowflake +``` + This loader connects to Snowflake (using SQLAlchemy under the hood). The user specifies a query and extracts Document objects corresponding to the results. You can use this loader to easily connect to a database on Snowflake and pass the documents into a `GPTSQLStructStoreIndex` from LlamaIndex. ## Usage @@ -9,9 +13,7 @@ This loader connects to Snowflake (using SQLAlchemy under the hood). The user sp Here's an example usage of the SnowflakeReader. ```python -from llama_index import download_loader - -SnowflakeReader = download_loader("SnowflakeReader") +from llama_index.readers.snowflake import SnowflakeReader reader = SnowflakeReader( engine=your_sqlalchemy_engine, @@ -27,9 +29,7 @@ documents = reader.load_data(query=query) Here's an example usage of the SnowflakeReader. 
```python -from llama_index import download_loader - -SnowflakeReader = download_loader("SnowflakeReader") +from llama_index.readers.snowflake import SnowflakeReader reader = SnowflakeReader( account="your_account", diff --git a/llama-index-integrations/readers/llama-index-readers-snscrape-twitter/README.md b/llama-index-integrations/readers/llama-index-readers-snscrape-twitter/README.md index 681155514845a..e6d7b0f9aee60 100644 --- a/llama-index-integrations/readers/llama-index-readers-snscrape-twitter/README.md +++ b/llama-index-integrations/readers/llama-index-readers-snscrape-twitter/README.md @@ -1,5 +1,9 @@ # Snscrape twitter Loader +```bash +pip install llama-index-readers-snscrape-twitter +``` + This loader loads documents from Twitter using the Snscrape Python package. ## Usage @@ -7,10 +11,9 @@ This loader loads documents from Twitter using the Snscrape Python package. Here's an example usage of the SnscrapeReader. ```python -from llama_index import download_loader import os -SnscrapeReader = download_loader("SnscrapeTwitterReader") +from llama_index.readers.snscrape_twitter import SnscrapeTwitterReader as SnscrapeReader loader = SnscrapeReader() documents = loader.load_data(username="elonmusk", num_tweets=10) diff --git a/llama-index-integrations/readers/llama-index-readers-spotify/README.md b/llama-index-integrations/readers/llama-index-readers-spotify/README.md index 502d91d282b8a..59cc209d622e3 100644 --- a/llama-index-integrations/readers/llama-index-readers-spotify/README.md +++ b/llama-index-integrations/readers/llama-index-readers-spotify/README.md @@ -1,5 +1,9 @@ # Spotify Loader +```bash +pip install llama-index-readers-spotify +``` + This loader reads your Spotify account and loads saved albums, tracks, or playlists into `Documents`. As a prerequisite, you will need to register with [Spotify for Developers](https://developer.spotify.com) and create an app in order to get a `client_id` and a `client_secret`.
You should then set a `redirect_uri` for the app (in the web dashboard under app settings). The `redirect_uri` does not need to be functional. You should then set the `client_id`, `client_secret`, and `redirect_uri` as environmental variables. @@ -13,9 +17,7 @@ As a prerequisite, you will need to register with [Spotify for Developers](https Here's an example usage of the SpotifyReader. It will retrieve your saved albums, unless an optional `collection` argument is passed. Acceptable arguments are "albums", "tracks", and "playlists". ```python -from llama_index import download_loader - -SpotifyReader = download_loader("SpotifyReader") +from llama_index.readers.spotify import SpotifyReader loader = SpotifyReader() documents = loader.load_data() @@ -28,9 +30,9 @@ This loader is designed to be used as a way to load data into [LlamaIndex](https ### LlamaIndex ```python -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex -SpotifyReader = download_loader("SpotifyReader") +from llama_index.readers.spotify import SpotifyReader loader = SpotifyReader() documents = loader.load_data() diff --git a/llama-index-integrations/readers/llama-index-readers-stripe-docs/README.md b/llama-index-integrations/readers/llama-index-readers-stripe-docs/README.md index 33d669b7aeb49..15dddba1fab8e 100644 --- a/llama-index-integrations/readers/llama-index-readers-stripe-docs/README.md +++ b/llama-index-integrations/readers/llama-index-readers-stripe-docs/README.md @@ -1,5 +1,9 @@ # StripeDocs Loader +```bash +pip install llama-index-readers-stripe-docs +``` + This loader asynchronously loads data from the [Stripe documentation](https://stripe.com/docs). It iterates through the Stripe sitemap to get all `/docs` references. It is based on the [Async Website Loader](https://llamahub.ai/l/web-async_web). @@ -7,8 +11,8 @@ It is based on the [Async Website Loader](https://llamahub.ai/l/web-async_web).
## Usage ```python -from llama_index import VectorStoreIndex -from llama_hub.stripe_docs import StripeDocsReader +from llama_index.core import VectorStoreIndex +from llama_index.readers.stripe_docs import StripeDocsReader loader = StripeDocsReader() documents = loader.load_data() diff --git a/llama-index-integrations/readers/llama-index-readers-telegram/README.md b/llama-index-integrations/readers/llama-index-readers-telegram/README.md index 0ee82e3344510..6b05fdc064223 100644 --- a/llama-index-integrations/readers/llama-index-readers-telegram/README.md +++ b/llama-index-integrations/readers/llama-index-readers-telegram/README.md @@ -1,5 +1,9 @@ # Telegram Loader +```bash +pip install llama-index-readers-telegram +``` + This loader fetches posts/chat messages/comments from Telegram channels or chats into `Document`s. Before working with Telegram’s API, you need to get your own API ID and hash: @@ -31,9 +35,8 @@ If the `.session` file already existed, it will not login again, so be aware of To use this loader, you simply need to pass in a entity name. ```python -from llama_index.core import download_loader +from llama_index.readers.telegram import TelegramReader -TelegramReader = download_loader("TelegramReader") loader = TelegramReader( session_name="[YOUR_SESSION_NAME]", api_id="[YOUR_API_ID]", diff --git a/llama-index-integrations/readers/llama-index-readers-trello/README.md b/llama-index-integrations/readers/llama-index-readers-trello/README.md index 787e53605bb80..aaf2fe018b78a 100644 --- a/llama-index-integrations/readers/llama-index-readers-trello/README.md +++ b/llama-index-integrations/readers/llama-index-readers-trello/README.md @@ -1,5 +1,9 @@ # Trello Loader +```bash +pip install llama-index-readers-trello +``` + This loader loads documents from Trello. The user specifies an API key and API token to initialize the TrelloReader. They then specify a board_id to load in the corresponding Document objects representing Trello cards. 
@@ -8,10 +12,9 @@ load in the corresponding Document objects representing Trello cards. Here's an example usage of the TrelloReader. ```python -from llama_index import download_loader import os -TrelloReader = download_loader("TrelloReader") +from llama_index.readers.trello import TrelloReader reader = TrelloReader("", "") documents = reader.load_data(board_id="") diff --git a/llama-index-integrations/readers/llama-index-readers-weather/README.md b/llama-index-integrations/readers/llama-index-readers-weather/README.md index f20eb54baa6cf..93de04fc5ceef 100644 --- a/llama-index-integrations/readers/llama-index-readers-weather/README.md +++ b/llama-index-integrations/readers/llama-index-readers-weather/README.md @@ -1,5 +1,9 @@ # Weather Loader +```bash +pip install llama-index-readers-weather +``` + This loader fetches the weather data from the [OpenWeatherMap](https://openweathermap.org/api)'s OneCall API, using the `pyowm` Python package. You must initialize the loader with your OpenWeatherMap API token, and then pass in the names of the cities you want the weather data for. OWM's One Call API provides the following weather data for any geographical coordinate: - Current weather - Hourly forecast for 48 hours - Daily forecast for 7 days @@ -9,9 +13,7 @@ OWM's One Call API provides the following weather data for any geographical coor To use this loader, you need to pass in an array of city names (eg. [chennai, chicago]). Pass in the country codes as well for better accuracy. 
```python -from llama_index import download_loader - -WeatherReader = download_loader("WeatherReader") +from llama_index.readers.weather import WeatherReader loader = WeatherReader(token="[YOUR_TOKEN]") documents = loader.load_data(places=["Chennai, IN", "Dublin, IE"]) diff --git a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/async_web/README.md b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/async_web/README.md index 44c8985196a36..0706ae999e574 100644 --- a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/async_web/README.md +++ b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/async_web/README.md @@ -1,5 +1,9 @@ # Async Website Loader +```bash +pip install llama-index-readers-web +``` + This loader is an asynchronous web scraper that fetches the text from static websites by converting the HTML to text. ## Usage @@ -7,7 +11,7 @@ This loader is an asynchronous web scraper that fetches the text from static web To use this loader, you need to pass in an array of URLs. 
```python -from llama_index.readers.web.async_web.base import AsyncWebPageReader +from llama_index.readers.web import AsyncWebPageReader # for jupyter notebooks uncomment the following two lines of code: # import nest_asyncio diff --git a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/beautiful_soup_web/README.md b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/beautiful_soup_web/README.md index 331cd5fce7661..f3506e6818ad6 100644 --- a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/beautiful_soup_web/README.md +++ b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/beautiful_soup_web/README.md @@ -1,5 +1,9 @@ # Beautiful Soup Website Loader +```bash +pip install llama-index-readers-web +``` + This loader is a web scraper that fetches the text from websites using the `Beautiful Soup` (aka `bs4`) Python package. Furthermore, the flexibility of Beautiful Soup allows for custom templates that enable the loader to extract the desired text from specific website designs, such as Substack. Check out the code to see how to add your own. ## Usage @@ -7,9 +11,7 @@ This loader is a web scraper that fetches the text from websites using the `Beau To use this loader, you need to pass in an array of URLs. 
```python -from llama_index import download_loader - -BeautifulSoupWebReader = download_loader("BeautifulSoupWebReader") +from llama_index.readers.web import BeautifulSoupWebReader loader = BeautifulSoupWebReader() documents = loader.load_data(urls=["https://google.com"]) @@ -38,9 +40,9 @@ This loader is designed to be used as a way to load data into [LlamaIndex](https ### LlamaIndex ```python -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex -BeautifulSoupWebReader = download_loader("BeautifulSoupWebReader") +from llama_index.readers.web import BeautifulSoupWebReader loader = BeautifulSoupWebReader() documents = loader.load_data(urls=["https://google.com"]) @@ -53,12 +55,12 @@ index.query("What language is on this website?") Note: Make sure you change the description of the `Tool` to match your use-case. ```python -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex from langchain.agents import initialize_agent, Tool from langchain.llms import OpenAI from langchain.chains.conversation.memory import ConversationBufferMemory -BeautifulSoupWebReader = download_loader("BeautifulSoupWebReader") +from llama_index.readers.web import BeautifulSoupWebReader loader = BeautifulSoupWebReader() documents = loader.load_data(urls=["https://google.com"]) diff --git a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/knowledge_base/README.md b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/knowledge_base/README.md index 816e70f3e7a61..397380d64829d 100644 --- a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/knowledge_base/README.md +++ b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/knowledge_base/README.md @@ -1,5 +1,9 @@ # Knowledge Base Website Loader +```bash +pip install llama-index-readers-web +``` +
This loader is a web crawler and scraper that fetches text content from websites hosting public knowledge bases. Examples are the [Intercom help center](https://www.intercom.com/help/en/) or the [Robinhood help center](https://robinhood.com/us/en/support/). Typically these sites have a directory structure with several sections and many articles in each section. This loader crawls and finds all links that match the article path provided, and scrapes the content of each article. This can be used to create bots that answer customer questions based on public documentation. It uses [Playwright](https://playwright.dev/python/) to drive a browser. This reduces the chance of getting blocked by Cloudflare or other CDNs, but makes it a bit more challenging to run on cloud services. @@ -17,9 +21,7 @@ This installs the browsers that Playwright requires. To use this loader, you need to pass in the root URL and the string to search for in the URL to tell if the crawler has reached an article. You also need to pass in several CSS selectors so the cralwer knows which links to follow and which elements to extract content from. use ```python -from llama_index import download_loader - -KnowledgeBaseWebReader = download_loader("KnowledgeBaseWebReader") +from llama_index.readers.web import KnowledgeBaseWebReader loader = KnowledgeBaseWebReader() documents = loader.load_data( @@ -39,9 +41,9 @@ This loader is designed to be used as a way to load data into [LlamaIndex](https ### LlamaIndex ```python -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex -KnowledgeBaseWebReader = download_loader("KnowledgeBaseWebReader") +from llama_index.readers.web import KnowledgeBaseWebReader loader = KnowledgeBaseWebReader() documents = loader.load_data( @@ -61,12 +63,12 @@ index.query("What languages does Intercom support?") Note: Make sure you change the description of the `Tool` to match your use-case. 
```python -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex from langchain.agents import initialize_agent, Tool from langchain.llms import OpenAI from langchain.chains.conversation.memory import ConversationBufferMemory -KnowledgeBaseWebReader = download_loader("KnowledgeBaseWebReader") +from llama_index.readers.web import KnowledgeBaseWebReader loader = KnowledgeBaseWebReader() documents = loader.load_data( diff --git a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/main_content_extractor/README.md b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/main_content_extractor/README.md index 6fb33b7b5e7b5..1dea93a5890da 100644 --- a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/main_content_extractor/README.md +++ b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/main_content_extractor/README.md @@ -1,5 +1,9 @@ # MainContentExtractor Website Loader +```bash +pip install llama-index-readers-web +``` + This loader is a web scraper that fetches the text from static websites using the `MainContentExtractor` Python package. For information on how to extract main content, README in the following github repository @@ -11,9 +15,7 @@ For information on how to extract main content, README in the following github r To use this loader, you need to pass in an array of URLs. 
```python -from llama_index import download_loader - -MainContentExtractorReader = download_loader("MainContentExtractorReader") +from llama_index.readers.web import MainContentExtractorReader loader = MainContentExtractorReader() documents = loader.load_data(urls=["https://google.com"]) @@ -24,9 +26,9 @@ documents = loader.load_data(urls=["https://google.com"]) ### LlamaIndex ```python -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex -MainContentExtractorReader = download_loader("MainContentExtractorReader") +from llama_index.readers.web import MainContentExtractorReader loader = MainContentExtractorReader() documents = loader.load_data(urls=["https://google.com"]) @@ -39,12 +41,12 @@ index.query("What language is on this website?") Note: Make sure you change the description of the `Tool` to match your use-case. ```python -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex from langchain.agents import initialize_agent, Tool from langchain.llms import OpenAI from langchain.chains.conversation.memory import ConversationBufferMemory -MainContentExtractorReader = download_loader("MainContentExtractorReader") +from llama_index.readers.web import MainContentExtractorReader loader = MainContentExtractorReader() documents = loader.load_data(urls=["https://google.com"]) diff --git a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/news/README.md b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/news/README.md index a20e912379d80..b56b7b83265b4 100644 --- a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/news/README.md +++ b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/news/README.md @@ -1,5 +1,9 @@ # News Article Loader +```bash +pip install llama-index-readers-web +``` + This loader makes use of 
the `newspaper3k` library to parse web page urls which have news articles in them. @@ -12,7 +16,7 @@ pip install newspaper3k Pass in an array of individual page URLs: ```python -from llama_index.readers.web.news import NewsArticleReader +from llama_index.readers.web import NewsArticleReader reader = NewsArticleReader(use_nlp=False) documents = reader.load_data( diff --git a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/readability_web/README.md b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/readability_web/README.md index 75da465912bc2..d41b4fe2d97af 100644 --- a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/readability_web/README.md +++ b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/readability_web/README.md @@ -1,5 +1,9 @@ # Readability Webpage Loader +```bash +pip install llama-index-readers-web +``` + Extracting relevant information from a fully rendered web page. During the processing, it is always assumed that web pages used as data sources contain textual content. @@ -13,9 +17,7 @@ It is particularly effective for websites that use client-side rendering. To use this loader, you need to pass in a single of URL. ```python -from llama_index import download_loader - -ReadabilityWebPageReader = download_loader("ReadabilityWebPageReader") +from llama_index.readers.web import ReadabilityWebPageReader # or set proxy server for playwright: loader = ReadabilityWebPageReader(proxy="http://your-proxy-server:port") # For some specific web pages, you may need to set "wait_until" to "networkidle". 
loader = ReadabilityWebPageReader(wait_until="networkidle") @@ -33,9 +35,7 @@ This loader is designed to be used as a way to load data into [LlamaIndex](https ### LlamaIndex ```python -from llama_index import download_loader - -ReadabilityWebPageReader = download_loader("ReadabilityWebPageReader") +from llama_index.readers.web import ReadabilityWebPageReader loader = ReadabilityWebPageReader() documents = loader.load_data( @@ -51,12 +51,12 @@ print(index.query("What is pages?")) Note: Make sure you change the description of the `Tool` to match your use-case. ```python -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex from langchain.agents import initialize_agent, Tool from langchain.llms import OpenAI from langchain.chains.conversation.memory import ConversationBufferMemory -ReadabilityWebPageReader = download_loader("ReadabilityWebPageReader") +from llama_index.readers.web import ReadabilityWebPageReader loader = ReadabilityWebPageReader() documents = loader.load_data( diff --git a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/rss/README.md b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/rss/README.md index 4431bbb140f28..5e4e4e5d5440b 100644 --- a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/rss/README.md +++ b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/rss/README.md @@ -1,5 +1,9 @@ # RSS Loader +```bash +pip install llama-index-readers-web +``` + This loader allows fetching text from an RSS feed. It uses the `feedparser` module to fetch the feed and optionally the `html2text` module to sanitize it. @@ -8,9 +12,7 @@ to fetch the feed and optionally the `html2text` module to sanitize it. To use this loader, pass in an array of URL's. 
```python -from llama_index import download_loader - -RssReader = download_loader("RssReader") +from llama_index.readers.web import RssReader reader = RssReader() documents = reader.load_data( diff --git a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/rss_news/README.md b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/rss_news/README.md index 7b6965399f4e6..fb345385a3be8 100644 --- a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/rss_news/README.md +++ b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/rss_news/README.md @@ -9,7 +9,7 @@ To use this loader, pass in an array of URLs of RSS feeds. It will download the combine them: ```python -from llama_index.readers.web.rss_news import RSSNewsReader +from llama_index.readers.web.rss_news import RSSNewsReader urls = [ "https://rss.nytimes.com/services/xml/rss/nyt/HomePage.xml", diff --git a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/simple_web/README.md b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/simple_web/README.md index f14354eb2016a..b6f9d0ffa433a 100644 --- a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/simple_web/README.md +++ b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/simple_web/README.md @@ -1,5 +1,9 @@ # Simple Website Loader +```bash +pip install llama-index-readers-web +``` + This loader is a simple web scraper that fetches the text from static websites by converting the HTML to text. ## Usage @@ -7,9 +11,7 @@ This loader is a simple web scraper that fetches the text from static websites b To use this loader, you need to pass in an array of URLs. 
```python -from llama_index import download_loader - -SimpleWebPageReader = download_loader("SimpleWebPageReader") +from llama_index.readers.web import SimpleWebPageReader loader = SimpleWebPageReader() documents = loader.load_data(urls=["https://google.com"]) @@ -22,9 +24,9 @@ This loader is designed to be used as a way to load data into [LlamaIndex](https ### LlamaIndex ```python -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex -SimpleWebPageReader = download_loader("SimpleWebPageReader") +from llama_index.readers.web import SimpleWebPageReader loader = SimpleWebPageReader() documents = loader.load_data(urls=["https://google.com"]) @@ -37,12 +39,12 @@ index.query("What language is on this website?") Note: Make sure you change the description of the `Tool` to match your use-case. ```python -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex from langchain.agents import initialize_agent, Tool from langchain.llms import OpenAI from langchain.chains.conversation.memory import ConversationBufferMemory -SimpleWebPageReader = download_loader("SimpleWebPageReader") +from llama_index.readers.web import SimpleWebPageReader loader = SimpleWebPageReader() documents = loader.load_data(urls=["https://google.com"]) diff --git a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/sitemap/README.md b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/sitemap/README.md index 67066ecceb2e8..b7b5f557fe368 100644 --- a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/sitemap/README.md +++ b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/sitemap/README.md @@ -1,5 +1,9 @@ # Sitemap Loader +```bash +pip install llama-index-readers-web +``` + This loader is an asynchronous web scraper that fetches the text from static 
websites by using its sitemap and optionally converting the HTML to text. It is based on the [Async Website Loader](https://llama-hub-ui.vercel.app/l/web-async_web) @@ -9,7 +13,7 @@ It is based on the [Async Website Loader](https://llama-hub-ui.vercel.app/l/web- To use this loader, you just declare the sitemap.xml url like this: ```python -from llama_index.readers.web.sitemap import SitemapReader +from llama_index.readers.web import SitemapReader # for jupyter notebooks uncomment the following two lines of code: # import nest_asyncio diff --git a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/trafilatura_web/README.md b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/trafilatura_web/README.md index 2dc5b29dadee6..a75908bb1d6c9 100644 --- a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/trafilatura_web/README.md +++ b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/trafilatura_web/README.md @@ -1,5 +1,9 @@ # Trafilatura Website Loader +```bash +pip install llama-index-readers-web +``` + This loader is a web scraper that fetches the text from static websites using the `trafilatura` Python package. ## Usage @@ -7,9 +11,7 @@ This loader is a web scraper that fetches the text from static websites using th To use this loader, you need to pass in an array of URLs. 
```python -from llama_index import download_loader - -TrafilaturaWebReader = download_loader("TrafilaturaWebReader") +from llama_index.readers.web import TrafilaturaWebReader loader = TrafilaturaWebReader() documents = loader.load_data(urls=["https://google.com"]) @@ -22,9 +24,9 @@ This loader is designed to be used as a way to load data into [LlamaIndex](https ### LlamaIndex ```python -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex -TrafilaturaWebReader = download_loader("TrafilaturaWebReader") +from llama_index.readers.web import TrafilaturaWebReader loader = TrafilaturaWebReader() documents = loader.load_data(urls=["https://google.com"]) @@ -37,12 +39,12 @@ index.query("What language is on this website?") Note: Make sure you change the description of the `Tool` to match your use-case. ```python -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex from langchain.agents import initialize_agent, Tool from langchain.llms import OpenAI from langchain.chains.conversation.memory import ConversationBufferMemory -TrafilaturaWebReader = download_loader("TrafilaturaWebReader") +from llama_index.readers.web import TrafilaturaWebReader loader = TrafilaturaWebReader() documents = loader.load_data(urls=["https://google.com"]) diff --git a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/unstructured_web/README.md b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/unstructured_web/README.md index de555a882e7b0..671e1d915bd3b 100644 --- a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/unstructured_web/README.md +++ b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/unstructured_web/README.md @@ -1,14 +1,16 @@ # Unstructured.io URL Loader +```bash +pip install llama-index-readers-web +``` + This loader 
extracts the text from URLs using [Unstructured.io](https://github.com/Unstructured-IO/unstructured). The partition_html function partitions an HTML document and returns a list of document Element objects. ## Usage ```python -from llama_index import download_loader - -UnstructuredURLLoader = download_loader("UnstructuredURLLoader") +from llama_index.readers.web import UnstructuredURLLoader urls = [ "https://www.understandingwar.org/backgrounder/russian-offensive-campaign-assessment-february-8-2023", diff --git a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/whole_site/README.md b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/whole_site/README.md index 4a7f9268f950f..7a758d467393c 100644 --- a/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/whole_site/README.md +++ b/llama-index-integrations/readers/llama-index-readers-web/llama_index/readers/web/whole_site/README.md @@ -1,5 +1,9 @@ # WholeSiteReader +```bash +pip install llama-index-readers-web +``` + The WholeSiteReader is a sophisticated web scraping tool that employs a breadth-first search (BFS) algorithm. It's designed to methodically traverse and extract content from entire websites, focusing specifically on predefined URL paths. ## Features @@ -10,9 +14,8 @@ The WholeSiteReader is a sophisticated web scraping tool that employs a breadth- - **Selenium-Based:** Leverages Selenium for dynamic interaction with web pages, supporting JavaScript-rendered content. 
```python -from llama_index import download_loader +from llama_index.readers.web import WholeSiteReader -WholeSiteReader = download_loader("WholeSiteReader") # Initialize the scraper with a prefix URL and maximum depth scraper = WholeSiteReader( prefix="https://www.paulgraham.com/", max_depth=10 # Example prefix @@ -31,9 +34,9 @@ This loader is designed to be used as a way to load data into [LlamaIndex](https ### LlamaIndex ```python -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex -WholeSiteReader = download_loader("WholeSiteReader") +from llama_index.readers.web import WholeSiteReader # Initialize the scraper with a prefix URL and maximum depth scraper = WholeSiteReader( @@ -54,12 +57,12 @@ index.query("What language is on this website?") Note: Make sure you change the description of the `Tool` to match your use-case. ```python -from llama_index import VectorStoreIndex, download_loader +from llama_index.core import VectorStoreIndex from langchain.agents import initialize_agent, Tool from langchain.llms import OpenAI from langchain.chains.conversation.memory import ConversationBufferMemory -WholeSiteReader = download_loader("WholeSiteReader") +from llama_index.readers.web import WholeSiteReader # Initialize the scraper with a prefix URL and maximum depth scraper = WholeSiteReader( diff --git a/llama-index-integrations/readers/llama-index-readers-whatsapp/README.md b/llama-index-integrations/readers/llama-index-readers-whatsapp/README.md index 062ddad7e41c3..7e02868f20b02 100644 --- a/llama-index-integrations/readers/llama-index-readers-whatsapp/README.md +++ b/llama-index-integrations/readers/llama-index-readers-whatsapp/README.md @@ -1,5 +1,9 @@ # Whatsapp chat loader +```bash +pip install llama-index-readers-whatsapp +``` + ## Export a Whatsapp chat 1. 
Open a chat @@ -16,9 +20,8 @@ For more info see [Whatsapp's Help Center](https://faq.whatsapp.com/118041407917 ```python from pathlib import Path -from llama_index import download_loader -WhatsappChatLoader = download_loader("WhatsappChatLoader") +from llama_index.readers.whatsapp import WhatsappChatLoader path = "whatsapp.txt" loader = WhatsappChatLoader(path=path) diff --git a/llama-index-integrations/readers/llama-index-readers-wordlift/README.md b/llama-index-integrations/readers/llama-index-readers-wordlift/README.md index 38a2b9c3c7948..ef3f79e7acc93 100644 --- a/llama-index-integrations/readers/llama-index-readers-wordlift/README.md +++ b/llama-index-integrations/readers/llama-index-readers-wordlift/README.md @@ -1,5 +1,9 @@ # WordLift Reader +```bash +pip install llama-index-readers-wordlift +``` + The WordLift GraphQL Reader is a connector to fetch and transform data from a WordLift Knowledge Graph using your the WordLift Key. The connector provides a convenient way to load data from WordLift using a GraphQL query and transform it into a list of documents for further processing. 
## Usage @@ -15,10 +19,10 @@ Here's an example of how to use the WordLift GraphQL Reader: ```python import json -from llama_index import VectorStoreIndex -from llama_index.readers.schema import Document +from llama_index.core import VectorStoreIndex +from llama_index.core import Document from langchain.llms import OpenAI -from llama_hub.wordlift import WordLiftLoader +from llama_index.readers.wordlift import WordLiftLoader # Set up the necessary configuration options endpoint = "https://api.wordlift.io/graphql" diff --git a/llama-index-integrations/readers/llama-index-readers-wordpress/README.md b/llama-index-integrations/readers/llama-index-readers-wordpress/README.md index e46aadebd707d..7c57428410868 100644 --- a/llama-index-integrations/readers/llama-index-readers-wordpress/README.md +++ b/llama-index-integrations/readers/llama-index-readers-wordpress/README.md @@ -1,5 +1,9 @@ # Wordpress Loader +```bash +pip install llama-index-readers-wordpress +``` + This loader fetches the text from Wordpress blog posts using the Wordpress API. It also uses the BeautifulSoup library to parse the HTML and extract the text from the articles. ## Usage @@ -7,9 +11,7 @@ This loader fetches the text from Wordpress blog posts using the Wordpress API. To use this loader, you need to pass base url of the Wordpress installation (e.g. 
`https://www.mysite.com`), a username, and an application password for the user (more about application passwords [here](https://www.paidmembershipspro.com/create-application-password-wordpress/)) ```python -from llama_index import download_loader - -WordpressReader = download_loader("WordpressReader") +from llama_index.readers.wordpress import WordpressReader loader = WordpressReader( url="https://www.mysite.com", diff --git a/llama-index-integrations/readers/llama-index-readers-youtube-transcript/README.md b/llama-index-integrations/readers/llama-index-readers-youtube-transcript/README.md index cbd593ac41045..86333283ffed1 100644 --- a/llama-index-integrations/readers/llama-index-readers-youtube-transcript/README.md +++ b/llama-index-integrations/readers/llama-index-readers-youtube-transcript/README.md @@ -1,5 +1,11 @@ # Youtube Transcript Loader +```bash +pip install llama-hub-youtube-transcript + +pip install llama-index-readers-youtube-transcript +``` + This loader fetches the text transcript of Youtube videos using the `youtube_transcript_api` Python package. ## Usage @@ -9,7 +15,7 @@ To use this loader, you will need to first `pip install youtube_transcript_api`. 
Then, simply pass an array of YouTube links into `load_data`: ```python -from llama_hub.youtube_transcript import YoutubeTranscriptReader +from llama_index.readers.youtube_transcript import YoutubeTranscriptReader loader = YoutubeTranscriptReader() documents = loader.load_data( @@ -22,10 +28,10 @@ Supported URL formats: + youtube.com/watch?v={video_id} (with or without 'www.') To programmatically check if a URL is supported: ```python -from llama_hub.youtube_transcript import is_youtube_video +from llama_index.readers.youtube_transcript.utils import is_youtube_video is_youtube_video("https://youtube.com/watch?v=j83jrh2") # => True is_youtube_video("https://vimeo.com/272134160") # => False ``` -This loader is designed to be used as a way to load data into [LlamaIndex](https://github.com/run-llama/llama_index/tree/main/llama_index) and/or subsequently used as a Tool in a [LangChain](https://github.com/hwchase17/langchain) Agent. See [here](https://github.com/emptycrown/llama-hub/tree/main) for examples. +This loader is designed to be used as a way to load data into [LlamaIndex](https://github.com/run-llama/llama_index/tree/main/llama_index) and/or subsequently used as a Tool in a [LangChain](https://github.com/hwchase17/langchain) Agent. diff --git a/llama-index-integrations/readers/llama-index-readers-zendesk/README.md b/llama-index-integrations/readers/llama-index-readers-zendesk/README.md index 11aeec68fb237..126da790a3309 100644 --- a/llama-index-integrations/readers/llama-index-readers-zendesk/README.md +++ b/llama-index-integrations/readers/llama-index-readers-zendesk/README.md @@ -1,5 +1,9 @@ # Zendesk Loader +```bash +pip install llama-index-readers-zendesk +``` + This loader fetches the text from Zendesk help articles using the Zendesk API. It also uses the BeautifulSoup library to parse the HTML and extract the text from the articles. ## Usage @@ -7,9 +11,7 @@ This loader fetches the text from Zendesk help articles using the Zendesk API. 
I To use this loader, you need to pass in the subdomain of a Zendesk account. No authentication is required. You can also set the locale of articles as needed. ```python -from llama_index import download_loader - -ZendeskReader = download_loader("ZendeskReader") +from llama_index.readers.zendesk import ZendeskReader loader = ZendeskReader(zendesk_subdomain="my_subdomain", locale="en-us") documents = loader.load_data() diff --git a/llama-index-integrations/readers/llama-index-readers-zep/README.md b/llama-index-integrations/readers/llama-index-readers-zep/README.md index dae8826f386e9..5b940f9e853b7 100644 --- a/llama-index-integrations/readers/llama-index-readers-zep/README.md +++ b/llama-index-integrations/readers/llama-index-readers-zep/README.md @@ -1,5 +1,9 @@ # Zep Reader +```bash +pip install llama-index-readers-zep +``` + The Zep Reader returns a set of texts corresponding to a text query or embeddings retrieved from a Zep Collection. The Reader is initialized with a Zep API URL and optionally an API key. The Reader can then be used to load data from a Zep Document Collection. @@ -23,14 +27,13 @@ results. 
import time from uuid import uuid4 -from llama_index.node_parser import SimpleNodeParser -from llama_index.readers.schema import Document +from llama_index.core.node_parser import SimpleNodeParser +from llama_index.core import Document from zep_python import ZepClient from zep_python.document import Document as ZepDocument -from llama_index import download_loader -ZepReader = download_loader("ZepReader") +from llama_index.readers.zep import ZepReader # Create a Zep collection zep_api_url = "http://localhost:8000" # replace with your Zep API URL diff --git a/llama-index-integrations/retrievers/llama-index-retrievers-videodb/.gitignore b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/.gitignore new file mode 100644 index 0000000000000..990c18de22908 --- /dev/null +++ b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/.gitignore @@ -0,0 +1,153 @@ +llama_index/_static +.DS_Store +# Byte-compiled / optimized / DLL files +__pycache__/ +*.py[cod] +*$py.class + +# C extensions +*.so + +# Distribution / packaging +.Python +bin/ +build/ +develop-eggs/ +dist/ +downloads/ +eggs/ +.eggs/ +etc/ +include/ +lib/ +lib64/ +parts/ +sdist/ +share/ +var/ +wheels/ +pip-wheel-metadata/ +share/python-wheels/ +*.egg-info/ +.installed.cfg +*.egg +MANIFEST + +# PyInstaller +# Usually these files are written by a python script from a template +# before PyInstaller builds the exe, so as to inject date/other infos into it. 
+*.manifest +*.spec + +# Installer logs +pip-log.txt +pip-delete-this-directory.txt + +# Unit test / coverage reports +htmlcov/ +.tox/ +.nox/ +.coverage +.coverage.* +.cache +nosetests.xml +coverage.xml +*.cover +*.py,cover +.hypothesis/ +.pytest_cache/ +.ruff_cache + +# Translations +*.mo +*.pot + +# Django stuff: +*.log +local_settings.py +db.sqlite3 +db.sqlite3-journal + +# Flask stuff: +instance/ +.webassets-cache + +# Scrapy stuff: +.scrapy + +# Sphinx documentation +docs/_build/ + +# PyBuilder +target/ + +# Jupyter Notebook +.ipynb_checkpoints +notebooks/ + +# IPython +profile_default/ +ipython_config.py + +# pyenv +.python-version + +# pipenv +# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control. +# However, in case of collaboration, if having platform-specific dependencies or dependencies +# having no cross-platform support, pipenv may install dependencies that don't work, or not +# install all needed dependencies. +#Pipfile.lock + +# PEP 582; used by e.g. 
github.com/David-OConnor/pyflow +__pypackages__/ + +# Celery stuff +celerybeat-schedule +celerybeat.pid + +# SageMath parsed files +*.sage.py + +# Environments +.env +.venv +env/ +venv/ +ENV/ +env.bak/ +venv.bak/ +pyvenv.cfg + +# Spyder project settings +.spyderproject +.spyproject + +# Rope project settings +.ropeproject + +# mkdocs documentation +/site + +# mypy +.mypy_cache/ +.dmypy.json +dmypy.json + +# Pyre type checker +.pyre/ + +# Jetbrains +.idea +modules/ +*.swp + +# VsCode +.vscode + +# pipenv +Pipfile +Pipfile.lock + +# pyright +pyrightconfig.json diff --git a/llama-index-integrations/retrievers/llama-index-retrievers-videodb/BUILD b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/BUILD new file mode 100644 index 0000000000000..0896ca890d8bf --- /dev/null +++ b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/BUILD @@ -0,0 +1,3 @@ +poetry_requirements( + name="poetry", +) diff --git a/llama-index-integrations/retrievers/llama-index-retrievers-videodb/MAKEFILE b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/MAKEFILE new file mode 100644 index 0000000000000..b9eab05aa3706 --- /dev/null +++ b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/MAKEFILE @@ -0,0 +1,17 @@ +GIT_ROOT ?= $(shell git rev-parse --show-toplevel) + +help: ## Show all Makefile targets. + @grep -E '^[a-zA-Z_-]+:.*?## .*$$' $(MAKEFILE_LIST) | awk 'BEGIN {FS = ":.*?## "}; {printf "\033[33m%-30s\033[0m %s\n", $$1, $$2}' + +format: ## Run code autoformatters (black). + pre-commit install + git ls-files | xargs pre-commit run black --files + +lint: ## Run linters: pre-commit (black, ruff, codespell) and mypy + pre-commit install && git ls-files | xargs pre-commit run --show-diff-on-failure --files + +test: ## Run tests via pytest. + pytest tests + +watch-docs: ## Build and watch documentation. 
+ sphinx-autobuild docs/ docs/_build/html --open-browser --watch $(GIT_ROOT)/llama_index/ diff --git a/llama-index-integrations/retrievers/llama-index-retrievers-videodb/README.md b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/README.md new file mode 100644 index 0000000000000..a24da704669bd --- /dev/null +++ b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/README.md @@ -0,0 +1,34 @@ +# VideoDB Retriever + +## Overview + +[VideoDB](https://videodb.io) is a serverless database designed to streamline the storage, search, editing, and streaming of video content. VideoDB offers random access to sequential video data by building indexes and developing interfaces for querying and browsing video content. Learn more at [docs.videodb.io](https://docs.videodb.io). + +## Getting Started + +### Prerequisites + +- Obtain API keys from [VideoDB dashboard](https://console.videodb.io) + +### Installation + +Install the necessary packages with the following command: + +``` +pip install llama-index llama-index-retrievers-videodb videodb +``` + +## Building Your Pipeline + +1. **Data Ingestion**: Upload your videos to VideoDB and leverage its managed indexing for efficient data organization, choosing between semantic or scene-based indexing. +2. **Querying**: Utilize `VideoDBRetriever` to retrieve relevant video segments and `llama-index` for constructing your RAG pipeline, enhancing your LLM's context with video-based insights. + +## 👨‍👩‍👧‍👦 Support & Community + +If you have any questions or feedback, 
+please feel free to reach out to us: + +- [Discord](https://discord.gg/py9P639jGz) +- [Github](https://github.com/video-db) +- [VideoDB](https://videodb.io) +- [Email](mailto:ashu@videodb.io) diff --git a/llama-index-integrations/retrievers/llama-index-retrievers-videodb/llama_index/retrievers/videodb/BUILD b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/llama_index/retrievers/videodb/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/llama_index/retrievers/videodb/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-index-integrations/retrievers/llama-index-retrievers-videodb/llama_index/retrievers/videodb/__init__.py b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/llama_index/retrievers/videodb/__init__.py new file mode 100644 index 0000000000000..d32cd9bb921f7 --- /dev/null +++ b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/llama_index/retrievers/videodb/__init__.py @@ -0,0 +1,4 @@ +from llama_index.retrievers.videodb.base import VideoDBRetriever + + +__all__ = ["VideoDBRetriever"] diff --git a/llama-index-integrations/retrievers/llama-index-retrievers-videodb/llama_index/retrievers/videodb/base.py b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/llama_index/retrievers/videodb/base.py new file mode 100644 index 0000000000000..df317dac1486a --- /dev/null +++ b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/llama_index/retrievers/videodb/base.py @@ -0,0 +1,88 @@ +from llama_index.core.base.base_retriever import BaseRetriever +from llama_index.core.callbacks.base import CallbackManager +from llama_index.core.schema import NodeWithScore, QueryBundle, TextNode + +import logging +import os + +from typing import List, Optional +from videodb import connect + + +logger = logging.getLogger(__name__) + + +class SearchType: + keyword = "keyword" + semantic = "semantic" + 
+ +class VideoDBRetriever(BaseRetriever): + def __init__( + self, + api_key: Optional[str] = None, + collection: Optional[str] = "default", + video: Optional[str] = None, + score_threshold: Optional[float] = 0.2, + result_threshold: Optional[int] = 5, + search_type: Optional[str] = SearchType.semantic, + base_url: Optional[str] = None, + callback_manager: Optional[CallbackManager] = None, + ) -> None: + """Creates a new VideoDB Retriever.""" + if api_key is None: + api_key = os.environ.get("VIDEO_DB_API_KEY") + if api_key is None: + raise Exception( + "No API key provided. Set an API key either as an environment variable (VIDEO_DB_API_KEY) or pass it as an argument." + ) + self._api_key = api_key + self._base_url = base_url + self.video = video + self.collection = collection + self.score_threshold = score_threshold + self.result_threshold = result_threshold + self.search_type = search_type + super().__init__(callback_manager) + + def _retrieve(self, query_bundle: QueryBundle) -> List[NodeWithScore]: + """Retrieve.""" + kwargs = {"api_key": self._api_key} + if self._base_url is not None: + kwargs["base_url"] = self._base_url + conn = connect(**kwargs) + if self.video: + coll = conn.get_collection(self.collection) + video = coll.get_video(self.video) + search_res = video.search( + query_bundle.query_str, + search_type=self.search_type, + score_threshold=self.score_threshold, + result_threshold=self.result_threshold, + ) + else: + coll = conn.get_collection(self.collection) + search_res = coll.search( + query_bundle.query_str, + search_type=self.search_type, + score_threshold=self.score_threshold, + result_threshold=self.result_threshold, + ) + + nodes = [] + collection_id = search_res.collection_id + for shot in search_res.get_shots(): + score = shot.search_score + textnode = TextNode( + text=shot.text, + metadata={ + "collection_id": collection_id, + "video_id": shot.video_id, + "length": shot.video_length, + "title": shot.video_title, + "start": shot.start, + 
"end": shot.end, + }, + ) + nodes.append(NodeWithScore(node=textnode, score=score)) + return nodes diff --git a/llama-index-integrations/retrievers/llama-index-retrievers-videodb/pyproject.toml b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/pyproject.toml new file mode 100644 index 0000000000000..b0b5c24878516 --- /dev/null +++ b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/pyproject.toml @@ -0,0 +1,59 @@ +[build-system] +build-backend = "poetry.core.masonry.api" +requires = ["poetry-core"] + +[tool.codespell] +check-filenames = true +check-hidden = true +# Feel free to un-skip examples, and experimental, you will just need to +# work through many typos (--write-changes and --interactive will help) +skip = "*.csv,*.html,*.json,*.jsonl,*.pdf,*.txt,*.ipynb" + +[tool.llamahub] +classes = ["VideoDBRetriever"] +contains_example = true +import_path = "llama_index.retrievers.videodb" + +[tool.llamahub.class_authors] +VideoDBRetriever = "video-db" + +[tool.mypy] +disallow_untyped_defs = true +# Remove venv skip when integrated with pre-commit +exclude = ["_static", "build", "examples", "notebooks", "venv"] +ignore_missing_imports = true +python_version = "3.8" + +[tool.poetry] +authors = ["VideoDB "] +description = "llama-index VideoDB Retriever integration" +license = "MIT" +maintainers = ["Rohit Garg "] +name = "llama-index-retrievers-videodb" +packages = [{include = "llama_index/"}] +readme = "README.md" +version = "0.1.0" + +[tool.poetry.dependencies] +python = ">=3.8.1,<4.0" +llama-index-core = "^0.10.0" +videodb = "^0.0" + +[tool.poetry.group.dev.dependencies] +black = {extras = ["jupyter"], version = "<=23.9.1,>=23.7.0"} +codespell = {extras = ["toml"], version = ">=v2.2.6"} +ipython = "8.10.0" +jupyter = "^1.0.0" +mypy = "0.991" +pre-commit = "3.2.0" +pylint = "2.15.10" +pytest = "7.2.1" +pytest-mock = "3.11.1" +ruff = "0.0.292" +tree-sitter-languages = "^1.8.0" +types-Deprecated = ">=0.1.0" +types-PyYAML = "^6.0.12.12" 
+types-protobuf = "^4.24.0.4" +types-redis = "4.5.5.0" +types-requests = "2.28.11.8" # TODO: unpin when mypy>0.991 +types-setuptools = "67.1.0.0" diff --git a/llama-index-integrations/retrievers/llama-index-retrievers-videodb/tests/BUILD b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/tests/BUILD new file mode 100644 index 0000000000000..dabf212d7e716 --- /dev/null +++ b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/tests/BUILD @@ -0,0 +1 @@ +python_tests() diff --git a/llama-index-integrations/retrievers/llama-index-retrievers-videodb/tests/__init__.py b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/tests/__init__.py new file mode 100644 index 0000000000000..e69de29bb2d1d diff --git a/llama-index-integrations/retrievers/llama-index-retrievers-videodb/tests/test_retrievers_videdb.py b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/tests/test_retrievers_videdb.py new file mode 100644 index 0000000000000..63e6392e00d6f --- /dev/null +++ b/llama-index-integrations/retrievers/llama-index-retrievers-videodb/tests/test_retrievers_videdb.py @@ -0,0 +1,7 @@ +from llama_index.core.base.base_retriever import BaseRetriever +from llama_index.retrievers.videodb import VideoDBRetriever + + +def test_class(): + names_of_base_classes = [b.__name__ for b in VideoDBRetriever.__mro__] + assert BaseRetriever.__name__ in names_of_base_classes diff --git a/llama-index-integrations/tools/llama-index-tools-arxiv/README.md b/llama-index-integrations/tools/llama-index-tools-arxiv/README.md index 7faed436c7979..32b4f0b0c7927 100644 --- a/llama-index-integrations/tools/llama-index-tools-arxiv/README.md +++ b/llama-index-integrations/tools/llama-index-tools-arxiv/README.md @@ -10,7 +10,7 @@ Here's an example usage of the ArxivToolSpec. 
```python from llama_index.tools.arxiv import ArxivToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent tool_spec = ArxivToolSpec() diff --git a/llama-index-integrations/tools/llama-index-tools-azure-cv/README.md b/llama-index-integrations/tools/llama-index-tools-azure-cv/README.md index d63a39a2020a6..4005de47f5af2 100644 --- a/llama-index-integrations/tools/llama-index-tools-azure-cv/README.md +++ b/llama-index-integrations/tools/llama-index-tools-azure-cv/README.md @@ -12,7 +12,7 @@ Here's an example usage of the AzureCVToolSpec. ```python from llama_index.tools.azure_cv import AzureCVToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent tool_spec = AzureCVToolSpec(api_key="your-key", resource="your-resource") diff --git a/llama-index-integrations/tools/llama-index-tools-azure-speech/README.md b/llama-index-integrations/tools/llama-index-tools-azure-speech/README.md index 227278529a138..d0e573a223a3a 100644 --- a/llama-index-integrations/tools/llama-index-tools-azure-speech/README.md +++ b/llama-index-integrations/tools/llama-index-tools-azure-speech/README.md @@ -8,7 +8,7 @@ This tool has a more extensive example usage documented in a Jupyter notebook [h ```python from llama_index.tools.azure_speech import AzureSpeechToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent speech_tool = AzureSpeechToolSpec(speech_key="your-key", region="eastus") diff --git a/llama-index-integrations/tools/llama-index-tools-azure-translate/README.md b/llama-index-integrations/tools/llama-index-tools-azure-translate/README.md index 69124ea986f0d..ce5554c1b8102 100644 --- a/llama-index-integrations/tools/llama-index-tools-azure-translate/README.md +++ b/llama-index-integrations/tools/llama-index-tools-azure-translate/README.md @@ -13,7 +13,7 @@ This tool has a more extensive example usage documented in a Jupyter notebook [h Here's an example 
usage of the AzureTranslateToolSpec. ```python -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent from llama_index.tools.azure_translate import AzureTranslateToolSpec translate_tool = AzureTranslateToolSpec(api_key="your-key", region="eastus") diff --git a/llama-index-integrations/tools/llama-index-tools-bing-search/README.md b/llama-index-integrations/tools/llama-index-tools-bing-search/README.md index 762c18eecd7be..d23c9f8773c6e 100644 --- a/llama-index-integrations/tools/llama-index-tools-bing-search/README.md +++ b/llama-index-integrations/tools/llama-index-tools-bing-search/README.md @@ -12,7 +12,7 @@ Here's an example usage of the BingSearchToolSpec. ```python from llama_index.tools.bing_search import BingSearchToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent tool_spec = BingSearchToolSpec(api_key="your-key") diff --git a/llama-index-integrations/tools/llama-index-tools-chatgpt-plugin/README.md b/llama-index-integrations/tools/llama-index-tools-chatgpt-plugin/README.md index 6e607721802c9..e17ade24dd852 100644 --- a/llama-index-integrations/tools/llama-index-tools-chatgpt-plugin/README.md +++ b/llama-index-integrations/tools/llama-index-tools-chatgpt-plugin/README.md @@ -17,7 +17,7 @@ f = requests.get( manifest = yaml.safe_load(f) from llama_index.tools.chatgpt_plugin import ChatGPTPluginToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent from llama_index.tools.requests import RequestsToolSpec requests_spec = RequestsToolSpec() diff --git a/llama-index-integrations/tools/llama-index-tools-code-interpreter/README.md b/llama-index-integrations/tools/llama-index-tools-code-interpreter/README.md index 879fb398d942e..82bf5353c6056 100644 --- a/llama-index-integrations/tools/llama-index-tools-code-interpreter/README.md +++ b/llama-index-integrations/tools/llama-index-tools-code-interpreter/README.md @@ -12,7 +12,7 @@ 
Here's an example usage of the CodeInterpreterToolSpec. ```python from llama_index.tools.code_interpreter import CodeInterpreterToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent code_spec = CodeInterpreterToolSpec() diff --git a/llama-index-integrations/tools/llama-index-tools-cogniswitch/README.md b/llama-index-integrations/tools/llama-index-tools-cogniswitch/README.md index deb89d56e1aff..e90f35f43cb12 100644 --- a/llama-index-integrations/tools/llama-index-tools-cogniswitch/README.md +++ b/llama-index-integrations/tools/llama-index-tools-cogniswitch/README.md @@ -36,7 +36,7 @@ import warnings warnings.filterwarnings("ignore") import os from llama_index.tools.cogniswitch import CogniswitchToolSpec -from llama_index.agent import ReActAgent +from llama_index.core.agent import ReActAgent ``` ### Cogniswitch Credentials and OpenAI token diff --git a/llama-index-integrations/tools/llama-index-tools-database/README.md b/llama-index-integrations/tools/llama-index-tools-database/README.md index 28d91a29c4b01..e7e7e84257a83 100644 --- a/llama-index-integrations/tools/llama-index-tools-database/README.md +++ b/llama-index-integrations/tools/llama-index-tools-database/README.md @@ -10,7 +10,7 @@ Here's an example usage of the DatabaseToolSpec. ```python from llama_index.tools.database import DatabaseToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent db_tools = DatabaseToolSpec( scheme="postgresql", # Database Scheme diff --git a/llama-index-integrations/tools/llama-index-tools-duckduckgo/README.md b/llama-index-integrations/tools/llama-index-tools-duckduckgo/README.md index 81cea3fd91fa7..2eabbc8288d87 100644 --- a/llama-index-integrations/tools/llama-index-tools-duckduckgo/README.md +++ b/llama-index-integrations/tools/llama-index-tools-duckduckgo/README.md @@ -10,7 +10,7 @@ Here's an example usage of the DuckDuckGoSearchToolSpec. 
```python from llama_index.tools.duckduckgo import DuckDuckGoSearchToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent tool_spec = DuckDuckGoSearchToolSpec() diff --git a/llama-index-integrations/tools/llama-index-tools-exa/README.md b/llama-index-integrations/tools/llama-index-tools-exa/README.md index c1bbf5d78588b..0bd2e13572172 100644 --- a/llama-index-integrations/tools/llama-index-tools-exa/README.md +++ b/llama-index-integrations/tools/llama-index-tools-exa/README.md @@ -13,9 +13,7 @@ Here's an example usage of the ExaToolSpec. ```python from llama_index.tools.exa import ExaToolSpec -from llama_index.agent.openai import ( - OpenAIAgent, -) # requires llama-index-agent-openai +from llama_index.agent.openai import OpenAIAgent exa_tool = ExaToolSpec( api_key="your-key", diff --git a/llama-index-integrations/tools/llama-index-tools-graphql/README.md b/llama-index-integrations/tools/llama-index-tools-graphql/README.md index 669e3638ff08a..7924ba3637a16 100644 --- a/llama-index-integrations/tools/llama-index-tools-graphql/README.md +++ b/llama-index-integrations/tools/llama-index-tools-graphql/README.md @@ -12,7 +12,7 @@ This tool works best when the Agent has access to the GraphQL schema for the ser ```python from llama_index.tools.graphql import GraphQLToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent tool_spec = GraphQLToolSpec( url="https://spacex-production.up.railway.app/", diff --git a/llama-index-integrations/tools/llama-index-tools-ionic-shopping/README.md b/llama-index-integrations/tools/llama-index-tools-ionic-shopping/README.md index c4cf64e448b29..57670a76558f3 100644 --- a/llama-index-integrations/tools/llama-index-tools-ionic-shopping/README.md +++ b/llama-index-integrations/tools/llama-index-tools-ionic-shopping/README.md @@ -1,5 +1,9 @@ # LlamaIndex Tools Integration: Ionic Shopping +```bash +pip install llama-index-tools-ionic-shopping +``` + 
[Ionic](https://ioniccommerce.com) is a plug and play ecommerce marketplace for AI Assistants. By including the Ionic Tool in your agent, you are effortlessly providing your users with the ability to shop and transact directly within your agent, and you’ll get a cut of the transaction. @@ -10,7 +14,7 @@ Llearn more about how [Ionic attributes sales](https://docs.ioniccommerce.com/gu to your agent. Provide your Ionic API Key when instantiating the tool: ```python -from llama_hub.tools.ionic_shopping.base import IonicShoppingToolSpec +from llama_index.tools.ionic_shopping import IonicShoppingToolSpec ionic_tool = IonicShoppingToolSpec(api_key="").to_tool_list() ``` @@ -21,8 +25,10 @@ Try it out using the [Jupyter notebook](https://github.com/run-llama/llama-hub/b ```python import openai -from llama_index.agent import OpenAIAgent # requires llama-index-agent-openai -from llama_hub.tools.ionic_shopping.base import IonicShoppingToolSpec +from llama_index.agent.openai import ( + OpenAIAgent, +) # requires llama-index-agent-openai +from llama_index.tools.ionic_shopping import IonicShoppingToolSpec openai.api_key = "sk-api-key" diff --git a/llama-index-integrations/tools/llama-index-tools-metaphor/README.md b/llama-index-integrations/tools/llama-index-tools-metaphor/README.md index 067f5964aece5..21f0d0514dc5d 100644 --- a/llama-index-integrations/tools/llama-index-tools-metaphor/README.md +++ b/llama-index-integrations/tools/llama-index-tools-metaphor/README.md @@ -19,7 +19,7 @@ Here's an example usage of the MetaphorToolSpec. 
```python from llama_index.tools.metaphor import MetaphorToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent metaphor_tool = MetaphorToolSpec( api_key="your-key", diff --git a/llama-index-integrations/tools/llama-index-tools-multion/README.md b/llama-index-integrations/tools/llama-index-tools-multion/README.md index 9788c99f3c1aa..5eb221b6d3560 100644 --- a/llama-index-integrations/tools/llama-index-tools-multion/README.md +++ b/llama-index-integrations/tools/llama-index-tools-multion/README.md @@ -1,5 +1,9 @@ # MultiOn Tool +```bash +pip install llama-index-tools-multion +``` + This tool connects to [MultiOn](https://www.multion.ai/) to enable your agent to easily connect to the internet through your Chrome Web browser and act on your behalf @@ -13,8 +17,8 @@ This tool has more a extensive example usage documented in a Jupyter notebook [h Here's an example usage of the MultionToolSpec. ```python -from llama_index.tools.metaphor import MultionToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.tools.multion import MultionToolSpec +from llama_index.agent.openai import OpenAIAgent multion_tool = MultionToolSpec() diff --git a/llama-index-integrations/tools/llama-index-tools-neo4j/README.md b/llama-index-integrations/tools/llama-index-tools-neo4j/README.md index 1f30d99f8bc10..9ae5a9c10b4f4 100644 --- a/llama-index-integrations/tools/llama-index-tools-neo4j/README.md +++ b/llama-index-integrations/tools/llama-index-tools-neo4j/README.md @@ -1,5 +1,9 @@ # Neo4j Schema Query Builder +```bash +pip install llama-index-tools-neo4j +``` + The `Neo4jQueryToolSpec` class provides a way to query a Neo4j graph database based on a provided schema definition. The class uses a language model to generate Cypher queries from user questions and has the capability to recover from Cypher syntax errors through a self-healing mechanism. 
## Table of Contents @@ -16,9 +20,9 @@ The `Neo4jQueryToolSpec` class provides a way to query a Neo4j graph database ba Initialize the `Neo4jQueryToolSpec` class with: ```python -from llama_index.tools.neo4j_db import Neo4jQueryToolSpec -from llama_index.llms import OpenAI -from llama_index.agent import OpenAIAgent +from llama_index.tools.neo4j import Neo4jQueryToolSpec +from llama_index.llms.openai import OpenAI +from llama_index.agent.openai import OpenAIAgent llm = OpenAI(model="gpt-4", openai_api_key="XXXX-XXXX", temperature=0) diff --git a/llama-index-integrations/tools/llama-index-tools-notion/README.md b/llama-index-integrations/tools/llama-index-tools-notion/README.md index 9b574669358fd..6945e6ad9e458 100644 --- a/llama-index-integrations/tools/llama-index-tools-notion/README.md +++ b/llama-index-integrations/tools/llama-index-tools-notion/README.md @@ -10,7 +10,7 @@ Here's an example usage of the NotionToolSpec. ```python from llama_index.tools.notion import NotionToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent tool_spec = NotionToolSpec() diff --git a/llama-index-integrations/tools/llama-index-tools-openai/README.md b/llama-index-integrations/tools/llama-index-tools-openai/README.md index f91e6ad6d7b63..fb1c3367fcbe5 100644 --- a/llama-index-integrations/tools/llama-index-tools-openai/README.md +++ b/llama-index-integrations/tools/llama-index-tools-openai/README.md @@ -9,9 +9,7 @@ This tool has a more extensive example usage documented in a Jupyter notebook [h ### Usage with Agent ```python -from llama_index.tools.openai.image_generation import ( - OpenAIImageGenerationToolSpec, -) +from llama_index.tools.openai import OpenAIImageGenerationToolSpec image_generation_tool = OpenAIImageGenerationToolSpec( api_key=os.environ["OPENAI_API_KEY"] @@ -32,9 +30,7 @@ print(response) ### Usage directly ```python -from llama_index.tools.openai.image_generation import ( - OpenAIImageGenerationToolSpec, -) +from 
llama_index.tools.openai import OpenAIImageGenerationToolSpec image_generation_tool = OpenAIImageGenerationToolSpec( api_key=os.environ["OPENAI_API_KEY"] diff --git a/llama-index-integrations/tools/llama-index-tools-openapi/README.md b/llama-index-integrations/tools/llama-index-tools-openapi/README.md index c010ad25e1260..58bda6d03d99a 100644 --- a/llama-index-integrations/tools/llama-index-tools-openapi/README.md +++ b/llama-index-integrations/tools/llama-index-tools-openapi/README.md @@ -1,5 +1,9 @@ # OpenAPI Tool +```bash +pip install llama-index-tools-openapi +``` + This tool loads an OpenAPI spec and allow the Agent to retrieve endpoints and details about endpoints. The RequestsToolSpec can also be loaded into the agent to allow the agent to hit the necessary endpoints with a REST request. ## Usage @@ -9,8 +13,8 @@ This tool has more extensive example usage documented in a Jupyter notebook [her Here's an example usage of the OpenAPIToolSpec. ```python -from llama_hub.tools.openapi import OpenAPIToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.tools.openapi import OpenAPIToolSpec +from llama_index.agent.openai import OpenAIAgent f = requests.get( "https://raw.githubusercontent.com/APIs-guru/openapi-directory/main/APIs/openai.com/1.2.0/openapi.yaml" diff --git a/llama-index-integrations/tools/llama-index-tools-playgrounds/README.md b/llama-index-integrations/tools/llama-index-tools-playgrounds/README.md index 084401a3da10a..10e41c325aeb3 100644 --- a/llama-index-integrations/tools/llama-index-tools-playgrounds/README.md +++ b/llama-index-integrations/tools/llama-index-tools-playgrounds/README.md @@ -2,6 +2,10 @@ ## playgrounds_subgraph_connector +```bash +pip install llama-index-tools-playgrounds +``` + Playgrounds API is a service provided by [Playgrounds Analytics](https://playgrounds.network) to streamline interfacing with decentralized subgraphs (indexed blockchain datasets). 
The `PlaygroundsSubgraphConnector` is a tool designed for LLM agents to seamlessly interface with and query subgraphs on The Graph's decentralized network via Playgrounds API. @@ -23,10 +27,8 @@ To utilize the tool, simply initialize it with the appropriate `identifier` (Sub ```python import openai -from llama_index.agent import OpenAIAgent -from llama_index.tools.playgrounds_subgraph_connector import ( - PlaygroundsSubgraphConnectorToolSpec, -) +from llama_index.agent.openai import OpenAIAgent +from llama_index.tools.playgrounds import PlaygroundsSubgraphConnectorToolSpec def simple_test(): @@ -85,10 +87,8 @@ To utilize the tool, initialize it with the appropriate `identifier` (Subgraph I ```python import openai -from llama_index.agent import OpenAIAgent -from llama_index.tools.playgrounds_subgraph_inspector import ( - PlaygroundsSubgraphInspectorToolSpec, -) +from llama_index.agent.openai import OpenAIAgent +from llama_index.tools.playgrounds import PlaygroundsSubgraphInspectorToolSpec def inspect_subgraph( diff --git a/llama-index-integrations/tools/llama-index-tools-python-file/README.md b/llama-index-integrations/tools/llama-index-tools-python-file/README.md index bb21b84c7705e..424ed6212d2f5 100644 --- a/llama-index-integrations/tools/llama-index-tools-python-file/README.md +++ b/llama-index-integrations/tools/llama-index-tools-python-file/README.md @@ -10,7 +10,7 @@ Here's an example usage of the PythonFileToolSpec. 
```python from llama_index.tools.python_file import PythonFileToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent pyfile = PythonFileToolSpec("./numpy_linalg.py") diff --git a/llama-index-integrations/tools/llama-index-tools-requests/README.md b/llama-index-integrations/tools/llama-index-tools-requests/README.md index ae2b99dc1a7e1..541f772c584d3 100644 --- a/llama-index-integrations/tools/llama-index-tools-requests/README.md +++ b/llama-index-integrations/tools/llama-index-tools-requests/README.md @@ -12,7 +12,7 @@ Here's an example usage of the RequestsToolSpec. ```python from llama_index.tools.requests import RequestsToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent domain_headers = { "api.openai.com": { diff --git a/llama-index-integrations/tools/llama-index-tools-shopify/README.md b/llama-index-integrations/tools/llama-index-tools-shopify/README.md index 32f530f504e77..c316c2f41f5f4 100644 --- a/llama-index-integrations/tools/llama-index-tools-shopify/README.md +++ b/llama-index-integrations/tools/llama-index-tools-shopify/README.md @@ -8,12 +8,16 @@ This tool has more extensive example usage documented in a Jupyter notebook [her In particular, the tool is very effective when combined with a method of retrieving data from the GraphQL schema definition. 
+```bash +pip install llama-index llama-index-readers-file llama-index-tools-shopify unstructured +``` + ```python from llama_index.tools.shopify import ShopifyToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent -from llama_index.file.unstructured import UnstructuredReader -from llama_index.tools.ondemand_loader_tool import OnDemandLoaderTool +from llama_index.readers.file import UnstructuredReader +from llama_index.core.tools.ondemand_loader_tool import OnDemandLoaderTool documentation_tool = OnDemandLoaderTool.from_defaults( UnstructuredReader(), diff --git a/llama-index-integrations/tools/llama-index-tools-slack/README.md b/llama-index-integrations/tools/llama-index-tools-slack/README.md index 50eef495a8227..77a5fc2fdd4c9 100644 --- a/llama-index-integrations/tools/llama-index-tools-slack/README.md +++ b/llama-index-integrations/tools/llama-index-tools-slack/README.md @@ -6,7 +6,7 @@ This tool fetches the text from a list of Slack channels. You will need to initi ```python from llama_index.tools.slack import SlackToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent tool_spec = SlackToolSpec(slack_token="token") diff --git a/llama-index-integrations/tools/llama-index-tools-tavily-research/README.md b/llama-index-integrations/tools/llama-index-tools-tavily-research/README.md index 36ed8c5aee8a2..60a1bc317be0f 100644 --- a/llama-index-integrations/tools/llama-index-tools-tavily-research/README.md +++ b/llama-index-integrations/tools/llama-index-tools-tavily-research/README.md @@ -20,7 +20,7 @@ Here's an example usage of the TavilyToolSpec. 
```python from llama_index.tools.tavily_research import TavilyToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent tavily_tool = TavilyToolSpec( api_key="your-key", diff --git a/llama-index-integrations/tools/llama-index-tools-text-to-image/README.md b/llama-index-integrations/tools/llama-index-tools-text-to-image/README.md index 32c697453d579..5c6a010901235 100644 --- a/llama-index-integrations/tools/llama-index-tools-text-to-image/README.md +++ b/llama-index-integrations/tools/llama-index-tools-text-to-image/README.md @@ -10,7 +10,7 @@ Another example showcases retrieval augmentation over a knowledge corpus with te ```python from llama_index.tools.text_to_image import TextToImageToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent openai.api_key = "sk-your-key" tool_spec = TextToImageToolSpec() diff --git a/llama-index-integrations/tools/llama-index-tools-vector-db/README.md b/llama-index-integrations/tools/llama-index-tools-vector-db/README.md index d7a7140a7f96f..69f377837f590 100644 --- a/llama-index-integrations/tools/llama-index-tools-vector-db/README.md +++ b/llama-index-integrations/tools/llama-index-tools-vector-db/README.md @@ -6,9 +6,9 @@ This tool wraps a VectorStoreIndex and enables a agent to call it with queries a ```python from llama_index.tools.vector_db import VectorDB -from llama_index.agent import OpenAIAgent -from llama_index.vector_stores.types import VectorStoreInfo -from llama_index import VectorStoreIndex +from llama_index.agent.openai import OpenAIAgent +from llama_index.core.vector_stores import VectorStoreInfo +from llama_index.core import VectorStoreIndex index = VectorStoreIndex(nodes=nodes) tool_spec = VectorDB(index=index) diff --git a/llama-index-integrations/tools/llama-index-tools-waii/README.md b/llama-index-integrations/tools/llama-index-tools-waii/README.md index f1b5c6ca291ad..1da3f82813084 100644 --- 
a/llama-index-integrations/tools/llama-index-tools-waii/README.md +++ b/llama-index-integrations/tools/llama-index-tools-waii/README.md @@ -52,8 +52,8 @@ print(index.query("Which table contains most columns?")) #### Initialize the agent: ```python -from llama_index.agent import OpenAIAgent -from llama_index.llms import OpenAI +from llama_index.agent.openai import OpenAIAgent +from llama_index.llms.openai import OpenAI agent = OpenAIAgent.from_tools( waii_tool.to_tool_list(), llm=OpenAI(model="gpt-4-1106-preview") diff --git a/llama-index-integrations/tools/llama-index-tools-weather/README.md b/llama-index-integrations/tools/llama-index-tools-weather/README.md index 251f674566450..434a965cca14e 100644 --- a/llama-index-integrations/tools/llama-index-tools-weather/README.md +++ b/llama-index-integrations/tools/llama-index-tools-weather/README.md @@ -13,7 +13,7 @@ Here's an example usage of the OpenWeatherMapToolSpec. ```python from llama_index.tools.weather import OpenWeatherMapToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent tool_spec = OpenWeatherMapToolSpec(key="...") diff --git a/llama-index-integrations/tools/llama-index-tools-wikipedia/README.md b/llama-index-integrations/tools/llama-index-tools-wikipedia/README.md index 0b6915d30da48..9c8e83aa66f0b 100644 --- a/llama-index-integrations/tools/llama-index-tools-wikipedia/README.md +++ b/llama-index-integrations/tools/llama-index-tools-wikipedia/README.md @@ -8,7 +8,7 @@ This tool has more extensive example usage documented in a Jupyter notebook [her ```python from llama_index.tools.wikipedia import WikipediaToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent tool_spec = WikipediaToolSpec() diff --git a/llama-index-integrations/tools/llama-index-tools-wolfram-alpha/README.md b/llama-index-integrations/tools/llama-index-tools-wolfram-alpha/README.md index d7dc202b317fb..c6619a7015cae 100644 --- 
a/llama-index-integrations/tools/llama-index-tools-wolfram-alpha/README.md +++ b/llama-index-integrations/tools/llama-index-tools-wolfram-alpha/README.md @@ -12,7 +12,7 @@ Here's an example usage of the WolframAlphaToolSpec. ```python from llama_index.tools.wolfram_alpha import WolframAlphaToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent wolfram_spec = WolframAlphaToolSpec(app_id="API-key") diff --git a/llama-index-integrations/tools/llama-index-tools-yahoo-finance/README.md b/llama-index-integrations/tools/llama-index-tools-yahoo-finance/README.md index 21779bb953c08..b2c3a4ef84692 100644 --- a/llama-index-integrations/tools/llama-index-tools-yahoo-finance/README.md +++ b/llama-index-integrations/tools/llama-index-tools-yahoo-finance/README.md @@ -8,7 +8,7 @@ Here's an example of how to use this tool: ```python from llama_index.tools.yahoo_finance import YahooFinanceToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent tool_spec = YahooFinanceToolSpec() agent = OpenAIAgent.from_tools(tool_spec.to_tool_list()) diff --git a/llama-index-integrations/tools/llama-index-tools-zapier/README.md b/llama-index-integrations/tools/llama-index-tools-zapier/README.md index d26c068576aa8..cb3060d8299e5 100644 --- a/llama-index-integrations/tools/llama-index-tools-zapier/README.md +++ b/llama-index-integrations/tools/llama-index-tools-zapier/README.md @@ -10,7 +10,7 @@ Here's an example usage of the ZapierToolSpec. 
```python from llama_index.tools.zapier import ZapierToolSpec -from llama_index.agent import OpenAIAgent +from llama_index.agent.openai import OpenAIAgent zapier_spec = ZapierToolSpec(api_key="sk-ak-your-key") diff --git a/llama-index-integrations/vector_stores/llama-index-vector-stores-azurecosmosmongo/llama_index/vector_stores/azurecosmosmongo/base.py b/llama-index-integrations/vector_stores/llama-index-vector-stores-azurecosmosmongo/llama_index/vector_stores/azurecosmosmongo/base.py index 146807f16a136..9eb6dd10c166e 100644 --- a/llama-index-integrations/vector_stores/llama-index-vector-stores-azurecosmosmongo/llama_index/vector_stores/azurecosmosmongo/base.py +++ b/llama-index-integrations/vector_stores/llama-index-vector-stores-azurecosmosmongo/llama_index/vector_stores/azurecosmosmongo/base.py @@ -3,14 +3,16 @@ An index that is built on top of an existing vector store. """ + import logging import os from typing import Any, Dict, List, Optional, cast import pymongo +from llama_index.core.bridge.pydantic import PrivateAttr from llama_index.core.schema import BaseNode, MetadataMode, TextNode from llama_index.core.vector_stores.types import ( - VectorStore, + BasePydanticVectorStore, VectorStoreQuery, VectorStoreQueryResult, ) @@ -23,7 +25,7 @@ logger = logging.getLogger(__name__) -class AzureCosmosDBMongoDBVectorSearch(VectorStore): +class AzureCosmosDBMongoDBVectorSearch(BasePydanticVectorStore): """Azure CosmosDB MongoDB vCore Vector Store. 
To use, you should have both: @@ -34,6 +36,18 @@ class AzureCosmosDBMongoDBVectorSearch(VectorStore): stores_text: bool = True flat_metadata: bool = True + _collection: Any = PrivateAttr() + _index_name: str = PrivateAttr() + _embedding_key: str = PrivateAttr() + _id_key: str = PrivateAttr() + _text_key: str = PrivateAttr() + _metadata_key: str = PrivateAttr() + _insert_kwargs: dict = PrivateAttr() + _db_name: str = PrivateAttr() + _collection_name: str = PrivateAttr() + _cosmos_search_kwargs: dict = PrivateAttr() + _mongodb_client: Any = PrivateAttr() + def __init__( self, mongodb_client: Optional[Any] = None, @@ -65,6 +79,8 @@ def __init__( contain search options, such as kind, numLists, similarity, and dimensions. insert_kwargs: The kwargs used during `insert`. """ + super().__init__() + if mongodb_client is not None: self._mongodb_client = cast(pymongo.MongoClient, mongodb_client) else: diff --git a/llama-index-integrations/vector_stores/llama-index-vector-stores-azurecosmosmongo/pyproject.toml b/llama-index-integrations/vector_stores/llama-index-vector-stores-azurecosmosmongo/pyproject.toml index f3be49f41cbea..ed34b87db49fe 100644 --- a/llama-index-integrations/vector_stores/llama-index-vector-stores-azurecosmosmongo/pyproject.toml +++ b/llama-index-integrations/vector_stores/llama-index-vector-stores-azurecosmosmongo/pyproject.toml @@ -27,7 +27,7 @@ exclude = ["**/BUILD"] license = "MIT" name = "llama-index-vector-stores-azurecosmosmongo" readme = "README.md" -version = "0.1.2" +version = "0.1.3" [tool.poetry.dependencies] python = ">=3.8.1,<4.0" diff --git a/llama-index-integrations/vector_stores/llama-index-vector-stores-azurecosmosmongo/tests/test_vector_stores_azurecosmosmongo.py b/llama-index-integrations/vector_stores/llama-index-vector-stores-azurecosmosmongo/tests/test_vector_stores_azurecosmosmongo.py index 30ed0dd360de6..04f035c4c26ec 100644 --- 
a/llama-index-integrations/vector_stores/llama-index-vector-stores-azurecosmosmongo/tests/test_vector_stores_azurecosmosmongo.py +++ b/llama-index-integrations/vector_stores/llama-index-vector-stores-azurecosmosmongo/tests/test_vector_stores_azurecosmosmongo.py @@ -1,4 +1,4 @@ -from llama_index.core.vector_stores.types import VectorStore +from llama_index.core.vector_stores.types import BasePydanticVectorStore from llama_index.vector_stores.azurecosmosmongo import AzureCosmosDBMongoDBVectorSearch @@ -6,4 +6,4 @@ def test_class(): names_of_base_classes = [ b.__name__ for b in AzureCosmosDBMongoDBVectorSearch.__mro__ ] - assert VectorStore.__name__ in names_of_base_classes + assert BasePydanticVectorStore.__name__ in names_of_base_classes diff --git a/llama-index-integrations/vector_stores/llama-index-vector-stores-clickhouse/llama_index/vector_stores/clickhouse/base.py b/llama-index-integrations/vector_stores/llama-index-vector-stores-clickhouse/llama_index/vector_stores/clickhouse/base.py index 7f8d306d6a3b5..c10f2b206153f 100644 --- a/llama-index-integrations/vector_stores/llama-index-vector-stores-clickhouse/llama_index/vector_stores/clickhouse/base.py +++ b/llama-index-integrations/vector_stores/llama-index-vector-stores-clickhouse/llama_index/vector_stores/clickhouse/base.py @@ -3,15 +3,15 @@ An index that is built on top of an existing ClickHouse cluster. 
""" + import importlib import json import logging import re from typing import Any, Dict, List, Optional, cast -from pydantic import PrivateAttr - from llama_index.core import ServiceContext +from llama_index.core.bridge.pydantic import PrivateAttr from llama_index.core.schema import ( BaseNode, MetadataMode, diff --git a/llama-index-integrations/vector_stores/llama-index-vector-stores-clickhouse/pyproject.toml b/llama-index-integrations/vector_stores/llama-index-vector-stores-clickhouse/pyproject.toml index 3989d9967b141..a43bfd3335635 100644 --- a/llama-index-integrations/vector_stores/llama-index-vector-stores-clickhouse/pyproject.toml +++ b/llama-index-integrations/vector_stores/llama-index-vector-stores-clickhouse/pyproject.toml @@ -27,7 +27,7 @@ exclude = ["**/BUILD"] license = "MIT" name = "llama-index-vector-stores-clickhouse" readme = "README.md" -version = "0.1.2" +version = "0.1.3" [tool.poetry.dependencies] python = ">=3.8.1,<4.0" diff --git a/llama-index-integrations/vector_stores/llama-index-vector-stores-milvus/llama_index/vector_stores/milvus/base.py b/llama-index-integrations/vector_stores/llama-index-vector-stores-milvus/llama_index/vector_stores/milvus/base.py index 6358c077dc5be..c152cc89c7f45 100644 --- a/llama-index-integrations/vector_stores/llama-index-vector-stores-milvus/llama_index/vector_stores/milvus/base.py +++ b/llama-index-integrations/vector_stores/llama-index-vector-stores-milvus/llama_index/vector_stores/milvus/base.py @@ -273,7 +273,7 @@ def query(self, query: VectorStoreQuery, **kwargs: Any) -> VectorStoreQueryResul # Convert to string expression string_expr = "" if len(expr) != 0: - string_expr = " and ".join(expr) + string_expr = f" {query.filters.condition.value} ".join(expr) # Perform the search res = self._milvusclient.search( diff --git a/llama-index-integrations/vector_stores/llama-index-vector-stores-opensearch/llama_index/vector_stores/opensearch/base.py 
b/llama-index-integrations/vector_stores/llama-index-vector-stores-opensearch/llama_index/vector_stores/opensearch/base.py index 508ef45752dea..baf04a321c8eb 100644 --- a/llama-index-integrations/vector_stores/llama-index-vector-stores-opensearch/llama_index/vector_stores/opensearch/base.py +++ b/llama-index-integrations/vector_stores/llama-index-vector-stores-opensearch/llama_index/vector_stores/opensearch/base.py @@ -1,7 +1,12 @@ """Elasticsearch/Opensearch vector store.""" + +import asyncio import json import uuid from typing import Any, Dict, Iterable, List, Optional, Union, cast + +import nest_asyncio + from llama_index.core.bridge.pydantic import PrivateAttr from llama_index.core.schema import BaseNode, MetadataMode, TextNode @@ -16,9 +21,9 @@ metadata_dict_to_node, node_to_metadata_dict, ) -from opensearchpy import OpenSearch +from opensearchpy import AsyncOpenSearch from opensearchpy.exceptions import NotFoundError -from opensearchpy.helpers import bulk +from opensearchpy.helpers import async_bulk IMPORT_OPENSEARCH_PY_ERROR = ( "Could not import OpenSearch. Please install it with `pip install opensearch-py`." 
@@ -29,14 +34,14 @@ MATCH_ALL_QUERY = {"match_all": {}} # type: Dict -def _import_opensearch() -> Any: +def _import_async_opensearch() -> Any: """Import OpenSearch if available, otherwise raise error.""" - return OpenSearch + return AsyncOpenSearch -def _import_bulk() -> Any: +def _import_async_bulk() -> Any: """Import bulk if available, otherwise raise error.""" - return bulk + return async_bulk def _import_not_found_error() -> Any: @@ -44,21 +49,21 @@ def _import_not_found_error() -> Any: return NotFoundError -def _get_opensearch_client(opensearch_url: str, **kwargs: Any) -> Any: - """Get OpenSearch client from the opensearch_url, otherwise raise error.""" +def _get_async_opensearch_client(opensearch_url: str, **kwargs: Any) -> Any: + """Get AsyncOpenSearch client from the opensearch_url, otherwise raise error.""" try: - opensearch = _import_opensearch() + opensearch = _import_async_opensearch() client = opensearch(opensearch_url, **kwargs) except ValueError as e: raise ValueError( - f"OpenSearch client string provided is not in proper format. " + f"AsyncOpenSearch client string provided is not in proper format. 
" f"Got error: {e} " ) return client -def _bulk_ingest_embeddings( +async def _bulk_ingest_embeddings( client: Any, index_name: str, embeddings: List[List[float]], @@ -71,20 +76,20 @@ def _bulk_ingest_embeddings( max_chunk_bytes: Optional[int] = 1 * 1024 * 1024, is_aoss: bool = False, ) -> List[str]: - """Bulk Ingest Embeddings into given index.""" + """Async Bulk Ingest Embeddings into given index.""" if not mapping: mapping = {} - bulk = _import_bulk() + async_bulk = _import_async_bulk() not_found_error = _import_not_found_error() requests = [] return_ids = [] mapping = mapping try: - client.indices.get(index=index_name) + await client.indices.get(index=index_name) except not_found_error: - client.indices.create(index=index_name, body=mapping) + await client.indices.create(index=index_name, body=mapping) for i, text in enumerate(texts): metadata = metadatas[i] if metadatas else {} @@ -102,9 +107,9 @@ def _bulk_ingest_embeddings( request["_id"] = _id requests.append(request) return_ids.append(_id) - bulk(client, requests, max_chunk_bytes=max_chunk_bytes) + await async_bulk(client, requests, max_chunk_bytes=max_chunk_bytes) if not is_aoss: - client.indices.refresh(index=index_name) + await client.indices.refresh(index=index_name) return return_ids @@ -135,7 +140,8 @@ def _knn_search_query( k: int, filters: Optional[MetadataFilters] = None, ) -> Dict: - """Do knn search. + """ + Do knn search. If there are no filters do approx-knn search. If there are (pre)-filters, do an exhaustive exact knn search using 'painless @@ -243,7 +249,8 @@ def _is_aoss_enabled(http_auth: Any) -> bool: class OpensearchVectorClient: - """Object encapsulating an Opensearch index that has vector search enabled. + """ + Object encapsulating an Opensearch index that has vector search enabled. If the index does not yet exist, it is created during init. 
Therefore, the underlying index is assumed to either: @@ -311,15 +318,24 @@ def __init__( } }, } - self._os_client = _get_opensearch_client(self._endpoint, **kwargs) + self._os_client = _get_async_opensearch_client(self._endpoint, **kwargs) not_found_error = _import_not_found_error() + + nest_asyncio.apply() + event_loop = asyncio.get_event_loop() try: - self._os_client.indices.get(index=self._index) + event_loop.run_until_complete( + self._os_client.indices.get(index=self._index) + ) except not_found_error: - self._os_client.indices.create(index=self._index, body=idx_conf) - self._os_client.indices.refresh(index=self._index) + event_loop.run_until_complete( + self._os_client.indices.create(index=self._index, body=idx_conf) + ) + event_loop.run_until_complete( + self._os_client.indices.refresh(index=self._index) + ) - def index_results(self, nodes: List[BaseNode], **kwargs: Any) -> List[str]: + async def index_results(self, nodes: List[BaseNode], **kwargs: Any) -> List[str]: """Store results in the index.""" embeddings: List[List[float]] = [] texts: List[str] = [] @@ -331,7 +347,7 @@ def index_results(self, nodes: List[BaseNode], **kwargs: Any) -> List[str]: texts.append(node.get_content(metadata_mode=MetadataMode.NONE)) metadatas.append(node_to_metadata_dict(node, remove_text=True)) - return _bulk_ingest_embeddings( + return await _bulk_ingest_embeddings( self._os_client, self._index, embeddings, @@ -345,16 +361,16 @@ def index_results(self, nodes: List[BaseNode], **kwargs: Any) -> List[str]: is_aoss=self.is_aoss, ) - def delete_doc_id(self, doc_id: str) -> None: - """Delete a document. + async def delete_doc_id(self, doc_id: str) -> None: + """ + Delete a document. 
Args: doc_id (str): document id """ - body = {"query": {"match": {"metadata.ref_doc_id": doc_id}}} - self._os_client.delete_by_query(index=self._index, body=body) + await self._os_client.delete(index=self._index, id=doc_id) - def query( + async def aquery( self, query_mode: VectorStoreQueryMode, query_str: Optional[str], @@ -380,7 +396,7 @@ def query( ) params = None - res = self._os_client.search( + res = await self._os_client.search( index=self._index, body=search_query, params=params ) nodes = [] @@ -421,7 +437,8 @@ def query( class OpensearchVectorStore(BasePydanticVectorStore): - """Elasticsearch/Opensearch vector store. + """ + Elasticsearch/Opensearch vector store. Args: client (OpensearchVectorClient): Vector index client to use @@ -437,6 +454,7 @@ def __init__( ) -> None: """Initialize params.""" super().__init__() + nest_asyncio.apply() self._client = client @property @@ -449,13 +467,30 @@ def add( nodes: List[BaseNode], **add_kwargs: Any, ) -> List[str]: - """Add nodes to index. + """ + Add nodes to index. Args: nodes: List[BaseNode]: list of nodes with embeddings. """ - self._client.index_results(nodes) + return asyncio.get_event_loop().run_until_complete( + self.async_add(nodes, **add_kwargs) + ) + + async def async_add( + self, + nodes: List[BaseNode], + **add_kwargs: Any, + ) -> List[str]: + """ + Async add nodes to index. + + Args: + nodes: List[BaseNode]: list of nodes with embeddings. + + """ + await self._client.index_results(nodes) return [result.node_id for result in nodes] def delete(self, ref_doc_id: str, **delete_kwargs: Any) -> None: @@ -466,10 +501,35 @@ def delete(self, ref_doc_id: str, **delete_kwargs: Any) -> None: ref_doc_id (str): The doc_id of the document to delete. """ - self._client.delete_doc_id(ref_doc_id) + asyncio.get_event_loop().run_until_complete( + self.adelete(ref_doc_id, **delete_kwargs) + ) + + async def adelete(self, ref_doc_id: str, **delete_kwargs: Any) -> None: + """ + Async delete nodes using with ref_doc_id. 
+ + Args: + ref_doc_id (str): The doc_id of the document to delete. + + """ + await self._client.delete_doc_id(ref_doc_id) def query(self, query: VectorStoreQuery, **kwargs: Any) -> VectorStoreQueryResult: - """Query index for top k most similar nodes. + """ + Query index for top k most similar nodes. + + Args: + query (VectorStoreQuery): Store query object. + + """ + return asyncio.get_event_loop().run_until_complete(self.aquery(query, **kwargs)) + + async def aquery( + self, query: VectorStoreQuery, **kwargs: Any + ) -> VectorStoreQueryResult: + """ + Async query index for top k most similar nodes. Args: query (VectorStoreQuery): Store query object. @@ -477,7 +537,7 @@ def query(self, query: VectorStoreQuery, **kwargs: Any) -> VectorStoreQueryResul """ query_embedding = cast(List[float], query.query_embedding) - return self._client.query( + return await self._client.aquery( query.mode, query.query_str, query_embedding, diff --git a/llama-index-integrations/vector_stores/llama-index-vector-stores-opensearch/pyproject.toml b/llama-index-integrations/vector_stores/llama-index-vector-stores-opensearch/pyproject.toml index 88d546fb78ebe..5b2ff54568f5e 100644 --- a/llama-index-integrations/vector_stores/llama-index-vector-stores-opensearch/pyproject.toml +++ b/llama-index-integrations/vector_stores/llama-index-vector-stores-opensearch/pyproject.toml @@ -27,12 +27,15 @@ exclude = ["**/BUILD"] license = "MIT" name = "llama-index-vector-stores-opensearch" readme = "README.md" -version = "0.1.4" +version = "0.1.6" [tool.poetry.dependencies] python = ">=3.8.1,<4.0" llama-index-core = "^0.10.1" -opensearch-py = "^2.4.2" + +[tool.poetry.dependencies.opensearch-py] +extras = ["async"] +version = "^2.4.2" [tool.poetry.group.dev.dependencies] ipython = "8.10.0" diff --git a/llama-index-integrations/vector_stores/llama-index-vector-stores-opensearch/tests/docker-compose.yml b/llama-index-integrations/vector_stores/llama-index-vector-stores-opensearch/tests/docker-compose.yml new 
file mode 100644
index 0000000000000..753e6b3621132
--- /dev/null
+++ b/llama-index-integrations/vector_stores/llama-index-vector-stores-opensearch/tests/docker-compose.yml
@@ -0,0 +1,11 @@
+version: "3"
+
+services:
+  opensearch:
+    image: opensearchproject/opensearch:latest
+    environment:
+      - discovery.type=single-node
+      - plugins.security.disabled=true
+      - OPENSEARCH_INITIAL_ADMIN_PASSWORD=Asd234%@#%
+    ports:
+      - "9200:9200"
diff --git a/llama-index-integrations/vector_stores/llama-index-vector-stores-opensearch/tests/test_opensearch_client.py b/llama-index-integrations/vector_stores/llama-index-vector-stores-opensearch/tests/test_opensearch_client.py
new file mode 100644
index 0000000000000..399749dd811a3
--- /dev/null
+++ b/llama-index-integrations/vector_stores/llama-index-vector-stores-opensearch/tests/test_opensearch_client.py
@@ -0,0 +1,165 @@
+import asyncio
+import logging
+import pytest
+import uuid
+from typing import List, Generator
+
+from llama_index.core.schema import TextNode
+from llama_index.vector_stores.opensearch import (
+    OpensearchVectorClient,
+    OpensearchVectorStore,
+)
+from llama_index.core.vector_stores.types import VectorStoreQuery
+
+##
+# Start Opensearch locally
+# cd tests
+# docker-compose up
+#
+# Run tests
+# pytest test_opensearch_client.py
+
+logging.basicConfig(level=logging.DEBUG)
+evt_loop = asyncio.get_event_loop()
+
+# Pre-bind the client so the cleanup in `finally` is safe even when the
+# opensearchpy import itself fails and no client was ever created.
+os_client = None
+try:
+    from opensearchpy import AsyncOpenSearch
+
+    os_client = AsyncOpenSearch("localhost:9200")
+    evt_loop.run_until_complete(os_client.info())
+    opensearch_not_available = False
+except (ImportError, Exception):
+    opensearch_not_available = True
+finally:
+    if os_client is not None:
+        evt_loop.run_until_complete(os_client.close())
+
+
+@pytest.mark.skipif(opensearch_not_available, reason="opensearch is not available")
+def test_connection() -> None:
+    assert True
+
+
+@pytest.fixture()
+def index_name() -> str:
+    """Return the index name."""
+    return f"test_{uuid.uuid4().hex}"
+
+
+@pytest.fixture()
+def os_store(index_name: str) -> Generator[OpensearchVectorStore, None, None]:
+    """Yield a store backed by a fresh index; drop the index and close on teardown."""
+    client = OpensearchVectorClient(
+        endpoint="localhost:9200",
+        index=index_name,
+        dim=3,
+    )
+
+    yield OpensearchVectorStore(client)
+
+    # teardown step
+    # delete index
+    evt_loop.run_until_complete(client._os_client.indices.delete(index=index_name))
+    # close client aiohttp session
+    evt_loop.run_until_complete(client._os_client.close())
+
+
+@pytest.fixture(scope="session")
+def node_embeddings() -> List[TextNode]:
+    """Return six text nodes with fixed ids and 3-dimensional embeddings."""
+    return [
+        TextNode(
+            text="lorem ipsum",
+            id_="c330d77f-90bd-4c51-9ed2-57d8d693b3b0",
+            # relationships={NodeRelationship.SOURCE: RelatedNodeInfo(node_id="test-0")},
+            metadata={
+                "author": "Stephen King",
+                "theme": "Friendship",
+            },
+            embedding=[1.0, 0.0, 0.0],
+        ),
+        TextNode(
+            text="lorem ipsum",
+            id_="c3d1e1dd-8fb4-4b8f-b7ea-7fa96038d39d",
+            # relationships={NodeRelationship.SOURCE: RelatedNodeInfo(node_id="test-1")},
+            metadata={
+                "director": "Francis Ford Coppola",
+                "theme": "Mafia",
+            },
+            embedding=[0.0, 1.0, 0.0],
+        ),
+        TextNode(
+            text="lorem ipsum",
+            id_="c3ew11cd-8fb4-4b8f-b7ea-7fa96038d39d",
+            # relationships={NodeRelationship.SOURCE: RelatedNodeInfo(node_id="test-2")},
+            metadata={
+                "director": "Christopher Nolan",
+            },
+            embedding=[0.0, 0.0, 1.0],
+        ),
+        TextNode(
+            text="I was taught that the way of progress was neither swift nor easy.",
+            id_="0b31ae71-b797-4e88-8495-031371a7752e",
+            # relationships={NodeRelationship.SOURCE: RelatedNodeInfo(node_id="text-3")},
+            metadata={
+                "author": "Marie Curie",
+            },
+            embedding=[0.0, 0.0, 0.9],
+        ),
+        TextNode(
+            text=(
+                "The important thing is not to stop questioning."
+                + " Curiosity has its own reason for existing."
+            ),
+            id_="bd2e080b-159a-4030-acc3-d98afd2ba49b",
+            # relationships={NodeRelationship.SOURCE: RelatedNodeInfo(node_id="text-4")},
+            metadata={
+                "author": "Albert Einstein",
+            },
+            embedding=[0.0, 0.0, 0.5],
+        ),
+        TextNode(
+            text=(
+                "I am no bird; and no net ensnares me;"
+                + " I am a free human being with an independent will."
+            ),
+            id_="f658de3b-8cef-4d1c-8bed-9a263c907251",
+            # relationships={NodeRelationship.SOURCE: RelatedNodeInfo(node_id="text-5")},
+            metadata={
+                "author": "Charlotte Bronte",
+            },
+            embedding=[0.0, 0.0, 0.3],
+        ),
+    ]
+
+
+def count_docs_in_index(os_store: OpensearchVectorStore) -> int:
+    """Refresh indices and return the count of documents in the index."""
+    evt_loop.run_until_complete(
+        os_store.client._os_client.indices.refresh(index=os_store.client._index)
+    )
+    count = evt_loop.run_until_complete(
+        os_store.client._os_client.count(index=os_store.client._index)
+    )
+    return count["count"]
+
+
+@pytest.mark.skipif(opensearch_not_available, reason="opensearch is not available")
+def test_functionality(
+    os_store: OpensearchVectorStore, node_embeddings: List[TextNode]
+) -> None:
+    """Round-trip add, query and delete through the synchronous store API."""
+    # add
+    assert len(os_store.add(node_embeddings)) == len(node_embeddings)
+    # query
+    exp_node = node_embeddings[3]
+    query = VectorStoreQuery(query_embedding=exp_node.embedding, similarity_top_k=1)
+    query_result = os_store.query(query)
+    assert query_result.nodes
+    assert query_result.nodes[0].get_content() == exp_node.text
+    # delete
+    os_store.delete(exp_node.id_)
+    assert count_docs_in_index(os_store) == len(node_embeddings) - 1
diff --git a/llama-index-legacy/llama_index/legacy/callbacks/__init__.py b/llama-index-legacy/llama_index/legacy/callbacks/__init__.py
index d419baa947969..097353e3bd341 100644
--- a/llama-index-legacy/llama_index/legacy/callbacks/__init__.py
+++ b/llama-index-legacy/llama_index/legacy/callbacks/__init__.py
@@ -5,7 +5,6 @@
 from .open_inference_callback import OpenInferenceCallbackHandler
 from .schema import CBEvent,
CBEventType, EventPayload from .token_counting import TokenCountingHandler -from .uptrain_callback import UpTrainCallbackHandler from .utils import trace_method from .wandb_callback import WandbCallbackHandler @@ -22,5 +21,4 @@ "OpenAIFineTuningHandler", "GradientAIFineTuningHandler", "trace_method", - "UpTrainCallbackHandler", ] diff --git a/llama-index-legacy/llama_index/legacy/callbacks/global_handlers.py b/llama-index-legacy/llama_index/legacy/callbacks/global_handlers.py index c52ed3ed354f1..f191de2181bda 100644 --- a/llama-index-legacy/llama_index/legacy/callbacks/global_handlers.py +++ b/llama-index-legacy/llama_index/legacy/callbacks/global_handlers.py @@ -14,7 +14,6 @@ ) from llama_index.legacy.callbacks.promptlayer_handler import PromptLayerHandler from llama_index.legacy.callbacks.simple_llm_handler import SimpleLLMHandler -from llama_index.legacy.callbacks.uptrain_callback import UpTrainCallbackHandler from llama_index.legacy.callbacks.wandb_callback import WandbCallbackHandler @@ -41,8 +40,6 @@ def create_global_handler(eval_mode: str, **eval_params: Any) -> BaseCallbackHan handler = deepeval_callback_handler(**eval_params) elif eval_mode == "simple": handler = SimpleLLMHandler(**eval_params) - elif eval_mode == "uptrain": - handler = UpTrainCallbackHandler(**eval_params) elif eval_mode == "argilla": handler = argilla_callback_handler(**eval_params) else: diff --git a/llama-index-legacy/llama_index/legacy/core/embeddings/base.py b/llama-index-legacy/llama_index/legacy/core/embeddings/base.py index 263d96dd9eb7d..1e7edcd23cfcf 100644 --- a/llama-index-legacy/llama_index/legacy/core/embeddings/base.py +++ b/llama-index-legacy/llama_index/legacy/core/embeddings/base.py @@ -289,16 +289,13 @@ async def aget_text_embedding_batch( nested_embeddings = [] if show_progress: try: - from tqdm.auto import tqdm - - nested_embeddings = [ - await f - for f in tqdm( - asyncio.as_completed(embeddings_coroutines), - total=len(embeddings_coroutines), - desc="Generating 
embeddings", - ) - ] + from tqdm.asyncio import tqdm_asyncio + + nested_embeddings = await tqdm_asyncio.gather( + *embeddings_coroutines, + total=len(embeddings_coroutines), + desc="Generating embeddings", + ) except ImportError: nested_embeddings = await asyncio.gather(*embeddings_coroutines) else: diff --git a/llama-index-legacy/llama_index/legacy/embeddings/multi_modal_base.py b/llama-index-legacy/llama_index/legacy/embeddings/multi_modal_base.py index 82f5088099e75..a3a6eba662f82 100644 --- a/llama-index-legacy/llama_index/legacy/embeddings/multi_modal_base.py +++ b/llama-index-legacy/llama_index/legacy/embeddings/multi_modal_base.py @@ -155,16 +155,13 @@ async def aget_image_embedding_batch( nested_embeddings = [] if show_progress: try: - from tqdm.auto import tqdm - - nested_embeddings = [ - await f - for f in tqdm( - asyncio.as_completed(embeddings_coroutines), - total=len(embeddings_coroutines), - desc="Generating image embeddings", - ) - ] + from tqdm.asyncio import tqdm_asyncio + + nested_embeddings = await tqdm_asyncio.gather( + *embeddings_coroutines, + total=len(embeddings_coroutines), + desc="Generating embeddings", + ) except ImportError: nested_embeddings = await asyncio.gather(*embeddings_coroutines) else: diff --git a/llama-index-legacy/llama_index/legacy/retrievers/fusion_retriever.py b/llama-index-legacy/llama_index/legacy/retrievers/fusion_retriever.py index 8b9f2859307f1..caa900bacf9f7 100644 --- a/llama-index-legacy/llama_index/legacy/retrievers/fusion_retriever.py +++ b/llama-index-legacy/llama_index/legacy/retrievers/fusion_retriever.py @@ -127,7 +127,11 @@ def _simple_fusion( for nodes_with_scores in results.values(): for node_with_score in nodes_with_scores: text = node_with_score.node.get_content() - all_nodes[text] = node_with_score + if text in all_nodes: + score = max(node_with_score.score, all_nodes[text].score) + all_nodes[text].score = score + else: + all_nodes[text] = node_with_score return sorted(all_nodes.values(), key=lambda x: 
x.score or 0.0, reverse=True) diff --git a/llama-index-packs/llama-index-packs-chroma-autoretrieval/README.md b/llama-index-packs/llama-index-packs-chroma-autoretrieval/README.md index 7f70de593e16d..dc46644c7ba66 100644 --- a/llama-index-packs/llama-index-packs-chroma-autoretrieval/README.md +++ b/llama-index-packs/llama-index-packs-chroma-autoretrieval/README.md @@ -31,7 +31,7 @@ Then, you can set up the pack like so: ```python # setup pack arguments -from llama_index.core.vector_stores.types import MetadataInfo, VectorStoreInfo +from llama_index.core.vector_stores import MetadataInfo, VectorStoreInfo vector_store_info = VectorStoreInfo( content_info="brief biography of celebrities", diff --git a/llama-index-packs/llama-index-packs-cogniswitch-agent/README.md b/llama-index-packs/llama-index-packs-cogniswitch-agent/README.md index 476ee35eb431c..0723ca6d75c41 100644 --- a/llama-index-packs/llama-index-packs-cogniswitch-agent/README.md +++ b/llama-index-packs/llama-index-packs-cogniswitch-agent/README.md @@ -42,7 +42,7 @@ llamaindex-cli download-llamapack CogniswitchAgentPack --download-dir ./cs_pack import warnings warnings.filterwarnings("ignore") -from llama_index.core.llama_packs import CogniswitchAgentPack +from llama_index.packs.cogniswitch_agent import CogniswitchAgentPack import os diff --git a/llama-index-packs/llama-index-packs-deeplake-deepmemory-retriever/README.md b/llama-index-packs/llama-index-packs-deeplake-deepmemory-retriever/README.md index 7546a55058a75..2be08da526be6 100644 --- a/llama-index-packs/llama-index-packs-deeplake-deepmemory-retriever/README.md +++ b/llama-index-packs/llama-index-packs-deeplake-deepmemory-retriever/README.md @@ -17,7 +17,7 @@ You can then inspect the files at `./deepmemory_pack` and use them as a template You can download the pack to a `./deepmemory_pack` directory: ```python -from llama_hub.llama_pack import download_llama_pack +from llama_index.core.llama_pack import download_llama_pack # download and install 
dependencies DeepMemoryRetriever = download_llama_pack( @@ -31,7 +31,7 @@ Then, you can set up the pack like so: ```python # setup pack arguments -from llama_index.core.vector_stores.types import MetadataInfo, VectorStoreInfo +from llama_index.core.vector_stores import MetadataInfo, VectorStoreInfo nodes = [...] diff --git a/llama-index-packs/llama-index-packs-deeplake-multimodal-retrieval/README.md b/llama-index-packs/llama-index-packs-deeplake-multimodal-retrieval/README.md index 50427fe9d3d16..72fc3f3910702 100644 --- a/llama-index-packs/llama-index-packs-deeplake-multimodal-retrieval/README.md +++ b/llama-index-packs/llama-index-packs-deeplake-multimodal-retrieval/README.md @@ -17,7 +17,7 @@ You can then inspect the files at `./deeplake_multimodal_pack` and use them as a You can download the pack to a `./deeplake_multimodal_pack` directory: ```python -from llama_hub.llama_pack import download_llama_pack +from llama_index.core.llama_pack import download_llama_pack # download and install dependencies DeepLakeMultimodalRetriever = download_llama_pack( @@ -31,7 +31,7 @@ Then, you can set up the pack like so: ```python # setup pack arguments -from llama_index.core.vector_stores.types import MetadataInfo, VectorStoreInfo +from llama_index.core.vector_stores import MetadataInfo, VectorStoreInfo # collection of image and text nodes nodes = [...] 
diff --git a/llama-index-packs/llama-index-packs-dense-x-retrieval/README.md b/llama-index-packs/llama-index-packs-dense-x-retrieval/README.md index 4219bb4489931..0b8bf6c6ae2a0 100644 --- a/llama-index-packs/llama-index-packs-dense-x-retrieval/README.md +++ b/llama-index-packs/llama-index-packs-dense-x-retrieval/README.md @@ -29,7 +29,7 @@ You can then inspect the files at `./dense_pack` and use them as a template for You can download the pack to a the `./dense_pack` directory: ```python -from llama_index import SimpleDirectoryReader +from llama_index.core import SimpleDirectoryReader from llama_index.core.llama_pack import download_llama_pack # download and install dependencies diff --git a/llama-index-packs/llama-index-packs-evaluator-benchmarker/README.md b/llama-index-packs/llama-index-packs-evaluator-benchmarker/README.md index 3fff5c2aca9e1..ba1ea63b00cd7 100644 --- a/llama-index-packs/llama-index-packs-evaluator-benchmarker/README.md +++ b/llama-index-packs/llama-index-packs-evaluator-benchmarker/README.md @@ -32,8 +32,8 @@ single-grading evaluation — in this case, the usage flow remains the same. 
from llama_index.core.llama_dataset import download_llama_dataset from llama_index.core.llama_pack import download_llama_pack from llama_index.core.evaluation import PairwiseComparisonEvaluator -from llama_index.core.llms import OpenAI -from llama_index import ServiceContext +from llama_index.llms.openai import OpenAI +from llama_index.core import ServiceContext # download a LabelledRagDataset from llama-hub pairwise_dataset = download_llama_dataset( diff --git a/llama-index-packs/llama-index-packs-fuzzy-citation/README.md b/llama-index-packs/llama-index-packs-fuzzy-citation/README.md index edb6f077ac1dc..4b90e932aafa6 100644 --- a/llama-index-packs/llama-index-packs-fuzzy-citation/README.md +++ b/llama-index-packs/llama-index-packs-fuzzy-citation/README.md @@ -21,7 +21,7 @@ You can then inspect the files at `./fuzzy_citation_pack` and use them as a temp You can download the pack to a the `./fuzzy_citation_pack` directory: ```python -from llama_index import Document, VectorStoreIndex +from llama_index.core import Document, VectorStoreIndex from llama_index.core.llama_pack import download_llama_pack # download and install dependencies diff --git a/llama-index-packs/llama-index-packs-gmail-openai-agent/README.md b/llama-index-packs/llama-index-packs-gmail-openai-agent/README.md index a8cd8cec53bbd..1e13d1329d6a2 100644 --- a/llama-index-packs/llama-index-packs-gmail-openai-agent/README.md +++ b/llama-index-packs/llama-index-packs-gmail-openai-agent/README.md @@ -43,7 +43,7 @@ agent = gmail_agent_pack.agent response = agent.chat("What is my most recent email?") # Use the tool spec in another agent -from llama_index.core.agents import ReActAgent +from llama_index.core.agent import ReActAgent tool_spec = gmail_agent_pack.tool_spec agent = ReActAgent.from_tools(tool_spec.to_tool_lost()) diff --git a/llama-index-packs/llama-index-packs-koda-retriever/README.md b/llama-index-packs/llama-index-packs-koda-retriever/README.md index 582d67388a106..c703e1467de2f 100644 --- 
a/llama-index-packs/llama-index-packs-koda-retriever/README.md +++ b/llama-index-packs/llama-index-packs-koda-retriever/README.md @@ -29,7 +29,7 @@ Please see the [examples](./examples/) folder for more specific examples. from llama_index.packs.koda_retriever import KodaRetriever from llama_index.core import VectorStoreIndex from llama_index.llms.openai import OpenAI -from llama_index.embeddings.openai.base import OpenAIEmbedding +from llama_index.embeddings.openai import OpenAIEmbedding from llama_index.core.postprocessor import LLMRerank from llama_index.core import Settings diff --git a/llama-index-packs/llama-index-packs-multidoc-autoretrieval/README.md b/llama-index-packs/llama-index-packs-multidoc-autoretrieval/README.md index d8250aa7652d5..f5ddbcdd8dcc2 100644 --- a/llama-index-packs/llama-index-packs-multidoc-autoretrieval/README.md +++ b/llama-index-packs/llama-index-packs-multidoc-autoretrieval/README.md @@ -31,7 +31,7 @@ Then, you can set up the pack like so: ```python # setup pack arguments -from llama_index.core.vector_stores.types import MetadataInfo, VectorStoreInfo +from llama_index.core.vector_stores import MetadataInfo, VectorStoreInfo import weaviate diff --git a/llama-index-packs/llama-index-packs-nebulagraph-query-engine/README.md b/llama-index-packs/llama-index-packs-nebulagraph-query-engine/README.md index a776ac5c2c001..5b3538fda58c9 100644 --- a/llama-index-packs/llama-index-packs-nebulagraph-query-engine/README.md +++ b/llama-index-packs/llama-index-packs-nebulagraph-query-engine/README.md @@ -37,11 +37,15 @@ From here, you can use the pack, or inspect and modify the pack in `./nebulagrap Then, you can set up the pack like so: +```bash +pip install llama-index-readers-wikipedia +``` + ```python # Load the docs (example of Paleo diet from Wikipedia) -from llama_index import download_loader -WikipediaReader = download_loader("WikipediaReader") +from llama_index.readers.wikipedia import WikipediaReader + loader = WikipediaReader() docs = 
loader.load_data(pages=["Paleolithic diet"], auto_suggest=False) print(f"Loaded {len(docs)} documents") @@ -75,7 +79,7 @@ nebulagraph_pack = NebulaGraphQueryEnginePack( Optionally, you can pass in the `query_engine_type` from `NebulaGraphQueryEngineType` to construct `NebulaGraphQueryEnginePack`. If `query_engine_type` is not defined, it defaults to Knowledge Graph vector based entity retrieval. ```python -from llama_index.packs.nebulagraph_query_engine.base import ( +from llama_index.core.packs.nebulagraph_query_engine.base import ( NebulaGraphQueryEngineType, ) diff --git a/llama-index-packs/llama-index-packs-neo4j-query-engine/README.md b/llama-index-packs/llama-index-packs-neo4j-query-engine/README.md index c508cc743a6d3..2582fe676a260 100644 --- a/llama-index-packs/llama-index-packs-neo4j-query-engine/README.md +++ b/llama-index-packs/llama-index-packs-neo4j-query-engine/README.md @@ -37,11 +37,15 @@ From here, you can use the pack, or inspect and modify the pack in `./neo4j_pack Then, you can set up the pack like so: +```bash +pip install llama-index-readers-wikipedia +``` + ```python # Load the docs (example of Paleo diet from Wikipedia) -from llama_index import download_loader -WikipediaReader = download_loader("WikipediaReader") +from llama_index.readers.wikipedia import WikipediaReader + loader = WikipediaReader() docs = loader.load_data(pages=["Paleolithic diet"], auto_suggest=False) print(f"Loaded {len(docs)} documents") @@ -63,7 +67,7 @@ neo4j_pack = Neo4jQueryEnginePack( Optionally, you can pass in the `query_engine_type` from `Neo4jQueryEngineType` to construct `Neo4jQueryEnginePack`. If `query_engine_type` is not defined, it defaults to Knowledge Graph vector based entity retrieval. 
```python -from llama_index.packs.neo4j_query_engine.base import Neo4jQueryEngineType +from llama_index.core.packs.neo4j_query_engine.base import Neo4jQueryEngineType # create the pack neo4j_pack = Neo4jQueryEnginePack( diff --git a/llama-index-packs/llama-index-packs-rag-cli-local/README.md b/llama-index-packs/llama-index-packs-rag-cli-local/README.md index 90352835e6f1e..ee3ba4a0d2eab 100644 --- a/llama-index-packs/llama-index-packs-rag-cli-local/README.md +++ b/llama-index-packs/llama-index-packs-rag-cli-local/README.md @@ -21,7 +21,7 @@ which makes it hard to load directly. We will show you how to import the agent from these files! ```python -from llama_index.llama_pack import download_llama_pack +from llama_index.core.llama_pack import download_llama_pack # download and install dependencies download_llama_pack("LocalRAGCLIPack", "./local_rag_cli_pack", skip_load=True) diff --git a/llama-index-packs/llama-index-packs-rag-evaluator/README.md b/llama-index-packs/llama-index-packs-rag-evaluator/README.md index abe136c89642a..d5a6d405f75f8 100644 --- a/llama-index-packs/llama-index-packs-rag-evaluator/README.md +++ b/llama-index-packs/llama-index-packs-rag-evaluator/README.md @@ -25,7 +25,7 @@ built off of its source documents. 
```python from llama_index.core.llama_dataset import download_llama_dataset from llama_index.core.llama_pack import download_llama_pack -from llama_index import VectorStoreIndex +from llama_index.core import VectorStoreIndex # download a LabelledRagDataset from llama-hub rag_dataset, documents = download_llama_dataset( diff --git a/llama-index-packs/llama-index-packs-raptor/.gitignore b/llama-index-packs/llama-index-packs-raptor/.gitignore new file mode 100644 index 0000000000000..990c18de22908 --- /dev/null +++ b/llama-index-packs/llama-index-packs-raptor/.gitignore @@ -0,0 +1,153 @@ +llama_index/_static +.DS_Store +# Byte-compiled / optimized / DLL files +__pycache__/ +*.py[cod] +*$py.class + +# C extensions +*.so + +# Distribution / packaging +.Python +bin/ +build/ +develop-eggs/ +dist/ +downloads/ +eggs/ +.eggs/ +etc/ +include/ +lib/ +lib64/ +parts/ +sdist/ +share/ +var/ +wheels/ +pip-wheel-metadata/ +share/python-wheels/ +*.egg-info/ +.installed.cfg +*.egg +MANIFEST + +# PyInstaller +# Usually these files are written by a python script from a template +# before PyInstaller builds the exe, so as to inject date/other infos into it. +*.manifest +*.spec + +# Installer logs +pip-log.txt +pip-delete-this-directory.txt + +# Unit test / coverage reports +htmlcov/ +.tox/ +.nox/ +.coverage +.coverage.* +.cache +nosetests.xml +coverage.xml +*.cover +*.py,cover +.hypothesis/ +.pytest_cache/ +.ruff_cache + +# Translations +*.mo +*.pot + +# Django stuff: +*.log +local_settings.py +db.sqlite3 +db.sqlite3-journal + +# Flask stuff: +instance/ +.webassets-cache + +# Scrapy stuff: +.scrapy + +# Sphinx documentation +docs/_build/ + +# PyBuilder +target/ + +# Jupyter Notebook +.ipynb_checkpoints +notebooks/ + +# IPython +profile_default/ +ipython_config.py + +# pyenv +.python-version + +# pipenv +# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control. 
+# However, in case of collaboration, if having platform-specific dependencies or dependencies +# having no cross-platform support, pipenv may install dependencies that don't work, or not +# install all needed dependencies. +#Pipfile.lock + +# PEP 582; used by e.g. github.com/David-OConnor/pyflow +__pypackages__/ + +# Celery stuff +celerybeat-schedule +celerybeat.pid + +# SageMath parsed files +*.sage.py + +# Environments +.env +.venv +env/ +venv/ +ENV/ +env.bak/ +venv.bak/ +pyvenv.cfg + +# Spyder project settings +.spyderproject +.spyproject + +# Rope project settings +.ropeproject + +# mkdocs documentation +/site + +# mypy +.mypy_cache/ +.dmypy.json +dmypy.json + +# Pyre type checker +.pyre/ + +# Jetbrains +.idea +modules/ +*.swp + +# VsCode +.vscode + +# pipenv +Pipfile +Pipfile.lock + +# pyright +pyrightconfig.json diff --git a/llama-index-packs/llama-index-packs-raptor/BUILD b/llama-index-packs/llama-index-packs-raptor/BUILD new file mode 100644 index 0000000000000..09bd1b6726c8f --- /dev/null +++ b/llama-index-packs/llama-index-packs-raptor/BUILD @@ -0,0 +1,4 @@ +poetry_requirements( + name="poetry", + module_mapping={"umap-learn": ["umap"], "scikit-learn": ["sklearn"]} +) diff --git a/llama-index-packs/llama-index-packs-raptor/Makefile b/llama-index-packs/llama-index-packs-raptor/Makefile new file mode 100644 index 0000000000000..b9eab05aa3706 --- /dev/null +++ b/llama-index-packs/llama-index-packs-raptor/Makefile @@ -0,0 +1,17 @@ +GIT_ROOT ?= $(shell git rev-parse --show-toplevel) + +help: ## Show all Makefile targets. + @grep -E '^[a-zA-Z_-]+:.*?## .*$$' $(MAKEFILE_LIST) | awk 'BEGIN {FS = ":.*?## "}; {printf "\033[33m%-30s\033[0m %s\n", $$1, $$2}' + +format: ## Run code autoformatters (black). 
+ pre-commit install + git ls-files | xargs pre-commit run black --files + +lint: ## Run linters: pre-commit (black, ruff, codespell) and mypy + pre-commit install && git ls-files | xargs pre-commit run --show-diff-on-failure --files + +test: ## Run tests via pytest. + pytest tests + +watch-docs: ## Build and watch documentation. + sphinx-autobuild docs/ docs/_build/html --open-browser --watch $(GIT_ROOT)/llama_index/ diff --git a/llama-index-packs/llama-index-packs-raptor/README.md b/llama-index-packs/llama-index-packs-raptor/README.md new file mode 100644 index 0000000000000..4b9b07fb5a549 --- /dev/null +++ b/llama-index-packs/llama-index-packs-raptor/README.md @@ -0,0 +1,78 @@ +# Raptor Retriever LlamaPack + +This LlamaPack shows how to use an implementation of RAPTOR with llama-index, leveraging the RAPTOR pack. + +RAPTOR works by recursively clustering and summarizing clusters in layers for retrieval. + +There are two retrieval modes: + +- tree_traversal -- traversing the tree of clusters, performing top-k at each level in the tree. +- collapsed -- treat the entire tree as a giant pile of nodes, perform simple top-k. + +See [the paper](https://arxiv.org/abs/2401.18059) for full algorithm details. + +## CLI Usage + +You can download llamapacks directly using `llamaindex-cli`, which comes installed with the `llama-index` python package: + +```bash +llamaindex-cli download-llamapack RaptorPack --download-dir ./raptor_pack +``` + +You can then inspect/modify the files at `./raptor_pack` and use them as a template for your own project. + +## Code Usage + +You can alternatively install the package: + +`pip install llama-index-packs-raptor` + +Then, you can import and initialize the pack! This will perform clustering and summarization over your data. + +```python +from llama_index.packs.raptor import RaptorPack + +pack = RaptorPack(documents, llm=llm, embed_model=embed_model) +``` + +The `run()` function is a light wrapper around `retriever.retrieve()`.
+ +```python +nodes = pack.run( + "query", + mode="collapsed", # or tree_traversal +) +``` + +You can also use modules individually. + +```python +# get the retriever +retriever = pack.retriever +``` + +## Persistence + +The `RaptorPack` comes with the `RaptorRetriever`, which offers ways of saving/reloading! + +If you are using a remote vector-db, just pass it in + +```python +# Pack usage +pack = RaptorPack(..., vector_store=vector_store) + +# RaptorRetriever usage +retriever = RaptorRetriever(..., vector_store=vector_store) +``` + +Then, to re-connect, just pass in the vector store again and an empty list of documents + +```python +# Pack usage +pack = RaptorPack([], ..., vector_store=vector_store) + +# RaptorRetriever usage +retriever = RaptorRetriever([], ..., vector_store=vector_store) +``` + +Check out the [notebook here for complete details!](https://github.com/run-llama/llama_index/blob/main/llama-index-packs/llama-index-packs-raptor/examples/raptor.ipynb). diff --git a/llama-index-packs/llama-index-packs-raptor/examples/raptor.ipynb b/llama-index-packs/llama-index-packs-raptor/examples/raptor.ipynb new file mode 100644 index 0000000000000..1f550dc52375e --- /dev/null +++ b/llama-index-packs/llama-index-packs-raptor/examples/raptor.ipynb @@ -0,0 +1,379 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# RAPTOR: Recursive Abstractive Processing for Tree-Organized Retrieval\n", + "\n", + "This notebook shows how to use an implementation of RAPTOR with llama-index, leveraging the RAPTOR llama-pack.\n", + "\n", + "RAPTOR works by recursively clustering and summarizing clusters in layers for retrieval.\n", + "\n", + "There are two retrieval modes:\n", + "- tree_traversal -- traversing the tree of clusters, performing top-k at each level in the tree.\n", + "- collapsed -- treat the entire tree as a giant pile of nodes, perform simple top-k.\n", + "\n", + "See [the paper](https://arxiv.org/abs/2401.18059) for full algorithm
details." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Setup" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "!pip install llama-index llama-index-packs-raptor llama-index-vector-stores-chroma" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.packs.raptor import RaptorPack\n", + "\n", + "# optionally download the pack to inspect/modify it yourself!\n", + "# from llama_index.core.llama_pack import download_llama_pack\n", + "# RaptorPack = download_llama_pack(\"RaptorPack\", \"./raptor_pack\")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Will not apply HSTS. The HSTS database must be a regular and non-world-writable file.\n", + "ERROR: could not open HSTS store at '/home/loganm/.wget-hsts'. HSTS will be disabled.\n", + "--2024-02-29 22:16:11-- https://arxiv.org/pdf/2401.18059.pdf\n", + "Resolving arxiv.org (arxiv.org)... 151.101.3.42, 151.101.195.42, 151.101.131.42, ...\n", + "Connecting to arxiv.org (arxiv.org)|151.101.3.42|:443... connected.\n", + "HTTP request sent, awaiting response...
200 OK\n", + "Length: 2547113 (2.4M) [application/pdf]\n", + "Saving to: ‘./raptor_paper.pdf’\n", + "\n", + "./raptor_paper.pdf 100%[===================>] 2.43M 12.5MB/s in 0.2s \n", + "\n", + "2024-02-29 22:16:12 (12.5 MB/s) - ‘./raptor_paper.pdf’ saved [2547113/2547113]\n", + "\n" + ] + } + ], + "source": [ + "!wget https://arxiv.org/pdf/2401.18059.pdf -O ./raptor_paper.pdf" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + "\n", + "os.environ[\"OPENAI_API_KEY\"] = \"sk-...\"" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Constructing the Clusters/Hierarchy Tree" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "import nest_asyncio\n", + "\n", + "nest_asyncio.apply()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.core import SimpleDirectoryReader\n", + "\n", + "documents = SimpleDirectoryReader(input_files=[\"./raptor_paper.pdf\"]).load_data()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Generating embeddings for level 0.\n", + "Performing clustering for level 0.\n", + "Generating summaries for level 0 with 10 clusters.\n", + "Level 0 created summaries/clusters: 10\n", + "Generating embeddings for level 1.\n", + "Performing clustering for level 1.\n", + "Generating summaries for level 1 with 1 clusters.\n", + "Level 1 created summaries/clusters: 1\n", + "Generating embeddings for level 2.\n", + "Performing clustering for level 2.\n", + "Generating summaries for level 2 with 1 clusters.\n", + "Level 2 created summaries/clusters: 1\n" + ] + } + ], + "source": [ + "from llama_index.core.node_parser import SentenceSplitter\n", + "from llama_index.llms.openai import OpenAI\n", + "from 
llama_index.embeddings.openai import OpenAIEmbedding\n", + "from llama_index.vector_stores.chroma import ChromaVectorStore\n", + "import chromadb\n", + "\n", + "client = chromadb.PersistentClient(path=\"./raptor_paper_db\")\n", + "collection = client.get_or_create_collection(\"raptor\")\n", + "\n", + "vector_store = ChromaVectorStore(chroma_collection=collection)\n", + "\n", + "raptor_pack = RaptorPack(\n", + " documents,\n", + " embed_model=OpenAIEmbedding(\n", + " model=\"text-embedding-3-small\"\n", + " ), # used for embedding clusters\n", + " llm=OpenAI(model=\"gpt-3.5-turbo\", temperature=0.1), # used for generating summaries\n", + " vector_store=vector_store, # used for storage\n", + " similarity_top_k=2, # top k for each layer, or overall top-k for collapsed\n", + " mode=\"collapsed\", # sets default mode\n", + " transformations=[\n", + " SentenceSplitter(chunk_size=400, chunk_overlap=50)\n", + " ], # transformations applied for ingestion\n", + ")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Retrieval" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2\n", + "Specifically, RAPTOR’s F-1 scores are at least 1.8% points higher than DPR and at least 5.3% points\n", + "higher than BM25.\n", + "Retriever GPT-3 F-1 Match GPT-4 F-1 Match UnifiedQA F-1 Match\n", + "Title + Abstract 25.2 22.2 17.5\n", + "BM25 46.6 50.2 26.4\n", + "DPR 51.3 53.0 32.1\n", + "RAPTOR 53.1 55.7 36.6\n", + "Table 4: Comparison of accuracies on the QuAL-\n", + "ITY dev dataset for two different language mod-\n", + "els (GPT-3, UnifiedQA 3B) using various retrieval\n", + "methods. RAPTOR outperforms the baselines of\n", + "BM25 and DPR by at least 2.0% in accuracy.\n", + "Model GPT-3 Acc. 
UnifiedQA Acc.\n", + "BM25 57.3 49.9\n", + "DPR 60.4 53.9\n", + "RAPTOR 62.4 56.6\n", + "Table 5: Results on F-1 Match scores of various\n", + "models on the QASPER dataset.\n", + "Model F-1 Match\n", + "LongT5 XL (Guo et al., 2022) 53.1\n", + "CoLT5 XL (Ainslie et al., 2023) 53.9\n", + "RAPTOR + GPT-4 55.7Comparison to State-of-the-art Systems\n", + "Building upon our controlled comparisons,\n", + "we examine RAPTOR’s performance relative\n", + "to other state-of-the-art models.\n" + ] + } + ], + "source": [ + "nodes = raptor_pack.run(\"What baselines is raptor compared against?\", mode=\"collapsed\")\n", + "print(len(nodes))\n", + "print(nodes[0].text)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Retrieved parent IDs from level 2: ['cc3b3f41-f4ca-4020-b11f-be7e0ce04c4f']\n", + "Retrieved 1 from parents at level 2.\n", + "Retrieved parent IDs from level 1: ['a4ca9426-a312-4a01-813a-c9b02aefc7e8']\n", + "Retrieved 2 from parents at level 1.\n", + "Retrieved parent IDs from level 0: ['63126782-2778-449f-99c0-1e8fd90caa36', 'd8f68d31-d878-41f1-aeb6-a7dde8ed5143']\n", + "Retrieved 4 from parents at level 0.\n", + "4\n", + "Specifically, RAPTOR’s F-1 scores are at least 1.8% points higher than DPR and at least 5.3% points\n", + "higher than BM25.\n", + "Retriever GPT-3 F-1 Match GPT-4 F-1 Match UnifiedQA F-1 Match\n", + "Title + Abstract 25.2 22.2 17.5\n", + "BM25 46.6 50.2 26.4\n", + "DPR 51.3 53.0 32.1\n", + "RAPTOR 53.1 55.7 36.6\n", + "Table 4: Comparison of accuracies on the QuAL-\n", + "ITY dev dataset for two different language mod-\n", + "els (GPT-3, UnifiedQA 3B) using various retrieval\n", + "methods. RAPTOR outperforms the baselines of\n", + "BM25 and DPR by at least 2.0% in accuracy.\n", + "Model GPT-3 Acc. 
UnifiedQA Acc.\n", + "BM25 57.3 49.9\n", + "DPR 60.4 53.9\n", + "RAPTOR 62.4 56.6\n", + "Table 5: Results on F-1 Match scores of various\n", + "models on the QASPER dataset.\n", + "Model F-1 Match\n", + "LongT5 XL (Guo et al., 2022) 53.1\n", + "CoLT5 XL (Ainslie et al., 2023) 53.9\n", + "RAPTOR + GPT-4 55.7Comparison to State-of-the-art Systems\n", + "Building upon our controlled comparisons,\n", + "we examine RAPTOR’s performance relative\n", + "to other state-of-the-art models.\n" + ] + } + ], + "source": [ + "nodes = raptor_pack.run(\n", + " \"What baselines is raptor compared against?\", mode=\"tree_traversal\"\n", + ")\n", + "print(len(nodes))\n", + "print(nodes[0].text)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Loading\n", + "\n", + "Since we saved to a vector store, we can also use it again! (For local vector stores, there is a `persist` and `from_persist_dir` method on the retriever)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.packs.raptor import RaptorRetriever\n", + "\n", + "retriever = RaptorRetriever(\n", + " [],\n", + " embed_model=OpenAIEmbedding(\n", + " model=\"text-embedding-3-small\"\n", + " ), # used for embedding clusters\n", + " llm=OpenAI(model=\"gpt-3.5-turbo\", temperature=0.1), # used for generating summaries\n", + " vector_store=vector_store, # used for storage\n", + " similarity_top_k=2, # top k for each layer, or overall top-k for collapsed\n", + " mode=\"tree_traversal\", # sets default mode\n", + ")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# if using a default vector store\n", + "# retriever.persist(\"./persist\")\n", + "# retriever = RaptorRetriever.from_persist_dir(\"./persist\", ...)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Query Engine" + ] + }, + { + "cell_type": "code", + "execution_count": 
null, + "metadata": {}, + "outputs": [], + "source": [ + "from llama_index.core.query_engine import RetrieverQueryEngine\n", + "\n", + "query_engine = RetrieverQueryEngine.from_args(\n", + " raptor_pack.retriever, llm=OpenAI(model=\"gpt-3.5-turbo\", temperature=0.1)\n", + ")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "response = query_engine.query(\"What baselines was RAPTOR compared against?\")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "BM25 and DPR\n" + ] + } + ], + "source": [ + "print(str(response))" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "llama-index-4aB9_5sa-py3.10", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/llama-index-packs/llama-index-packs-raptor/examples/raptor/81db1dbe-a06d-43a6-ba07-875398bc33a7/data_level0.bin b/llama-index-packs/llama-index-packs-raptor/examples/raptor/81db1dbe-a06d-43a6-ba07-875398bc33a7/data_level0.bin new file mode 100644 index 0000000000000..ea3192e8ec511 Binary files /dev/null and b/llama-index-packs/llama-index-packs-raptor/examples/raptor/81db1dbe-a06d-43a6-ba07-875398bc33a7/data_level0.bin differ diff --git a/llama-index-packs/llama-index-packs-raptor/examples/raptor/81db1dbe-a06d-43a6-ba07-875398bc33a7/header.bin b/llama-index-packs/llama-index-packs-raptor/examples/raptor/81db1dbe-a06d-43a6-ba07-875398bc33a7/header.bin new file mode 100644 index 0000000000000..3e0932a7d0033 Binary files /dev/null and b/llama-index-packs/llama-index-packs-raptor/examples/raptor/81db1dbe-a06d-43a6-ba07-875398bc33a7/header.bin differ 
diff --git a/llama-index-packs/llama-index-packs-raptor/examples/raptor/81db1dbe-a06d-43a6-ba07-875398bc33a7/length.bin b/llama-index-packs/llama-index-packs-raptor/examples/raptor/81db1dbe-a06d-43a6-ba07-875398bc33a7/length.bin new file mode 100644 index 0000000000000..45bfe72ed91d6 Binary files /dev/null and b/llama-index-packs/llama-index-packs-raptor/examples/raptor/81db1dbe-a06d-43a6-ba07-875398bc33a7/length.bin differ diff --git a/llama-index-packs/llama-index-packs-raptor/examples/raptor/81db1dbe-a06d-43a6-ba07-875398bc33a7/link_lists.bin b/llama-index-packs/llama-index-packs-raptor/examples/raptor/81db1dbe-a06d-43a6-ba07-875398bc33a7/link_lists.bin new file mode 100644 index 0000000000000..e69de29bb2d1d diff --git a/llama-index-packs/llama-index-packs-raptor/examples/raptor/chroma.sqlite3 b/llama-index-packs/llama-index-packs-raptor/examples/raptor/chroma.sqlite3 new file mode 100644 index 0000000000000..ca77f198baaba Binary files /dev/null and b/llama-index-packs/llama-index-packs-raptor/examples/raptor/chroma.sqlite3 differ diff --git a/llama-index-packs/llama-index-packs-raptor/llama_index/packs/raptor/BUILD b/llama-index-packs/llama-index-packs-raptor/llama_index/packs/raptor/BUILD new file mode 100644 index 0000000000000..db46e8d6c978c --- /dev/null +++ b/llama-index-packs/llama-index-packs-raptor/llama_index/packs/raptor/BUILD @@ -0,0 +1 @@ +python_sources() diff --git a/llama-index-packs/llama-index-packs-raptor/llama_index/packs/raptor/__init__.py b/llama-index-packs/llama-index-packs-raptor/llama_index/packs/raptor/__init__.py new file mode 100644 index 0000000000000..7bc9f986b42d1 --- /dev/null +++ b/llama-index-packs/llama-index-packs-raptor/llama_index/packs/raptor/__init__.py @@ -0,0 +1,4 @@ +from llama_index.packs.raptor.base import RaptorPack, RaptorRetriever + + +__all__ = ["RaptorPack", "RaptorRetriever"] diff --git a/llama-index-packs/llama-index-packs-raptor/llama_index/packs/raptor/base.py 
b/llama-index-packs/llama-index-packs-raptor/llama_index/packs/raptor/base.py new file mode 100644 index 0000000000000..89a539ee07aa8 --- /dev/null +++ b/llama-index-packs/llama-index-packs-raptor/llama_index/packs/raptor/base.py @@ -0,0 +1,366 @@ +from typing import Any, Dict, List, Optional + +import asyncio +from enum import Enum + +from llama_index.core import ( + StorageContext, + VectorStoreIndex, + get_response_synthesizer, + load_index_from_storage, +) +from llama_index.core.base.response.schema import Response +from llama_index.core.base.base_retriever import BaseRetriever, QueryType +from llama_index.core.bridge.pydantic import BaseModel, Field +from llama_index.core.embeddings import BaseEmbedding +from llama_index.core.ingestion import run_transformations +from llama_index.core.llama_pack.base import BaseLlamaPack +from llama_index.core.llms.llm import LLM +from llama_index.core.response_synthesizers import BaseSynthesizer +from llama_index.core.schema import ( + BaseNode, + NodeWithScore, + QueryBundle, + TextNode, + TransformComponent, +) +from llama_index.core.vector_stores.types import ( + MetadataFilter, + MetadataFilters, + VectorStore, +) +from llama_index.packs.raptor.clustering import get_clusters + + +DEFAULT_SUMMARY_PROMPT = ( + "Summarize the provided text, including as many key details as needed." +) + + +class QueryModes(str, Enum): + """Query modes.""" + + tree_traversal = "tree_traversal" + collapsed = "collapsed" + + +class SummaryModule(BaseModel): + response_synthesizer: BaseSynthesizer = Field(description="LLM") + summary_prompt: str = Field( + default=DEFAULT_SUMMARY_PROMPT, + description="Summary prompt.", + ) + num_workers: int = Field( + default=4, description="Number of workers to generate summaries." 
class RaptorRetriever(BaseRetriever):
    """Retriever that builds and queries a multi-level tree of cluster summaries.

    Inserted documents are embedded, clustered and summarised once per tree
    level. Clustered nodes are tagged with a ``parent_id`` metadata entry that
    points at their summary node, and summary nodes are tagged with a ``level``
    metadata entry. Everything is stored in one vector index, which can then be
    queried as a flat pool (``"collapsed"``) or level by level
    (``"tree_traversal"``).
    """

    def __init__(
        self,
        documents: List[BaseNode],
        tree_depth: int = 3,
        similarity_top_k: int = 2,
        llm: Optional[LLM] = None,
        embed_model: Optional[BaseEmbedding] = None,
        vector_store: Optional[VectorStore] = None,
        transformations: Optional[List[TransformComponent]] = None,
        summary_module: Optional[SummaryModule] = None,
        existing_index: Optional[VectorStoreIndex] = None,
        mode: QueryModes = "collapsed",
        **kwargs: Any,
    ) -> None:
        """Create the retriever and index ``documents`` if any are given.

        Args:
            documents (List[BaseNode]): Documents to insert right away; may be empty.
            tree_depth (int): Number of summarisation levels built by ``insert``.
            similarity_top_k (int): Top-k used for every retrieval call.
            llm (Optional[LLM]): LLM handed to the default ``SummaryModule``.
            embed_model (Optional[BaseEmbedding]): Embedding model for a newly created index.
            vector_store (Optional[VectorStore]): Vector store for a newly created index.
            transformations (Optional[List[TransformComponent]]): Transformations for a newly created index.
            summary_module (Optional[SummaryModule]): Custom summariser; built from ``llm`` when omitted.
            existing_index (Optional[VectorStoreIndex]): Index to reuse instead of creating one.
            mode (QueryModes): Default retrieval mode.
            **kwargs (Any): Forwarded to ``BaseRetriever.__init__``.
        """
        super().__init__(
            **kwargs,
        )

        self.mode = mode
        self.summary_module = summary_module or SummaryModule(llm=llm)
        self.index = existing_index or VectorStoreIndex(
            nodes=[],
            storage_context=StorageContext.from_defaults(vector_store=vector_store),
            embed_model=embed_model,
            transformations=transformations,
        )
        self.tree_depth = tree_depth
        self.similarity_top_k = similarity_top_k

        if len(documents) > 0:
            # NOTE: asyncio.run() raises RuntimeError when called from a thread
            # that already has a running event loop.
            asyncio.run(self.insert(documents))

    def _get_embeddings_per_level(self, level: int = 0) -> List[BaseNode]:
        """Retrieve the nodes stored in the index for one tree level.

        Args:
            level (int, optional): Value of the ``level`` metadata to match. Defaults to 0.

        Returns:
            List[BaseNode]: Nodes whose ``level`` metadata matches. Despite the
                method's name, nodes (not raw embedding vectors) are returned.
        """
        # keyword arguments, consistent with every other MetadataFilter in this class
        filters = MetadataFilters(filters=[MetadataFilter(key="level", value=level)])

        # kind of janky, but should work with any vector index
        source_nodes = self.index.as_retriever(
            similarity_top_k=10000, filters=filters
        ).retrieve("retrieve")

        return [x.node for x in source_nodes]

    async def insert(self, documents: List[BaseNode]) -> None:
        """Insert documents plus ``tree_depth`` levels of cluster summaries.

        For every level the current nodes are embedded, clustered and
        summarised. The clustered nodes are written to the index with their
        embedding and the id of their summary as ``parent_id``; the summaries
        become the nodes of the next level. The summaries of the last level are
        inserted at the end.

        Args:
            documents (List[BaseNode]): List of Documents
        """
        embed_model = self.index._embed_model
        transformations = self.index._transformations

        cur_nodes = run_transformations(documents, transformations, in_place=False)
        if not cur_nodes:
            # clustering an empty node list fails, and there is nothing to index
            return

        for level in range(self.tree_depth):
            # get the embeddings for the current documents

            if self._verbose:
                print(f"Generating embeddings for level {level}.")

            embeddings = await embed_model.aget_text_embedding_batch(
                [node.get_content(metadata_mode="embed") for node in cur_nodes]
            )
            assert len(embeddings) == len(cur_nodes)
            id_to_embedding = {
                node.id_: embedding for node, embedding in zip(cur_nodes, embeddings)
            }

            if self._verbose:
                print(f"Performing clustering for level {level}.")

            # cluster the documents
            nodes_per_cluster = get_clusters(cur_nodes, id_to_embedding)

            if self._verbose:
                print(
                    f"Generating summaries for level {level} with {len(nodes_per_cluster)} clusters."
                )
            summaries_per_cluster = await self.summary_module.generate_summaries(
                nodes_per_cluster
            )

            if self._verbose:
                print(
                    f"Level {level} created summaries/clusters: {len(nodes_per_cluster)}"
                )

            # replace the current nodes with their summaries
            new_nodes = [
                TextNode(
                    text=summary,
                    metadata={"level": level},
                    excluded_embed_metadata_keys=["level"],
                    excluded_llm_metadata_keys=["level"],
                )
                for summary in summaries_per_cluster
            ]

            # insert the nodes with their embeddings and parent_id
            nodes_with_embeddings = []
            for cluster, summary_doc in zip(nodes_per_cluster, new_nodes):
                for node in cluster:
                    node.metadata["parent_id"] = summary_doc.id_
                    # a node can be a member of several clusters; register the
                    # exclusion only once per list
                    for excluded_keys in (
                        node.excluded_embed_metadata_keys,
                        node.excluded_llm_metadata_keys,
                    ):
                        if "parent_id" not in excluded_keys:
                            excluded_keys.append("parent_id")
                    node.embedding = id_to_embedding[node.id_]
                    nodes_with_embeddings.append(node)

            self.index.insert_nodes(nodes_with_embeddings)

            # set the current nodes to the new nodes
            cur_nodes = new_nodes

        self.index.insert_nodes(cur_nodes)

    async def collapsed_retrieval(self, query_str: str) -> List[NodeWithScore]:
        """Query the index as a collapsed tree -- i.e. a single pool of nodes."""
        return await self.index.as_retriever(
            similarity_top_k=self.similarity_top_k
        ).aretrieve(query_str)

    async def tree_traversal_retrieval(self, query_str: str) -> List[NodeWithScore]:
        """Query the index as a tree, traversing the tree from the top down.

        For each level, starting at ``tree_depth - 1``, the top-k summary nodes
        of that level are retrieved and then, for each of them, the top-k nodes
        whose ``parent_id`` points at it. The children found for the lowest
        level are returned.

        A level that yields no summary nodes is skipped, so the loop always
        terminates.
        """
        nodes: List[NodeWithScore] = []
        for level in range(self.tree_depth - 1, -1, -1):
            # retrieve nodes at the current level
            nodes = await self.index.as_retriever(
                similarity_top_k=self.similarity_top_k,
                filters=MetadataFilters(
                    filters=[MetadataFilter(key="level", value=level)]
                ),
            ).aretrieve(query_str)

            parent_ids = [node.id_ for node in nodes]
            if self._verbose:
                print(f"Retrieved parent IDs from level {level}: {parent_ids!s}")

            if not parent_ids:
                # nothing stored at this level: move on to the next one
                continue

            # retrieve nodes that are children of the nodes at this level
            nested_nodes = await asyncio.gather(
                *[
                    self.index.as_retriever(
                        similarity_top_k=self.similarity_top_k,
                        filters=MetadataFilters(
                            filters=[MetadataFilter(key="parent_id", value=id_)]
                        ),
                    ).aretrieve(query_str)
                    for id_ in parent_ids
                ]
            )

            nodes = [node for nested in nested_nodes for node in nested]

            if self._verbose:
                print(f"Retrieved {len(nodes)} from parents at level {level}.")

        return nodes

    def _retrieve(self, query_bundle: QueryBundle) -> List[NodeWithScore]:
        """Retrieve nodes given query and mode.

        ``retrieve`` is overridden below, so this hook delegates to it in order
        to honour its declared return type.
        """
        return self.retrieve(query_bundle)

    def retrieve(
        self, query_str_or_bundle: QueryType, mode: Optional[QueryModes] = None
    ) -> List[NodeWithScore]:
        """Synchronous wrapper around ``aretrieve``.

        Args:
            query_str_or_bundle (QueryType): Query string or ``QueryBundle``.
            mode (Optional[QueryModes]): Overrides the retriever's default mode.

        Returns:
            List[NodeWithScore]: Retrieved nodes.
        """
        if isinstance(query_str_or_bundle, QueryBundle):
            query_str = query_str_or_bundle.query_str
        else:
            query_str = query_str_or_bundle

        return asyncio.run(self.aretrieve(query_str, mode or self.mode))

    async def aretrieve(
        self, query_str_or_bundle: QueryType, mode: Optional[QueryModes] = None
    ) -> List[NodeWithScore]:
        """Retrieve nodes given query and mode.

        Args:
            query_str_or_bundle (QueryType): Query string or ``QueryBundle``.
            mode (Optional[QueryModes]): Overrides the retriever's default mode.

        Returns:
            List[NodeWithScore]: Retrieved nodes.

        Raises:
            ValueError: If the mode is neither "tree_traversal" nor "collapsed".
        """
        if isinstance(query_str_or_bundle, QueryBundle):
            query_str = query_str_or_bundle.query_str
        else:
            query_str = query_str_or_bundle

        mode = mode or self.mode
        if mode == "tree_traversal":
            return await self.tree_traversal_retrieval(query_str)
        elif mode == "collapsed":
            return await self.collapsed_retrieval(query_str)
        else:
            raise ValueError(f"Invalid mode: {mode}")

    def persist(self, persist_dir: str) -> None:
        """Persist the index's storage context to ``persist_dir``."""
        self.index.storage_context.persist(persist_dir=persist_dir)

    @classmethod
    def from_persist_dir(
        cls,
        persist_dir: str,
        embed_model: Optional[BaseEmbedding] = None,
        **kwargs: Any,
    ) -> "RaptorRetriever":
        """Rebuild a retriever around an index loaded from ``persist_dir``.

        Args:
            persist_dir (str): Directory previously written by ``persist``.
            embed_model (Optional[BaseEmbedding]): Embedding model for the loaded index.
            **kwargs (Any): Forwarded to the constructor.

        Returns:
            RaptorRetriever: Retriever with no new documents inserted.
        """
        storage_context = StorageContext.from_defaults(persist_dir=persist_dir)
        return cls(
            [],
            existing_index=load_index_from_storage(
                storage_context, embed_model=embed_model
            ),
            **kwargs,
        )


class RaptorPack(BaseLlamaPack):
    """Raptor pack: a thin llama-pack wrapper around ``RaptorRetriever``."""

    def __init__(
        self,
        documents: List[BaseNode],
        llm: Optional[LLM] = None,
        embed_model: Optional[BaseEmbedding] = None,
        vector_store: Optional[VectorStore] = None,
        similarity_top_k: int = 2,
        mode: QueryModes = "collapsed",
        verbose: bool = True,
        **kwargs: Any,
    ) -> None:
        """Build the underlying retriever; all arguments are forwarded to it."""
        self.retriever = RaptorRetriever(
            documents,
            embed_model=embed_model,
            llm=llm,
            similarity_top_k=similarity_top_k,
            vector_store=vector_store,
            mode=mode,
            verbose=verbose,
            **kwargs,
        )

    def get_modules(self) -> Dict[str, Any]:
        """Get modules."""
        return {
            "retriever": self.retriever,
        }

    def run(
        self,
        query: str,
        mode: Optional[QueryModes] = None,
    ) -> Any:
        """Run the pipeline: retrieve nodes for ``query`` using ``mode``."""
        return self.retriever.retrieve(query, mode=mode)
# Set a random seed for reproducibility
RANDOM_SEED = 224
random.seed(RANDOM_SEED)


def global_cluster_embeddings(
    embeddings: np.ndarray,
    dim: int,
    n_neighbors: Optional[int] = None,
    metric: str = "cosine",
) -> np.ndarray:
    """Reduce all embeddings to ``dim`` dimensions with UMAP.

    Args:
        embeddings (np.ndarray): One embedding per row.
        dim (int): Target dimensionality.
        n_neighbors (Optional[int]): UMAP neighbourhood size. Defaults to the
            integer square root of ``len(embeddings) - 1``, but never below 2.
        metric (str): Distance metric handed to UMAP.

    Returns:
        np.ndarray: The reduced embeddings.
    """
    if n_neighbors is None:
        # UMAP rejects n_neighbors < 2, which the square-root heuristic would
        # produce for fewer than five points.
        n_neighbors = max(2, int((len(embeddings) - 1) ** 0.5))
    return umap.UMAP(
        n_neighbors=n_neighbors, n_components=dim, metric=metric
    ).fit_transform(embeddings)


def local_cluster_embeddings(
    embeddings: np.ndarray, dim: int, num_neighbors: int = 10, metric: str = "cosine"
) -> np.ndarray:
    """Reduce the embeddings of one global cluster to ``dim`` dimensions with UMAP.

    Args:
        embeddings (np.ndarray): One embedding per row.
        dim (int): Target dimensionality.
        num_neighbors (int): UMAP neighbourhood size.
        metric (str): Distance metric handed to UMAP.

    Returns:
        np.ndarray: The reduced embeddings.
    """
    return umap.UMAP(
        n_neighbors=num_neighbors, n_components=dim, metric=metric
    ).fit_transform(embeddings)


def get_optimal_clusters(
    embeddings: np.ndarray, max_clusters: int = 50, random_state: int = RANDOM_SEED
) -> int:
    """Pick the Gaussian-mixture component count with the lowest BIC.

    Candidate counts are ``1 .. min(max_clusters, len(embeddings)) - 1``.

    Args:
        embeddings (np.ndarray): One (reduced) embedding per row.
        max_clusters (int): Exclusive upper bound on the candidate counts.
        random_state (int): Seed for the Gaussian mixtures.

    Returns:
        int: The selected number of clusters; 1 when there is no candidate.
    """
    max_clusters = min(max_clusters, len(embeddings))
    candidates = np.arange(1, max_clusters)
    if len(candidates) == 0:
        # argmin over an empty list would raise
        return 1

    bics = []
    for n in candidates:
        gm = GaussianMixture(n_components=n, random_state=random_state)
        gm.fit(embeddings)
        bics.append(gm.bic(embeddings))
    return int(candidates[np.argmin(bics)])


def GMM_cluster(embeddings: np.ndarray, threshold: float, random_state: int = 0):
    """Soft-cluster embeddings with a Gaussian mixture.

    Args:
        embeddings (np.ndarray): One (reduced) embedding per row.
        threshold (float): A row is assigned to every component whose
            predicted probability exceeds this value.
        random_state (int): Seed for the Gaussian mixture.

    Returns:
        A ``(labels, n_clusters)`` pair: ``labels[i]`` is the array of
        component indices assigned to row ``i`` and ``n_clusters`` is the
        number of mixture components used.
    """
    n_clusters = get_optimal_clusters(embeddings)
    gm = GaussianMixture(n_components=n_clusters, random_state=random_state)
    gm.fit(embeddings)
    probs = gm.predict_proba(embeddings)
    labels = [np.where(prob > threshold)[0] for prob in probs]
    return labels, n_clusters


def perform_clustering(
    embeddings: np.ndarray,
    dim: int,
    threshold: float,
) -> List[np.ndarray]:
    """Cluster embeddings globally, then locally inside each global cluster.

    Args:
        embeddings (np.ndarray): One embedding per row.
        dim (int): Dimensionality used for the UMAP reductions.
        threshold (float): Membership probability threshold, see ``GMM_cluster``.

    Returns:
        List[np.ndarray]: For every row, the array of local-cluster labels it
            belongs to. Labels are numbered consecutively across global clusters.
    """
    n_points = len(embeddings)

    # If the number of embeddings is less than or equal to the dimension, return a list of zeros
    # This means all nodes are in the same cluster.
    # Otherwise, we will get an error when trying to cluster.
    if n_points <= dim + 1:
        return [np.array([0]) for _ in range(n_points)]

    reduced_embeddings_global = global_cluster_embeddings(embeddings, dim)
    global_clusters, n_global_clusters = GMM_cluster(
        reduced_embeddings_global, threshold
    )

    all_local_clusters = [np.array([]) for _ in range(n_points)]
    total_clusters = 0

    for i in range(n_global_clusters):
        # Track members by row index so that identical embeddings are never
        # confused with one another when mapping labels back to rows.
        global_idx = np.flatnonzero([i in gc for gc in global_clusters])
        if len(global_idx) == 0:
            continue

        global_cluster_embeddings_ = embeddings[global_idx]
        if len(global_cluster_embeddings_) <= dim + 1:
            local_clusters = [np.array([0]) for _ in global_cluster_embeddings_]
            n_local_clusters = 1
        else:
            reduced_embeddings_local = local_cluster_embeddings(
                global_cluster_embeddings_, dim
            )
            local_clusters, n_local_clusters = GMM_cluster(
                reduced_embeddings_local, threshold
            )

        for j in range(n_local_clusters):
            in_local = np.array([j in lc for lc in local_clusters], dtype=bool)
            for idx in global_idx[in_local]:
                all_local_clusters[idx] = np.append(
                    all_local_clusters[idx], j + total_clusters
                )

        total_clusters += n_local_clusters

    return all_local_clusters


def get_clusters(
    nodes: List["BaseNode"],
    embedding_map: Dict[str, List[float]],
    max_length_in_cluster: int = 10000,  # 10k tokens max per cluster
    tokenizer: Optional["tiktoken.Encoding"] = None,
    reduction_dimension: int = 10,
    threshold: float = 0.1,
) -> List[List["BaseNode"]]:
    """Group nodes into clusters, re-clustering clusters that are too long.

    Args:
        nodes (List[BaseNode]): Nodes to cluster.
        embedding_map (Dict[str, List[float]]): Embedding for every node id.
        max_length_in_cluster (int): Token budget per cluster; larger clusters
            are re-clustered recursively.
        tokenizer (Optional[tiktoken.Encoding]): Tokenizer used to measure
            cluster length. Defaults to the ``cl100k_base`` encoding, loaded on
            first use rather than at import time.
        reduction_dimension (int): Dimensionality used for the UMAP reductions.
        threshold (float): Membership probability threshold, see ``GMM_cluster``.

    Returns:
        List[List[BaseNode]]: The nodes of each cluster. A node may appear in
            more than one cluster.
    """
    if tokenizer is None:
        tokenizer = tiktoken.get_encoding("cl100k_base")

    # get embeddings
    embeddings = np.array([np.array(embedding_map[node.id_]) for node in nodes])

    # Perform the clustering
    clusters = perform_clustering(
        embeddings, dim=reduction_dimension, threshold=threshold
    )

    # Initialize an empty list to store the clusters of nodes
    node_clusters = []

    # Iterate over each unique label in the clusters
    for label in np.unique(np.concatenate(clusters)):
        # Get the indices of the nodes that belong to this cluster
        indices = [i for i, cluster in enumerate(clusters) if label in cluster]

        # Add the corresponding nodes to the node_clusters list
        cluster_nodes = [nodes[i] for i in indices]

        # Base case: if the cluster only has one node, do not attempt to recluster it
        if len(cluster_nodes) == 1:
            node_clusters.append(cluster_nodes)
            continue

        # Calculate the total length of the text in the nodes
        total_length = sum(len(tokenizer.encode(node.text)) for node in cluster_nodes)

        # Recluster only when that can make progress: if the cluster still holds
        # every input node, recursing would repeat this exact call forever.
        too_long = total_length > max_length_in_cluster
        if too_long and len(cluster_nodes) < len(nodes):
            node_clusters.extend(
                get_clusters(
                    cluster_nodes,
                    embedding_map,
                    max_length_in_cluster=max_length_in_cluster,
                    tokenizer=tokenizer,
                    reduction_dimension=reduction_dimension,
                    threshold=threshold,
                )
            )
        else:
            node_clusters.append(cluster_nodes)

    return node_clusters
"*.csv,*.html,*.json,*.jsonl,*.pdf,*.txt,*.ipynb" + +[tool.llamahub] +contains_example = true +import_path = "llama_index.packs.raptor" + +[tool.llamahub.class_authors] +RaptorPack = "logan-markewich" + +[tool.mypy] +disallow_untyped_defs = true +# Remove venv skip when integrated with pre-commit +exclude = ["_static", "build", "examples", "notebooks", "venv"] +ignore_missing_imports = true +python_version = "3.8" + +[tool.poetry] +authors = ["Logan Markewich "] +description = "llama-index packs raptor integration" +keywords = ["cluster", "raptor", "retrieval"] +license = "MIT" +name = "llama-index-packs-raptor" +packages = [{include = "llama_index/"}] +readme = "README.md" +version = "0.1.1" + +[tool.poetry.dependencies] +python = ">=3.9,<4.0" +llama-index-core = "^0.10.0" +llama-index-llms-openai = "^0.1.6" +umap-learn = ">=0.5.5" +scikit-learn = "*" + +[tool.poetry.group.dev.dependencies] +black = {extras = ["jupyter"], version = "<=23.9.1,>=23.7.0"} +codespell = {extras = ["toml"], version = ">=v2.2.6"} +ipython = "8.10.0" +jupyter = "^1.0.0" +mypy = "0.991" +pre-commit = "3.2.0" +pylint = "2.15.10" +pytest = "7.2.1" +pytest-mock = "3.11.1" +ruff = "0.0.292" +tree-sitter-languages = "^1.8.0" +types-Deprecated = ">=0.1.0" +types-PyYAML = "^6.0.12.12" +types-protobuf = "^4.24.0.4" +types-redis = "4.5.5.0" +types-requests = "2.28.11.8" # TODO: unpin when mypy>0.991 +types-setuptools = "67.1.0.0" diff --git a/llama-index-packs/llama-index-packs-raptor/tests/BUILD b/llama-index-packs/llama-index-packs-raptor/tests/BUILD new file mode 100644 index 0000000000000..dabf212d7e716 --- /dev/null +++ b/llama-index-packs/llama-index-packs-raptor/tests/BUILD @@ -0,0 +1 @@ +python_tests() diff --git a/llama-index-packs/llama-index-packs-raptor/tests/__init__.py b/llama-index-packs/llama-index-packs-raptor/tests/__init__.py new file mode 100644 index 0000000000000..e69de29bb2d1d diff --git a/llama-index-packs/llama-index-packs-raptor/tests/test_packs_raptor.py 
def test_raptor() -> None:
    """Build a retriever over ten one-word documents and query it in both modes."""
    words = [
        "one",
        "two",
        "three",
        "four",
        "five",
        "six",
        "seven",
        "eight",
        "nine",
        "ten",
    ]
    documents = [Document(text=word) for word in words]

    retriever = RaptorRetriever(
        documents,
        embed_model=MockEmbedding(embed_dim=1536),
        llm=MockLLM(),
    )

    # ten documents plus one summary node per tree level
    stored_docs = retriever.index.docstore.docs
    assert len(stored_docs) == 13

    collapsed_nodes = retriever.retrieve("test", mode="collapsed")
    assert len(collapsed_nodes) == 2

    traversal_nodes = retriever.retrieve("text", mode="tree_traversal")
    assert len(traversal_nodes) == 2
a/llama-index-packs/llama-index-packs-retry-engine-weaviate/README.md +++ b/llama-index-packs/llama-index-packs-retry-engine-weaviate/README.md @@ -31,7 +31,7 @@ Then, you can set up the pack like so: ```python # setup pack arguments -from llama_index.core.vector_stores.types import MetadataInfo, VectorStoreInfo +from llama_index.core.vector_stores import MetadataInfo, VectorStoreInfo vector_store_info = VectorStoreInfo( content_info="brief biography of celebrities", diff --git a/llama-index-packs/llama-index-packs-self-discover/README.md b/llama-index-packs/llama-index-packs-self-discover/README.md index b7b923ca17238..51ce36fc26b2d 100644 --- a/llama-index-packs/llama-index-packs-self-discover/README.md +++ b/llama-index-packs/llama-index-packs-self-discover/README.md @@ -36,7 +36,7 @@ There are two ways using LlamaPack: ### Using `download_llama_pack` ```python -from llama_index.llama_pack import download_llama_pack +from llama_index.core.llama_pack import download_llama_pack # download and install dependencies SelfDiscoverPack = download_llama_pack( diff --git a/llama-index-packs/llama-index-packs-self-rag/README.md b/llama-index-packs/llama-index-packs-self-rag/README.md index 56bf4cec94b54..5caf1f240c704 100644 --- a/llama-index-packs/llama-index-packs-self-rag/README.md +++ b/llama-index-packs/llama-index-packs-self-rag/README.md @@ -28,7 +28,7 @@ huggingface-cli download m4r1/selfrag_llama2_7b-GGUF selfrag_llama2_7b.q4_k_m.gg ``` ```python -from llama_index.llama_pack import download_llama_pack +from llama_index.core.llama_pack import download_llama_pack # download and install dependencies SelfRAGPack = download_llama_pack("SelfRAGPack", "./self_rag_pack") diff --git a/llama-index-packs/llama-index-packs-sub-question-weaviate/README.md b/llama-index-packs/llama-index-packs-sub-question-weaviate/README.md index 0ef0cdfb83171..5d258b12f1ad7 100644 --- a/llama-index-packs/llama-index-packs-sub-question-weaviate/README.md +++ 
b/llama-index-packs/llama-index-packs-sub-question-weaviate/README.md @@ -31,7 +31,7 @@ Then, you can set up the pack like so: ```python # setup pack arguments -from llama_index.core.vector_stores.types import MetadataInfo, VectorStoreInfo +from llama_index.core.vector_stores import MetadataInfo, VectorStoreInfo vector_store_info = VectorStoreInfo( content_info="brief biography of celebrities", diff --git a/llama-index-packs/llama-index-packs-timescale-vector-autoretrieval/README.md b/llama-index-packs/llama-index-packs-timescale-vector-autoretrieval/README.md index a9204d506b642..56a07d28ee741 100644 --- a/llama-index-packs/llama-index-packs-timescale-vector-autoretrieval/README.md +++ b/llama-index-packs/llama-index-packs-timescale-vector-autoretrieval/README.md @@ -51,7 +51,7 @@ You can then inspect the files at `./tsv_pack` and use them as a template for yo You can download the pack to a the `./tsv_pack` directory: ```python -from llama_hub.llama_pack import download_llama_pack +from llama_index.core.llama_pack import download_llama_pack # download and install dependencies TimescaleVectorAutoretrievalPack = download_llama_pack( @@ -65,7 +65,7 @@ Then, you can set up the pack like so: ```python # setup pack arguments -from llama_index.core.vector_stores.types import MetadataInfo, VectorStoreInfo +from llama_index.core.vector_stores import MetadataInfo, VectorStoreInfo from timescale_vector import client from dotenv import load_dotenv, find_dotenv import os diff --git a/llama-index-packs/llama-index-packs-vanna/README.md b/llama-index-packs/llama-index-packs-vanna/README.md index d4b42ec9cc5d3..42fde06f552d0 100644 --- a/llama-index-packs/llama-index-packs-vanna/README.md +++ b/llama-index-packs/llama-index-packs-vanna/README.md @@ -24,7 +24,7 @@ You can then inspect the files at `./vanna_pack` and use them as a template for You can download the pack to a `./vanna_pack` directory: ```python -from llama_index.llama_pack import download_llama_pack +from 
llama_index.core.llama_pack import download_llama_pack # download and install dependencies VannaPack = download_llama_pack("VannaPack", "./vanna_pack") diff --git a/poetry.lock b/poetry.lock index cdf83badcd93f..063032b09a51d 100644 --- a/poetry.lock +++ b/poetry.lock @@ -423,18 +423,18 @@ beautifulsoup4 = "*" [[package]] name = "build" -version = "1.0.3" +version = "1.1.1" description = "A simple, correct Python build frontend" optional = false python-versions = ">= 3.7" files = [ - {file = "build-1.0.3-py3-none-any.whl", hash = "sha256:589bf99a67df7c9cf07ec0ac0e5e2ea5d4b37ac63301c4986d1acb126aa83f8f"}, - {file = "build-1.0.3.tar.gz", hash = "sha256:538aab1b64f9828977f84bc63ae570b060a8ed1be419e7870b8b4fc5e6ea553b"}, + {file = "build-1.1.1-py3-none-any.whl", hash = "sha256:8ed0851ee76e6e38adce47e4bee3b51c771d86c64cf578d0c2245567ee200e73"}, + {file = "build-1.1.1.tar.gz", hash = "sha256:8eea65bb45b1aac2e734ba2cc8dad3a6d97d97901a395bd0ed3e7b46953d2a31"}, ] [package.dependencies] colorama = {version = "*", markers = "os_name == \"nt\""} -importlib-metadata = {version = ">=4.6", markers = "python_version < \"3.10\""} +importlib-metadata = {version = ">=4.6", markers = "python_full_version < \"3.10.2\""} packaging = ">=19.0" pyproject_hooks = "*" tomli = {version = ">=1.1.0", markers = "python_version < \"3.11\""} @@ -1254,13 +1254,13 @@ grpc = ["grpcio (>=1.44.0,<2.0.0.dev0)"] [[package]] name = "graphlib-backport" -version = "1.0.3" +version = "1.1.0" description = "Backport of the Python 3.9 graphlib module for Python 3.6+" optional = false python-versions = ">=3.6,<4.0" files = [ - {file = "graphlib_backport-1.0.3-py3-none-any.whl", hash = "sha256:24246967b9e7e6a91550bc770e6169585d35aa32790258579a8a3899a8c18fde"}, - {file = "graphlib_backport-1.0.3.tar.gz", hash = "sha256:7bb8fc7757b8ae4e6d8000a26cd49e9232aaa9a3aa57edb478474b8424bfaae2"}, + {file = "graphlib_backport-1.1.0-py3-none-any.whl", hash = 
"sha256:eccacf9f2126cdf89ce32a6018c88e1ecd3e4898a07568add6e1907a439055ba"}, + {file = "graphlib_backport-1.1.0.tar.gz", hash = "sha256:00a7888b21e5393064a133209cb5d3b3ef0a2096cf023914c9d778dff5644125"}, ] [[package]] @@ -1506,13 +1506,13 @@ socks = ["socksio (==1.*)"] [[package]] name = "huggingface-hub" -version = "0.21.2" +version = "0.21.3" description = "Client library to download and publish models, datasets and other repos on the huggingface.co hub" optional = false python-versions = ">=3.8.0" files = [ - {file = "huggingface_hub-0.21.2-py3-none-any.whl", hash = "sha256:16955c2b60bcff32a0778f84b9e9ae8f61d7f003da6aa1fbb7bc897a0c37b28c"}, - {file = "huggingface_hub-0.21.2.tar.gz", hash = "sha256:839f2fc69fc51797b76dcffa7edbf7fb1150176f74cb1dc2d87ca00e5e0b5611"}, + {file = "huggingface_hub-0.21.3-py3-none-any.whl", hash = "sha256:b183144336fdf2810a8c109822e0bb6ef1fd61c65da6fb60e8c3f658b7144016"}, + {file = "huggingface_hub-0.21.3.tar.gz", hash = "sha256:26a15b604e4fc7bad37c467b76456543ec849386cbca9cd7e1e135f53e500423"}, ] [package.dependencies] @@ -1969,13 +1969,13 @@ llama-index-llms-openai = ">=0.1.5,<0.2.0" [[package]] name = "llama-index-cli" -version = "0.1.5" +version = "0.1.7" description = "llama-index cli" optional = false python-versions = ">=3.8.1,<4.0" files = [ - {file = "llama_index_cli-0.1.5-py3-none-any.whl", hash = "sha256:a0fcfc3239d8b05158558423ca5c1a426d2a455eab44128b2b786cab566f74ad"}, - {file = "llama_index_cli-0.1.5.tar.gz", hash = "sha256:e2493ff7ecfd1983fd15c28c6c0c7bfdba66662c1d8960f6aea229db3d7fafda"}, + {file = "llama_index_cli-0.1.7-py3-none-any.whl", hash = "sha256:48a81fc33d4005dbe91b77ebe840ac69e0102e7e2a59770308f94fae1b792544"}, + {file = "llama_index_cli-0.1.7.tar.gz", hash = "sha256:55a77e3c370eb760c42cb74a0df6f650e41ec17928b72b07ff8b927cb94b15b4"}, ] [package.dependencies] @@ -1986,16 +1986,46 @@ llama-index-vector-stores-chroma = ">=0.1.1,<0.2.0" [[package]] name = "llama-index-core" -version = "0.10.14" +version = "0.10.16" 
description = "Interface between LLMs and your data" optional = false -python-versions = "*" -files = [] -develop = true +python-versions = ">=3.8.1,<4.0" +files = [ + {file = "llama_index_core-0.10.16-py3-none-any.whl", hash = "sha256:189c808b9c92d871b4c27f78e71186f5edbe202c9fafa28ff4e276197c1a05ff"}, + {file = "llama_index_core-0.10.16.tar.gz", hash = "sha256:a20b246b75e2e5b2dd679953fcede921e8b9896f06e61f473a31ee96d24cd446"}, +] -[package.source] -type = "directory" -url = "llama-index-core" +[package.dependencies] +aiohttp = ">=3.8.6,<4.0.0" +dataclasses-json = "*" +deprecated = ">=1.2.9.3" +dirtyjson = ">=1.0.8,<2.0.0" +fsspec = ">=2023.5.0" +httpx = "*" +llamaindex-py-client = ">=0.1.13,<0.2.0" +nest-asyncio = ">=1.5.8,<2.0.0" +networkx = ">=3.0" +nltk = ">=3.8.1,<4.0.0" +numpy = "*" +openai = ">=1.1.0" +pandas = "*" +pillow = ">=9.0.0" +PyYAML = ">=6.0.1" +requests = ">=2.31.0" +SQLAlchemy = {version = ">=1.4.49", extras = ["asyncio"]} +tenacity = ">=8.2.0,<9.0.0" +tiktoken = ">=0.3.3" +tqdm = ">=4.66.1,<5.0.0" +typing-extensions = ">=4.5.0" +typing-inspect = ">=0.8.0" + +[package.extras] +gradientai = ["gradientai (>=1.4.0)"] +html = ["beautifulsoup4 (>=4.12.2,<5.0.0)"] +langchain = ["langchain (>=0.0.303)"] +local-models = ["optimum[onnxruntime] (>=1.13.2,<2.0.0)", "sentencepiece (>=0.1.99,<0.2.0)", "transformers[torch] (>=4.33.1,<5.0.0)"] +postgres = ["asyncpg (>=0.28.0,<0.29.0)", "pgvector (>=0.1.0,<0.2.0)", "psycopg2-binary (>=2.9.9,<3.0.0)"] +query-tools = ["guidance (>=0.0.64,<0.0.65)", "jsonpath-ng (>=1.6.0,<2.0.0)", "lm-format-enforcer (>=0.4.3,<0.5.0)", "rank-bm25 (>=0.2.2,<0.3.0)", "scikit-learn", "spacy (>=3.7.1,<4.0.0)"] [[package]] name = "llama-index-embeddings-openai" @@ -2067,13 +2097,13 @@ query-tools = ["guidance (>=0.0.64,<0.0.65)", "jsonpath-ng (>=1.6.0,<2.0.0)", "l [[package]] name = "llama-index-llms-openai" -version = "0.1.6" +version = "0.1.7" description = "llama-index llms openai integration" optional = false python-versions = 
">=3.8.1,<4.0" files = [ - {file = "llama_index_llms_openai-0.1.6-py3-none-any.whl", hash = "sha256:4260ad31c3444e97ec8a8d061cb6dbf1074262b82341a2b69d2b27e8a23efe62"}, - {file = "llama_index_llms_openai-0.1.6.tar.gz", hash = "sha256:15530dfa3893b15c5576ebc71e01b77acbf47abd689219436fdf7b6ca567a9fd"}, + {file = "llama_index_llms_openai-0.1.7-py3-none-any.whl", hash = "sha256:162a7f1064b389d0db6f731bcedaca80e87ceca8aa919d7425ca32107e756243"}, + {file = "llama_index_llms_openai-0.1.7.tar.gz", hash = "sha256:5ddb405c0a5847a7c2098a70ced270555f036c2793412a8992456bd32f83ff0f"}, ] [package.dependencies] @@ -2128,13 +2158,13 @@ llama-index-program-openai = ">=0.1.1,<0.2.0" [[package]] name = "llama-index-readers-file" -version = "0.1.6" +version = "0.1.7" description = "llama-index readers file integration" optional = false python-versions = ">=3.8.1,<4.0" files = [ - {file = "llama_index_readers_file-0.1.6-py3-none-any.whl", hash = "sha256:f583bd90353a0c0985213af02c97aa2f2f22e702d4311fe719de91382c9ad8dd"}, - {file = "llama_index_readers_file-0.1.6.tar.gz", hash = "sha256:d9fc0ca84926d04bd757c57fe87841cd9dbc2606aab5f2ce927deec14aaa1a74"}, + {file = "llama_index_readers_file-0.1.7-py3-none-any.whl", hash = "sha256:46cf03a141b3fa5fd50c81fa607e9de3060aa67ab9a79dd64bea18962776d2de"}, + {file = "llama_index_readers_file-0.1.7.tar.gz", hash = "sha256:63827ab51e8f66d97f08e1a20be67f86b92484ae120253b5f756fef2371d61bf"}, ] [package.dependencies] @@ -2178,13 +2208,13 @@ tokenizers = ">=0.15.1,<0.16.0" [[package]] name = "llama-parse" -version = "0.3.4" +version = "0.3.5" description = "Parse files into RAG-Optimized formats." 
optional = false python-versions = ">=3.8.1,<4.0" files = [ - {file = "llama_parse-0.3.4-py3-none-any.whl", hash = "sha256:b667c78d4c32fc5d0561e6e3ca6c53648a6701b436f21d0d252cd46774927660"}, - {file = "llama_parse-0.3.4.tar.gz", hash = "sha256:5a30569c390ab9089dad66cf2a8c967f8c21d77641deec0a922672df4e16cfa3"}, + {file = "llama_parse-0.3.5-py3-none-any.whl", hash = "sha256:8e6e7a0986ad30cb82c5c67a29b7e2c3892620dd2a422afc909654a9d0f1c82c"}, + {file = "llama_parse-0.3.5.tar.gz", hash = "sha256:736a80e4fc5970b9cbef1048171908021ebd26be43f07b806889f0d1bb3875fe"}, ] [package.dependencies] @@ -2315,13 +2345,13 @@ files = [ [[package]] name = "marshmallow" -version = "3.21.0" +version = "3.21.1" description = "A lightweight library for converting complex datatypes to and from native Python datatypes." optional = false python-versions = ">=3.8" files = [ - {file = "marshmallow-3.21.0-py3-none-any.whl", hash = "sha256:e7997f83571c7fd476042c2c188e4ee8a78900ca5e74bd9c8097afa56624e9bd"}, - {file = "marshmallow-3.21.0.tar.gz", hash = "sha256:20f53be28c6e374a711a16165fb22a8dc6003e3f7cda1285e3ca777b9193885b"}, + {file = "marshmallow-3.21.1-py3-none-any.whl", hash = "sha256:f085493f79efb0644f270a9bf2892843142d80d7174bbbd2f3713f2a589dc633"}, + {file = "marshmallow-3.21.1.tar.gz", hash = "sha256:4e65e9e0d80fc9e609574b9983cf32579f305c718afb30d7233ab818571768c3"}, ] [package.dependencies] @@ -2940,13 +2970,13 @@ sympy = "*" [[package]] name = "openai" -version = "1.12.0" +version = "1.13.3" description = "The official Python library for the openai API" optional = false python-versions = ">=3.7.1" files = [ - {file = "openai-1.12.0-py3-none-any.whl", hash = "sha256:a54002c814e05222e413664f651b5916714e4700d041d5cf5724d3ae1a3e3481"}, - {file = "openai-1.12.0.tar.gz", hash = "sha256:99c5d257d09ea6533d689d1cc77caa0ac679fa21efef8893d8b0832a86877f1b"}, + {file = "openai-1.13.3-py3-none-any.whl", hash = "sha256:5769b62abd02f350a8dd1a3a242d8972c947860654466171d60fb0972ae0a41c"}, + {file = 
"openai-1.13.3.tar.gz", hash = "sha256:ff6c6b3bc7327e715e4b3592a923a5a1c7519ff5dd764a83d69f633d49e77a7b"}, ] [package.dependencies] @@ -3324,6 +3354,91 @@ files = [ {file = "pickleshare-0.7.5.tar.gz", hash = "sha256:87683d47965c1da65cdacaf31c8441d12b8044cdec9aca500cd78fc2c683afca"}, ] +[[package]] +name = "pillow" +version = "10.2.0" +description = "Python Imaging Library (Fork)" +optional = false +python-versions = ">=3.8" +files = [ + {file = "pillow-10.2.0-cp310-cp310-macosx_10_10_x86_64.whl", hash = "sha256:7823bdd049099efa16e4246bdf15e5a13dbb18a51b68fa06d6c1d4d8b99a796e"}, + {file = "pillow-10.2.0-cp310-cp310-macosx_11_0_arm64.whl", hash = "sha256:83b2021f2ade7d1ed556bc50a399127d7fb245e725aa0113ebd05cfe88aaf588"}, + {file = "pillow-10.2.0-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:6fad5ff2f13d69b7e74ce5b4ecd12cc0ec530fcee76356cac6742785ff71c452"}, + {file = "pillow-10.2.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:da2b52b37dad6d9ec64e653637a096905b258d2fc2b984c41ae7d08b938a67e4"}, + {file = "pillow-10.2.0-cp310-cp310-manylinux_2_28_aarch64.whl", hash = "sha256:47c0995fc4e7f79b5cfcab1fc437ff2890b770440f7696a3ba065ee0fd496563"}, + {file = "pillow-10.2.0-cp310-cp310-manylinux_2_28_x86_64.whl", hash = "sha256:322bdf3c9b556e9ffb18f93462e5f749d3444ce081290352c6070d014c93feb2"}, + {file = "pillow-10.2.0-cp310-cp310-musllinux_1_1_aarch64.whl", hash = "sha256:51f1a1bffc50e2e9492e87d8e09a17c5eea8409cda8d3f277eb6edc82813c17c"}, + {file = "pillow-10.2.0-cp310-cp310-musllinux_1_1_x86_64.whl", hash = "sha256:69ffdd6120a4737710a9eee73e1d2e37db89b620f702754b8f6e62594471dee0"}, + {file = "pillow-10.2.0-cp310-cp310-win32.whl", hash = "sha256:c6dafac9e0f2b3c78df97e79af707cdc5ef8e88208d686a4847bab8266870023"}, + {file = "pillow-10.2.0-cp310-cp310-win_amd64.whl", hash = "sha256:aebb6044806f2e16ecc07b2a2637ee1ef67a11840a66752751714a0d924adf72"}, + {file = "pillow-10.2.0-cp310-cp310-win_arm64.whl", hash = 
"sha256:7049e301399273a0136ff39b84c3678e314f2158f50f517bc50285fb5ec847ad"}, + {file = "pillow-10.2.0-cp311-cp311-macosx_10_10_x86_64.whl", hash = "sha256:35bb52c37f256f662abdfa49d2dfa6ce5d93281d323a9af377a120e89a9eafb5"}, + {file = "pillow-10.2.0-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:9c23f307202661071d94b5e384e1e1dc7dfb972a28a2310e4ee16103e66ddb67"}, + {file = "pillow-10.2.0-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:773efe0603db30c281521a7c0214cad7836c03b8ccff897beae9b47c0b657d61"}, + {file = "pillow-10.2.0-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:11fa2e5984b949b0dd6d7a94d967743d87c577ff0b83392f17cb3990d0d2fd6e"}, + {file = "pillow-10.2.0-cp311-cp311-manylinux_2_28_aarch64.whl", hash = "sha256:716d30ed977be8b37d3ef185fecb9e5a1d62d110dfbdcd1e2a122ab46fddb03f"}, + {file = "pillow-10.2.0-cp311-cp311-manylinux_2_28_x86_64.whl", hash = "sha256:a086c2af425c5f62a65e12fbf385f7c9fcb8f107d0849dba5839461a129cf311"}, + {file = "pillow-10.2.0-cp311-cp311-musllinux_1_1_aarch64.whl", hash = "sha256:c8de2789052ed501dd829e9cae8d3dcce7acb4777ea4a479c14521c942d395b1"}, + {file = "pillow-10.2.0-cp311-cp311-musllinux_1_1_x86_64.whl", hash = "sha256:609448742444d9290fd687940ac0b57fb35e6fd92bdb65386e08e99af60bf757"}, + {file = "pillow-10.2.0-cp311-cp311-win32.whl", hash = "sha256:823ef7a27cf86df6597fa0671066c1b596f69eba53efa3d1e1cb8b30f3533068"}, + {file = "pillow-10.2.0-cp311-cp311-win_amd64.whl", hash = "sha256:1da3b2703afd040cf65ec97efea81cfba59cdbed9c11d8efc5ab09df9509fc56"}, + {file = "pillow-10.2.0-cp311-cp311-win_arm64.whl", hash = "sha256:edca80cbfb2b68d7b56930b84a0e45ae1694aeba0541f798e908a49d66b837f1"}, + {file = "pillow-10.2.0-cp312-cp312-macosx_10_10_x86_64.whl", hash = "sha256:1b5e1b74d1bd1b78bc3477528919414874748dd363e6272efd5abf7654e68bef"}, + {file = "pillow-10.2.0-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:0eae2073305f451d8ecacb5474997c08569fb4eb4ac231ffa4ad7d342fdc25ac"}, + {file 
= "pillow-10.2.0-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:b7c2286c23cd350b80d2fc9d424fc797575fb16f854b831d16fd47ceec078f2c"}, + {file = "pillow-10.2.0-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:1e23412b5c41e58cec602f1135c57dfcf15482013ce6e5f093a86db69646a5aa"}, + {file = "pillow-10.2.0-cp312-cp312-manylinux_2_28_aarch64.whl", hash = "sha256:52a50aa3fb3acb9cf7213573ef55d31d6eca37f5709c69e6858fe3bc04a5c2a2"}, + {file = "pillow-10.2.0-cp312-cp312-manylinux_2_28_x86_64.whl", hash = "sha256:127cee571038f252a552760076407f9cff79761c3d436a12af6000cd182a9d04"}, + {file = "pillow-10.2.0-cp312-cp312-musllinux_1_1_aarch64.whl", hash = "sha256:8d12251f02d69d8310b046e82572ed486685c38f02176bd08baf216746eb947f"}, + {file = "pillow-10.2.0-cp312-cp312-musllinux_1_1_x86_64.whl", hash = "sha256:54f1852cd531aa981bc0965b7d609f5f6cc8ce8c41b1139f6ed6b3c54ab82bfb"}, + {file = "pillow-10.2.0-cp312-cp312-win32.whl", hash = "sha256:257d8788df5ca62c980314053197f4d46eefedf4e6175bc9412f14412ec4ea2f"}, + {file = "pillow-10.2.0-cp312-cp312-win_amd64.whl", hash = "sha256:154e939c5f0053a383de4fd3d3da48d9427a7e985f58af8e94d0b3c9fcfcf4f9"}, + {file = "pillow-10.2.0-cp312-cp312-win_arm64.whl", hash = "sha256:f379abd2f1e3dddb2b61bc67977a6b5a0a3f7485538bcc6f39ec76163891ee48"}, + {file = "pillow-10.2.0-cp38-cp38-macosx_10_10_x86_64.whl", hash = "sha256:8373c6c251f7ef8bda6675dd6d2b3a0fcc31edf1201266b5cf608b62a37407f9"}, + {file = "pillow-10.2.0-cp38-cp38-macosx_11_0_arm64.whl", hash = "sha256:870ea1ada0899fd0b79643990809323b389d4d1d46c192f97342eeb6ee0b8483"}, + {file = "pillow-10.2.0-cp38-cp38-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:b4b6b1e20608493548b1f32bce8cca185bf0480983890403d3b8753e44077129"}, + {file = "pillow-10.2.0-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:3031709084b6e7852d00479fd1d310b07d0ba82765f973b543c8af5061cf990e"}, + {file = 
"pillow-10.2.0-cp38-cp38-manylinux_2_28_aarch64.whl", hash = "sha256:3ff074fc97dd4e80543a3e91f69d58889baf2002b6be64347ea8cf5533188213"}, + {file = "pillow-10.2.0-cp38-cp38-manylinux_2_28_x86_64.whl", hash = "sha256:cb4c38abeef13c61d6916f264d4845fab99d7b711be96c326b84df9e3e0ff62d"}, + {file = "pillow-10.2.0-cp38-cp38-musllinux_1_1_aarch64.whl", hash = "sha256:b1b3020d90c2d8e1dae29cf3ce54f8094f7938460fb5ce8bc5c01450b01fbaf6"}, + {file = "pillow-10.2.0-cp38-cp38-musllinux_1_1_x86_64.whl", hash = "sha256:170aeb00224ab3dc54230c797f8404507240dd868cf52066f66a41b33169bdbe"}, + {file = "pillow-10.2.0-cp38-cp38-win32.whl", hash = "sha256:c4225f5220f46b2fde568c74fca27ae9771536c2e29d7c04f4fb62c83275ac4e"}, + {file = "pillow-10.2.0-cp38-cp38-win_amd64.whl", hash = "sha256:0689b5a8c5288bc0504d9fcee48f61a6a586b9b98514d7d29b840143d6734f39"}, + {file = "pillow-10.2.0-cp39-cp39-macosx_10_10_x86_64.whl", hash = "sha256:b792a349405fbc0163190fde0dc7b3fef3c9268292586cf5645598b48e63dc67"}, + {file = "pillow-10.2.0-cp39-cp39-macosx_11_0_arm64.whl", hash = "sha256:c570f24be1e468e3f0ce7ef56a89a60f0e05b30a3669a459e419c6eac2c35364"}, + {file = "pillow-10.2.0-cp39-cp39-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:d8ecd059fdaf60c1963c58ceb8997b32e9dc1b911f5da5307aab614f1ce5c2fb"}, + {file = "pillow-10.2.0-cp39-cp39-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:c365fd1703040de1ec284b176d6af5abe21b427cb3a5ff68e0759e1e313a5e7e"}, + {file = "pillow-10.2.0-cp39-cp39-manylinux_2_28_aarch64.whl", hash = "sha256:70c61d4c475835a19b3a5aa42492409878bbca7438554a1f89d20d58a7c75c01"}, + {file = "pillow-10.2.0-cp39-cp39-manylinux_2_28_x86_64.whl", hash = "sha256:b6f491cdf80ae540738859d9766783e3b3c8e5bd37f5dfa0b76abdecc5081f13"}, + {file = "pillow-10.2.0-cp39-cp39-musllinux_1_1_aarch64.whl", hash = "sha256:9d189550615b4948f45252d7f005e53c2040cea1af5b60d6f79491a6e147eef7"}, + {file = "pillow-10.2.0-cp39-cp39-musllinux_1_1_x86_64.whl", hash = 
"sha256:49d9ba1ed0ef3e061088cd1e7538a0759aab559e2e0a80a36f9fd9d8c0c21591"}, + {file = "pillow-10.2.0-cp39-cp39-win32.whl", hash = "sha256:babf5acfede515f176833ed6028754cbcd0d206f7f614ea3447d67c33be12516"}, + {file = "pillow-10.2.0-cp39-cp39-win_amd64.whl", hash = "sha256:0304004f8067386b477d20a518b50f3fa658a28d44e4116970abfcd94fac34a8"}, + {file = "pillow-10.2.0-cp39-cp39-win_arm64.whl", hash = "sha256:0fb3e7fc88a14eacd303e90481ad983fd5b69c761e9e6ef94c983f91025da869"}, + {file = "pillow-10.2.0-pp310-pypy310_pp73-macosx_10_10_x86_64.whl", hash = "sha256:322209c642aabdd6207517e9739c704dc9f9db943015535783239022002f054a"}, + {file = "pillow-10.2.0-pp310-pypy310_pp73-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:3eedd52442c0a5ff4f887fab0c1c0bb164d8635b32c894bc1faf4c618dd89df2"}, + {file = "pillow-10.2.0-pp310-pypy310_pp73-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:cb28c753fd5eb3dd859b4ee95de66cc62af91bcff5db5f2571d32a520baf1f04"}, + {file = "pillow-10.2.0-pp310-pypy310_pp73-manylinux_2_28_aarch64.whl", hash = "sha256:33870dc4653c5017bf4c8873e5488d8f8d5f8935e2f1fb9a2208c47cdd66efd2"}, + {file = "pillow-10.2.0-pp310-pypy310_pp73-manylinux_2_28_x86_64.whl", hash = "sha256:3c31822339516fb3c82d03f30e22b1d038da87ef27b6a78c9549888f8ceda39a"}, + {file = "pillow-10.2.0-pp310-pypy310_pp73-win_amd64.whl", hash = "sha256:a2b56ba36e05f973d450582fb015594aaa78834fefe8dfb8fcd79b93e64ba4c6"}, + {file = "pillow-10.2.0-pp38-pypy38_pp73-win_amd64.whl", hash = "sha256:d8e6aeb9201e655354b3ad049cb77d19813ad4ece0df1249d3c793de3774f8c7"}, + {file = "pillow-10.2.0-pp39-pypy39_pp73-macosx_10_10_x86_64.whl", hash = "sha256:2247178effb34a77c11c0e8ac355c7a741ceca0a732b27bf11e747bbc950722f"}, + {file = "pillow-10.2.0-pp39-pypy39_pp73-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:15587643b9e5eb26c48e49a7b33659790d28f190fc514a322d55da2fb5c2950e"}, + {file = "pillow-10.2.0-pp39-pypy39_pp73-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash 
= "sha256:753cd8f2086b2b80180d9b3010dd4ed147efc167c90d3bf593fe2af21265e5a5"}, + {file = "pillow-10.2.0-pp39-pypy39_pp73-manylinux_2_28_aarch64.whl", hash = "sha256:7c8f97e8e7a9009bcacbe3766a36175056c12f9a44e6e6f2d5caad06dcfbf03b"}, + {file = "pillow-10.2.0-pp39-pypy39_pp73-manylinux_2_28_x86_64.whl", hash = "sha256:d1b35bcd6c5543b9cb547dee3150c93008f8dd0f1fef78fc0cd2b141c5baf58a"}, + {file = "pillow-10.2.0-pp39-pypy39_pp73-win_amd64.whl", hash = "sha256:fe4c15f6c9285dc54ce6553a3ce908ed37c8f3825b5a51a15c91442bb955b868"}, + {file = "pillow-10.2.0.tar.gz", hash = "sha256:e87f0b2c78157e12d7686b27d63c070fd65d994e8ddae6f328e0dcf4a0cd007e"}, +] + +[package.extras] +docs = ["furo", "olefile", "sphinx (>=2.4)", "sphinx-copybutton", "sphinx-inline-tabs", "sphinx-removed-in", "sphinxext-opengraph"] +fpx = ["olefile"] +mic = ["olefile"] +tests = ["check-manifest", "coverage", "defusedxml", "markdown2", "olefile", "packaging", "pyroma", "pytest", "pytest-cov", "pytest-timeout"] +typing = ["typing-extensions"] +xmp = ["defusedxml"] + [[package]] name = "pkgutil-resolve-name" version = "1.3.10" @@ -3352,13 +3467,13 @@ test = ["appdirs (==1.4.4)", "covdefaults (>=2.3)", "pytest (>=7.4.3)", "pytest- [[package]] name = "posthog" -version = "3.4.2" +version = "3.5.0" description = "Integrate PostHog into any python application." 
optional = false python-versions = "*" files = [ - {file = "posthog-3.4.2-py2.py3-none-any.whl", hash = "sha256:c7e79b2e585d16e93749874bcbcdad78d857037398ce0d8d6c474a04d0bd3bbe"}, - {file = "posthog-3.4.2.tar.gz", hash = "sha256:f0eafa663fbc4a942b49b6168a62a890635407044bbc7593051dcb9cc1208873"}, + {file = "posthog-3.5.0-py2.py3-none-any.whl", hash = "sha256:3c672be7ba6f95d555ea207d4486c171d06657eb34b3ce25eb043bfe7b6b5b76"}, + {file = "posthog-3.5.0.tar.gz", hash = "sha256:8f7e3b2c6e8714d0c0c542a2109b83a7549f63b7113a133ab2763a89245ef2ef"}, ] [package.dependencies] @@ -3659,42 +3774,42 @@ testutils = ["gitpython (>3)"] [[package]] name = "pymupdf" -version = "1.23.25" +version = "1.23.26" description = "A high performance Python library for data extraction, analysis, conversion & manipulation of PDF (and other) documents." optional = false python-versions = ">=3.8" files = [ - {file = "PyMuPDF-1.23.25-cp310-none-macosx_10_9_x86_64.whl", hash = "sha256:6be2b20fbff40602f673fc8e60fde3e5911397f8ca9ed6aa2d15be94b12cc2c4"}, - {file = "PyMuPDF-1.23.25-cp310-none-macosx_11_0_arm64.whl", hash = "sha256:0f6923a44fbeaeefaabb2fa10955dcef3624e8826db661201951f3b3409fed32"}, - {file = "PyMuPDF-1.23.25-cp310-none-manylinux2014_aarch64.whl", hash = "sha256:8eeb2e97347586ec293fddaf61e8dfc58d6b2763406e8f7a6e45b560bf9b15a3"}, - {file = "PyMuPDF-1.23.25-cp310-none-manylinux2014_x86_64.whl", hash = "sha256:dca46799c152051697c5e88d66c17ba6d0244668d0c4dd8a2ba2d8d3cb745988"}, - {file = "PyMuPDF-1.23.25-cp310-none-win32.whl", hash = "sha256:88bfed1bd13ec84869489fc7b97381016cb8b99956073f4c3e8ac8c840bbb15a"}, - {file = "PyMuPDF-1.23.25-cp310-none-win_amd64.whl", hash = "sha256:98a78582c8a0c61b372e2bcd63dc61efc873e40b7d1f0b896a195e1a9ef9ffa7"}, - {file = "PyMuPDF-1.23.25-cp311-none-macosx_10_9_x86_64.whl", hash = "sha256:d7792810634036a745ea3eb3c4ccf2b6adab55ca9644e3352747d2b5aa5327f9"}, - {file = "PyMuPDF-1.23.25-cp311-none-macosx_11_0_arm64.whl", hash = 
"sha256:03bd1985b0234c3d2b8e26bb3e9ab1d2641dbada1e199b838a6bf884f35224c8"}, - {file = "PyMuPDF-1.23.25-cp311-none-manylinux2014_aarch64.whl", hash = "sha256:638fcb1f7551eb5ab582e412e204e8ded94acbbc37bc7f1e891a5dfc428881ee"}, - {file = "PyMuPDF-1.23.25-cp311-none-manylinux2014_x86_64.whl", hash = "sha256:067c88b4e6609cb7e74d98d0b0a35c11eb8e29f4fc51dc7ed1dd448b81d347c7"}, - {file = "PyMuPDF-1.23.25-cp311-none-win32.whl", hash = "sha256:a694f160d1701285cf3152951430740878d168511cd9ea0a3adcfaf3cac00322"}, - {file = "PyMuPDF-1.23.25-cp311-none-win_amd64.whl", hash = "sha256:514bcb679926b33413637b0bd73b223c90fb0d19352caf3395d0f23b1d47e8af"}, - {file = "PyMuPDF-1.23.25-cp312-none-macosx_10_9_x86_64.whl", hash = "sha256:bba342321e1b5574631894d7d34ec046605d953a23553b7d2f9c0e4d3c27254b"}, - {file = "PyMuPDF-1.23.25-cp312-none-macosx_11_0_arm64.whl", hash = "sha256:b2cb058c8229f9697deebe0574f7d95e4b9a5e295ceafd554346bbd464141e89"}, - {file = "PyMuPDF-1.23.25-cp312-none-manylinux2014_aarch64.whl", hash = "sha256:2479473b533936593428ce78499a1e9901570110ac602f03f1f3174efa0fa6a8"}, - {file = "PyMuPDF-1.23.25-cp312-none-manylinux2014_x86_64.whl", hash = "sha256:a247a4be1e43a6127ee305eae9f65767ee7519a2aa0cb1a2aa6acfd4e7fe7a9b"}, - {file = "PyMuPDF-1.23.25-cp312-none-win32.whl", hash = "sha256:b062be400bbaff6e8b17c0a8da9481e01ec935f97967e0870e9aacd7ba60a52a"}, - {file = "PyMuPDF-1.23.25-cp312-none-win_amd64.whl", hash = "sha256:b12e608761e1586a65f6e96a34417a91f814dbab29f2929b41d825ab32fab6ef"}, - {file = "PyMuPDF-1.23.25-cp38-none-macosx_10_9_x86_64.whl", hash = "sha256:ac97691c0e0e23607626d394bd660a46ea33f64921dc9288cf24daee207f9fe3"}, - {file = "PyMuPDF-1.23.25-cp38-none-macosx_11_0_arm64.whl", hash = "sha256:c0a16cda5dc9b59d494ae23bdd9c4a3db53d04f2b6390265f5c0fe6269777975"}, - {file = "PyMuPDF-1.23.25-cp38-none-manylinux2014_aarch64.whl", hash = "sha256:23d735db51722a889bb50636d161d2747f08fa0b82cc2e4a7eb8e228b25d1c4e"}, - {file = 
"PyMuPDF-1.23.25-cp38-none-manylinux2014_x86_64.whl", hash = "sha256:cbc1407dcf01b2e3e547b2d7643b97cc44c0950d2bb4b12c74322664c5cb37d7"}, - {file = "PyMuPDF-1.23.25-cp38-none-win32.whl", hash = "sha256:c29518701d6360beb01c25cf69a77b6426db90a9e7cd11179b3bd783c7fb4cb1"}, - {file = "PyMuPDF-1.23.25-cp38-none-win_amd64.whl", hash = "sha256:c1bb6fa9e00c846e6829dec2bee8326754adaef5c80626b99233c01923f0342c"}, - {file = "PyMuPDF-1.23.25-cp39-none-macosx_10_9_x86_64.whl", hash = "sha256:514b272bfcd897f9ae29384da04167dcdea3b13ce0f2b9099b645314355d037d"}, - {file = "PyMuPDF-1.23.25-cp39-none-macosx_11_0_arm64.whl", hash = "sha256:ef345a5b050d0869ef404845075edd5f4bd7fd99e235f4d32ce85f423779a120"}, - {file = "PyMuPDF-1.23.25-cp39-none-manylinux2014_aarch64.whl", hash = "sha256:b3ade5b349c38ddffb24f8c266fbcd7161f488c43960ff0f03f977d40d4df967"}, - {file = "PyMuPDF-1.23.25-cp39-none-manylinux2014_x86_64.whl", hash = "sha256:111d795a3e840aec2ad66beebd90a5327994ec85ed56fd68312f5463062dbbfa"}, - {file = "PyMuPDF-1.23.25-cp39-none-win32.whl", hash = "sha256:2237ce9897771f4af686cc0c81517ffb020fc1a011b95ccf5ccf05383492bd6d"}, - {file = "PyMuPDF-1.23.25-cp39-none-win_amd64.whl", hash = "sha256:251c9c321a2112716068d5ae11deedd1911d0387cbdd0ef19adb216a3adf882c"}, - {file = "PyMuPDF-1.23.25.tar.gz", hash = "sha256:eb414e92f08107f43576a1fedea28aa837220b15ad58c8e32015435fe96cc03e"}, + {file = "PyMuPDF-1.23.26-cp310-none-macosx_10_9_x86_64.whl", hash = "sha256:645a05321aecc8c45739f71f0eb574ce33138d19189582ffa5241fea3a8e2549"}, + {file = "PyMuPDF-1.23.26-cp310-none-macosx_11_0_arm64.whl", hash = "sha256:2dfc9e010669ae92fade6fb72aaea49ebe3b8dcd7ee4dcbbe50115abcaa4d3fe"}, + {file = "PyMuPDF-1.23.26-cp310-none-manylinux2014_aarch64.whl", hash = "sha256:734ee380b3abd038602be79114194a3cb74ac102b7c943bcb333104575922c50"}, + {file = "PyMuPDF-1.23.26-cp310-none-manylinux2014_x86_64.whl", hash = "sha256:b22f8d854f8196ad5b20308c1cebad3d5189ed9f0988acbafa043947ea7e6c55"}, + {file = 
"PyMuPDF-1.23.26-cp310-none-win32.whl", hash = "sha256:cc0f794e3466bc96b5bf79d42fbc1551428751e3fef38ebc10ac70396b676144"}, + {file = "PyMuPDF-1.23.26-cp310-none-win_amd64.whl", hash = "sha256:2eb701247d8e685a24e45899d1175f01a3ce5fc792a4431c91fbb68633b29298"}, + {file = "PyMuPDF-1.23.26-cp311-none-macosx_10_9_x86_64.whl", hash = "sha256:e2804a64bb57da414781e312fb0561f6be67658ad57ed4a73dce008b23fc70a6"}, + {file = "PyMuPDF-1.23.26-cp311-none-macosx_11_0_arm64.whl", hash = "sha256:97b40bb22e3056874634617a90e0ed24a5172cf71791b9e25d1d91c6743bc567"}, + {file = "PyMuPDF-1.23.26-cp311-none-manylinux2014_aarch64.whl", hash = "sha256:fab8833559bc47ab26ce736f915b8fc1dd37c108049b90396f7cd5e1004d7593"}, + {file = "PyMuPDF-1.23.26-cp311-none-manylinux2014_x86_64.whl", hash = "sha256:f25aafd3e7fb9d7761a22acf2b67d704f04cc36d4dc33a3773f0eb3f4ec3606f"}, + {file = "PyMuPDF-1.23.26-cp311-none-win32.whl", hash = "sha256:05e672ed3e82caca7ef02a88ace30130b1dd392a1190f03b2b58ffe7aa331400"}, + {file = "PyMuPDF-1.23.26-cp311-none-win_amd64.whl", hash = "sha256:92b3c4dd4d0491d495f333be2d41f4e1c155a409bc9d04b5ff29655dccbf4655"}, + {file = "PyMuPDF-1.23.26-cp312-none-macosx_10_9_x86_64.whl", hash = "sha256:a217689ede18cc6991b4e6a78afee8a440b3075d53b9dec4ba5ef7487d4547e9"}, + {file = "PyMuPDF-1.23.26-cp312-none-macosx_11_0_arm64.whl", hash = "sha256:42ad2b819b90ce1947e11b90ec5085889df0a2e3aa0207bc97ecacfc6157cabc"}, + {file = "PyMuPDF-1.23.26-cp312-none-manylinux2014_aarch64.whl", hash = "sha256:99607649f89a02bba7d8ebe96e2410664316adc95e9337f7dfeff6a154f93049"}, + {file = "PyMuPDF-1.23.26-cp312-none-manylinux2014_x86_64.whl", hash = "sha256:bb42d4b8407b4de7cb58c28f01449f16f32a6daed88afb41108f1aeb3552bdd4"}, + {file = "PyMuPDF-1.23.26-cp312-none-win32.whl", hash = "sha256:c40d044411615e6f0baa7d3d933b3032cf97e168c7fa77d1be8a46008c109aee"}, + {file = "PyMuPDF-1.23.26-cp312-none-win_amd64.whl", hash = "sha256:3f876533aa7f9a94bcd9a0225ce72571b7808260903fec1d95c120bc842fb52d"}, + {file = 
"PyMuPDF-1.23.26-cp38-none-macosx_10_9_x86_64.whl", hash = "sha256:52df831d46beb9ff494f5fba3e5d069af6d81f49abf6b6e799ee01f4f8fa6799"}, + {file = "PyMuPDF-1.23.26-cp38-none-macosx_11_0_arm64.whl", hash = "sha256:0bbb0cf6593e53524f3fc26fb5e6ead17c02c64791caec7c4afe61b677dedf80"}, + {file = "PyMuPDF-1.23.26-cp38-none-manylinux2014_aarch64.whl", hash = "sha256:5ef4360f20015673c20cf59b7e19afc97168795188c584254ed3778cde43ce77"}, + {file = "PyMuPDF-1.23.26-cp38-none-manylinux2014_x86_64.whl", hash = "sha256:d7cd88842b2e7f4c71eef4d87c98c35646b80b60e6375392d7ce40e519261f59"}, + {file = "PyMuPDF-1.23.26-cp38-none-win32.whl", hash = "sha256:6577e2f473625e2d0df5f5a3bf1e4519e94ae749733cc9937994d1b256687bfa"}, + {file = "PyMuPDF-1.23.26-cp38-none-win_amd64.whl", hash = "sha256:fbe1a3255b2cd0d769b2da2c4efdd0c0f30d4961a1aac02c0f75cf951b337aa4"}, + {file = "PyMuPDF-1.23.26-cp39-none-macosx_10_9_x86_64.whl", hash = "sha256:73fce034f2afea886a59ead2d0caedf27e2b2a8558b5da16d0286882e0b1eb82"}, + {file = "PyMuPDF-1.23.26-cp39-none-macosx_11_0_arm64.whl", hash = "sha256:b3de8618b7cb5b36db611083840b3bcf09b11a893e2d8262f4e042102c7e65de"}, + {file = "PyMuPDF-1.23.26-cp39-none-manylinux2014_aarch64.whl", hash = "sha256:879e7f5ad35709d8760ab6103c3d5dac8ab8043a856ab3653fd324af7358ee87"}, + {file = "PyMuPDF-1.23.26-cp39-none-manylinux2014_x86_64.whl", hash = "sha256:deee96c2fd415ded7b5070d8d5b2c60679aee6ed0e28ac0d2cb998060d835c2c"}, + {file = "PyMuPDF-1.23.26-cp39-none-win32.whl", hash = "sha256:9f7f4ef99dd8ac97fb0b852efa3dcbee515798078b6c79a6a13c7b1e7c5d41a4"}, + {file = "PyMuPDF-1.23.26-cp39-none-win_amd64.whl", hash = "sha256:ba9a54552c7afb9ec85432c765e2fa9a81413acfaa7d70db7c9b528297749e5b"}, + {file = "PyMuPDF-1.23.26.tar.gz", hash = "sha256:a904261b317b761b0aa2bd2c1f6cd25d25aa4258be67a90c02a878efc5dca649"}, ] [package.dependencies] @@ -3716,13 +3831,13 @@ files = [ [[package]] name = "pypdf" -version = "4.0.2" +version = "4.1.0" description = "A pure-python PDF library capable of splitting, 
merging, cropping, and transforming PDF files" optional = false python-versions = ">=3.6" files = [ - {file = "pypdf-4.0.2-py3-none-any.whl", hash = "sha256:a62daa2a24d5a608ba1b6284dde185317ce3644f89b9ebe5314d0c5d1c9f257d"}, - {file = "pypdf-4.0.2.tar.gz", hash = "sha256:3316d9ddfcff5df67ae3cdfe8b945c432aa43e7f970bae7c2a4ab4fe129cd937"}, + {file = "pypdf-4.1.0-py3-none-any.whl", hash = "sha256:16cac912a05200099cef3f347c4c7e0aaf0a6d027603b8f9a973c0ea500dff89"}, + {file = "pypdf-4.1.0.tar.gz", hash = "sha256:01c3257ec908676efd60a4537e525b89d48e0852bc92b4e0aa4cc646feda17cc"}, ] [package.dependencies] @@ -3772,13 +3887,13 @@ files = [ [[package]] name = "python-dateutil" -version = "2.8.2" +version = "2.9.0.post0" description = "Extensions to the standard Python datetime module" optional = false python-versions = "!=3.0.*,!=3.1.*,!=3.2.*,>=2.7" files = [ - {file = "python-dateutil-2.8.2.tar.gz", hash = "sha256:0123cacc1627ae19ddf3c27a5de5bd67ee4586fbdd6440d9748f8abb483d3e86"}, - {file = "python_dateutil-2.8.2-py2.py3-none-any.whl", hash = "sha256:961d03dc3453ebbc59dbdea9e4e11c5651520a876d0f4db161e8674aae935da9"}, + {file = "python-dateutil-2.9.0.post0.tar.gz", hash = "sha256:37dd54208da7e1cd875388217d5e00ebd4179249f90fb72437e91a35459a0ad3"}, + {file = "python_dateutil-2.9.0.post0-py2.py3-none-any.whl", hash = "sha256:a8b2bc7bffae282281c8140a97d3aa9c14da0b136dfe83f850eea9a5f7470427"}, ] [package.dependencies] @@ -4605,48 +4720,60 @@ test = ["pytest"] [[package]] name = "sqlalchemy" -version = "2.0.27" +version = "2.0.28" description = "Database Abstraction Library" optional = false python-versions = ">=3.7" files = [ - {file = "SQLAlchemy-2.0.27-cp310-cp310-macosx_10_9_x86_64.whl", hash = "sha256:d04e579e911562f1055d26dab1868d3e0bb905db3bccf664ee8ad109f035618a"}, - {file = "SQLAlchemy-2.0.27-cp310-cp310-macosx_11_0_arm64.whl", hash = "sha256:fa67d821c1fd268a5a87922ef4940442513b4e6c377553506b9db3b83beebbd8"}, - {file = 
"SQLAlchemy-2.0.27-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:954d9735ee9c3fa74874c830d089a815b7b48df6f6b6e357a74130e478dbd951"}, - {file = "SQLAlchemy-2.0.27-cp310-cp310-musllinux_1_1_x86_64.whl", hash = "sha256:03f448ffb731b48323bda68bcc93152f751436ad6037f18a42b7e16af9e91c07"}, - {file = "SQLAlchemy-2.0.27-cp310-cp310-win32.whl", hash = "sha256:d997c5938a08b5e172c30583ba6b8aad657ed9901fc24caf3a7152eeccb2f1b4"}, - {file = "SQLAlchemy-2.0.27-cp310-cp310-win_amd64.whl", hash = "sha256:eb15ef40b833f5b2f19eeae65d65e191f039e71790dd565c2af2a3783f72262f"}, - {file = "SQLAlchemy-2.0.27-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:6c5bad7c60a392850d2f0fee8f355953abaec878c483dd7c3836e0089f046bf6"}, - {file = "SQLAlchemy-2.0.27-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:a3012ab65ea42de1be81fff5fb28d6db893ef978950afc8130ba707179b4284a"}, - {file = "SQLAlchemy-2.0.27-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:d177b7e82f6dd5e1aebd24d9c3297c70ce09cd1d5d37b43e53f39514379c029c"}, - {file = "SQLAlchemy-2.0.27-cp311-cp311-musllinux_1_1_x86_64.whl", hash = "sha256:1306102f6d9e625cebaca3d4c9c8f10588735ef877f0360b5cdb4fdfd3fd7131"}, - {file = "SQLAlchemy-2.0.27-cp311-cp311-win32.whl", hash = "sha256:5b78aa9f4f68212248aaf8943d84c0ff0f74efc65a661c2fc68b82d498311fd5"}, - {file = "SQLAlchemy-2.0.27-cp311-cp311-win_amd64.whl", hash = "sha256:15e19a84b84528f52a68143439d0c7a3a69befcd4f50b8ef9b7b69d2628ae7c4"}, - {file = "SQLAlchemy-2.0.27-cp312-cp312-macosx_10_9_x86_64.whl", hash = "sha256:0de1263aac858f288a80b2071990f02082c51d88335a1db0d589237a3435fe71"}, - {file = "SQLAlchemy-2.0.27-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:ce850db091bf7d2a1f2fdb615220b968aeff3849007b1204bf6e3e50a57b3d32"}, - {file = "SQLAlchemy-2.0.27-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:c4fbe6a766301f2e8a4519f4500fe74ef0a8509a59e07a4085458f26228cd7cc"}, - {file = 
"SQLAlchemy-2.0.27-cp312-cp312-musllinux_1_1_x86_64.whl", hash = "sha256:0fb3bffc0ced37e5aa4ac2416f56d6d858f46d4da70c09bb731a246e70bff4d5"}, - {file = "SQLAlchemy-2.0.27-cp312-cp312-win32.whl", hash = "sha256:7f470327d06400a0aa7926b375b8e8c3c31d335e0884f509fe272b3c700a7254"}, - {file = "SQLAlchemy-2.0.27-cp312-cp312-win_amd64.whl", hash = "sha256:f9374e270e2553653d710ece397df67db9d19c60d2647bcd35bfc616f1622dcd"}, - {file = "SQLAlchemy-2.0.27-cp37-cp37m-macosx_10_9_x86_64.whl", hash = "sha256:e97cf143d74a7a5a0f143aa34039b4fecf11343eed66538610debc438685db4a"}, - {file = "SQLAlchemy-2.0.27-cp37-cp37m-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:e36aa62b765cf9f43a003233a8c2d7ffdeb55bc62eaa0a0380475b228663a38f"}, - {file = "SQLAlchemy-2.0.27-cp37-cp37m-musllinux_1_1_x86_64.whl", hash = "sha256:b1d9d1bfd96eef3c3faedb73f486c89e44e64e40e5bfec304ee163de01cf996f"}, - {file = "SQLAlchemy-2.0.27-cp37-cp37m-win32.whl", hash = "sha256:ca891af9f3289d24a490a5fde664ea04fe2f4984cd97e26de7442a4251bd4b7c"}, - {file = "SQLAlchemy-2.0.27-cp37-cp37m-win_amd64.whl", hash = "sha256:fd8aafda7cdff03b905d4426b714601c0978725a19efc39f5f207b86d188ba01"}, - {file = "SQLAlchemy-2.0.27-cp38-cp38-macosx_10_9_x86_64.whl", hash = "sha256:ec1f5a328464daf7a1e4e385e4f5652dd9b1d12405075ccba1df842f7774b4fc"}, - {file = "SQLAlchemy-2.0.27-cp38-cp38-macosx_11_0_arm64.whl", hash = "sha256:ad862295ad3f644e3c2c0d8b10a988e1600d3123ecb48702d2c0f26771f1c396"}, - {file = "SQLAlchemy-2.0.27-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:9e56afce6431450442f3ab5973156289bd5ec33dd618941283847c9fd5ff06bf"}, - {file = "SQLAlchemy-2.0.27-cp38-cp38-musllinux_1_1_x86_64.whl", hash = "sha256:b86abba762ecfeea359112b2bb4490802b340850bbee1948f785141a5e020de8"}, - {file = "SQLAlchemy-2.0.27-cp38-cp38-win32.whl", hash = "sha256:30d81cc1192dc693d49d5671cd40cdec596b885b0ce3b72f323888ab1c3863d5"}, - {file = "SQLAlchemy-2.0.27-cp38-cp38-win_amd64.whl", hash = 
"sha256:120af1e49d614d2525ac247f6123841589b029c318b9afbfc9e2b70e22e1827d"}, - {file = "SQLAlchemy-2.0.27-cp39-cp39-macosx_10_9_x86_64.whl", hash = "sha256:d07ee7793f2aeb9b80ec8ceb96bc8cc08a2aec8a1b152da1955d64e4825fcbac"}, - {file = "SQLAlchemy-2.0.27-cp39-cp39-macosx_11_0_arm64.whl", hash = "sha256:cb0845e934647232b6ff5150df37ceffd0b67b754b9fdbb095233deebcddbd4a"}, - {file = "SQLAlchemy-2.0.27-cp39-cp39-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:b90053be91973a6fb6020a6e44382c97739736a5a9d74e08cc29b196639eb979"}, - {file = "SQLAlchemy-2.0.27-cp39-cp39-musllinux_1_1_x86_64.whl", hash = "sha256:33e8bde8fff203de50399b9039c4e14e42d4d227759155c21f8da4a47fc8053c"}, - {file = "SQLAlchemy-2.0.27-cp39-cp39-win32.whl", hash = "sha256:d873c21b356bfaf1589b89090a4011e6532582b3a8ea568a00e0c3aab09399dd"}, - {file = "SQLAlchemy-2.0.27-cp39-cp39-win_amd64.whl", hash = "sha256:ff2f1b7c963961d41403b650842dc2039175b906ab2093635d8319bef0b7d620"}, - {file = "SQLAlchemy-2.0.27-py3-none-any.whl", hash = "sha256:1ab4e0448018d01b142c916cc7119ca573803a4745cfe341b8f95657812700ac"}, - {file = "SQLAlchemy-2.0.27.tar.gz", hash = "sha256:86a6ed69a71fe6b88bf9331594fa390a2adda4a49b5c06f98e47bf0d392534f8"}, + {file = "SQLAlchemy-2.0.28-cp310-cp310-macosx_10_9_x86_64.whl", hash = "sha256:e0b148ab0438f72ad21cb004ce3bdaafd28465c4276af66df3b9ecd2037bf252"}, + {file = "SQLAlchemy-2.0.28-cp310-cp310-macosx_11_0_arm64.whl", hash = "sha256:bbda76961eb8f27e6ad3c84d1dc56d5bc61ba8f02bd20fcf3450bd421c2fcc9c"}, + {file = "SQLAlchemy-2.0.28-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:feea693c452d85ea0015ebe3bb9cd15b6f49acc1a31c28b3c50f4db0f8fb1e71"}, + {file = "SQLAlchemy-2.0.28-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:5da98815f82dce0cb31fd1e873a0cb30934971d15b74e0d78cf21f9e1b05953f"}, + {file = "SQLAlchemy-2.0.28-cp310-cp310-musllinux_1_1_aarch64.whl", hash = 
"sha256:4a5adf383c73f2d49ad15ff363a8748319ff84c371eed59ffd0127355d6ea1da"}, + {file = "SQLAlchemy-2.0.28-cp310-cp310-musllinux_1_1_x86_64.whl", hash = "sha256:56856b871146bfead25fbcaed098269d90b744eea5cb32a952df00d542cdd368"}, + {file = "SQLAlchemy-2.0.28-cp310-cp310-win32.whl", hash = "sha256:943aa74a11f5806ab68278284a4ddd282d3fb348a0e96db9b42cb81bf731acdc"}, + {file = "SQLAlchemy-2.0.28-cp310-cp310-win_amd64.whl", hash = "sha256:c6c4da4843e0dabde41b8f2e8147438330924114f541949e6318358a56d1875a"}, + {file = "SQLAlchemy-2.0.28-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:46a3d4e7a472bfff2d28db838669fc437964e8af8df8ee1e4548e92710929adc"}, + {file = "SQLAlchemy-2.0.28-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:0d3dd67b5d69794cfe82862c002512683b3db038b99002171f624712fa71aeaa"}, + {file = "SQLAlchemy-2.0.28-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:c61e2e41656a673b777e2f0cbbe545323dbe0d32312f590b1bc09da1de6c2a02"}, + {file = "SQLAlchemy-2.0.28-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:0315d9125a38026227f559488fe7f7cee1bd2fbc19f9fd637739dc50bb6380b2"}, + {file = "SQLAlchemy-2.0.28-cp311-cp311-musllinux_1_1_aarch64.whl", hash = "sha256:af8ce2d31679006e7b747d30a89cd3ac1ec304c3d4c20973f0f4ad58e2d1c4c9"}, + {file = "SQLAlchemy-2.0.28-cp311-cp311-musllinux_1_1_x86_64.whl", hash = "sha256:81ba314a08c7ab701e621b7ad079c0c933c58cdef88593c59b90b996e8b58fa5"}, + {file = "SQLAlchemy-2.0.28-cp311-cp311-win32.whl", hash = "sha256:1ee8bd6d68578e517943f5ebff3afbd93fc65f7ef8f23becab9fa8fb315afb1d"}, + {file = "SQLAlchemy-2.0.28-cp311-cp311-win_amd64.whl", hash = "sha256:ad7acbe95bac70e4e687a4dc9ae3f7a2f467aa6597049eeb6d4a662ecd990bb6"}, + {file = "SQLAlchemy-2.0.28-cp312-cp312-macosx_10_9_x86_64.whl", hash = "sha256:d3499008ddec83127ab286c6f6ec82a34f39c9817f020f75eca96155f9765097"}, + {file = "SQLAlchemy-2.0.28-cp312-cp312-macosx_11_0_arm64.whl", hash = 
"sha256:9b66fcd38659cab5d29e8de5409cdf91e9986817703e1078b2fdaad731ea66f5"}, + {file = "SQLAlchemy-2.0.28-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:bea30da1e76cb1acc5b72e204a920a3a7678d9d52f688f087dc08e54e2754c67"}, + {file = "SQLAlchemy-2.0.28-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:124202b4e0edea7f08a4db8c81cc7859012f90a0d14ba2bf07c099aff6e96462"}, + {file = "SQLAlchemy-2.0.28-cp312-cp312-musllinux_1_1_aarch64.whl", hash = "sha256:e23b88c69497a6322b5796c0781400692eca1ae5532821b39ce81a48c395aae9"}, + {file = "SQLAlchemy-2.0.28-cp312-cp312-musllinux_1_1_x86_64.whl", hash = "sha256:4b6303bfd78fb3221847723104d152e5972c22367ff66edf09120fcde5ddc2e2"}, + {file = "SQLAlchemy-2.0.28-cp312-cp312-win32.whl", hash = "sha256:a921002be69ac3ab2cf0c3017c4e6a3377f800f1fca7f254c13b5f1a2f10022c"}, + {file = "SQLAlchemy-2.0.28-cp312-cp312-win_amd64.whl", hash = "sha256:b4a2cf92995635b64876dc141af0ef089c6eea7e05898d8d8865e71a326c0385"}, + {file = "SQLAlchemy-2.0.28-cp37-cp37m-macosx_10_9_x86_64.whl", hash = "sha256:8e91b5e341f8c7f1e5020db8e5602f3ed045a29f8e27f7f565e0bdee3338f2c7"}, + {file = "SQLAlchemy-2.0.28-cp37-cp37m-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:45c7b78dfc7278329f27be02c44abc0d69fe235495bb8e16ec7ef1b1a17952db"}, + {file = "SQLAlchemy-2.0.28-cp37-cp37m-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:3eba73ef2c30695cb7eabcdb33bb3d0b878595737479e152468f3ba97a9c22a4"}, + {file = "SQLAlchemy-2.0.28-cp37-cp37m-musllinux_1_1_aarch64.whl", hash = "sha256:5df5d1dafb8eee89384fb7a1f79128118bc0ba50ce0db27a40750f6f91aa99d5"}, + {file = "SQLAlchemy-2.0.28-cp37-cp37m-musllinux_1_1_x86_64.whl", hash = "sha256:2858bbab1681ee5406650202950dc8f00e83b06a198741b7c656e63818633526"}, + {file = "SQLAlchemy-2.0.28-cp37-cp37m-win32.whl", hash = "sha256:9461802f2e965de5cff80c5a13bc945abea7edaa1d29360b485c3d2b56cdb075"}, + {file = "SQLAlchemy-2.0.28-cp37-cp37m-win_amd64.whl", hash = 
"sha256:a6bec1c010a6d65b3ed88c863d56b9ea5eeefdf62b5e39cafd08c65f5ce5198b"}, + {file = "SQLAlchemy-2.0.28-cp38-cp38-macosx_10_9_x86_64.whl", hash = "sha256:843a882cadebecc655a68bd9a5b8aa39b3c52f4a9a5572a3036fb1bb2ccdc197"}, + {file = "SQLAlchemy-2.0.28-cp38-cp38-macosx_11_0_arm64.whl", hash = "sha256:dbb990612c36163c6072723523d2be7c3eb1517bbdd63fe50449f56afafd1133"}, + {file = "SQLAlchemy-2.0.28-cp38-cp38-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:bd7e4baf9161d076b9a7e432fce06217b9bd90cfb8f1d543d6e8c4595627edb9"}, + {file = "SQLAlchemy-2.0.28-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:e0a5354cb4de9b64bccb6ea33162cb83e03dbefa0d892db88a672f5aad638a75"}, + {file = "SQLAlchemy-2.0.28-cp38-cp38-musllinux_1_1_aarch64.whl", hash = "sha256:fffcc8edc508801ed2e6a4e7b0d150a62196fd28b4e16ab9f65192e8186102b6"}, + {file = "SQLAlchemy-2.0.28-cp38-cp38-musllinux_1_1_x86_64.whl", hash = "sha256:aca7b6d99a4541b2ebab4494f6c8c2f947e0df4ac859ced575238e1d6ca5716b"}, + {file = "SQLAlchemy-2.0.28-cp38-cp38-win32.whl", hash = "sha256:8c7f10720fc34d14abad5b647bc8202202f4948498927d9f1b4df0fb1cf391b7"}, + {file = "SQLAlchemy-2.0.28-cp38-cp38-win_amd64.whl", hash = "sha256:243feb6882b06a2af68ecf4bec8813d99452a1b62ba2be917ce6283852cf701b"}, + {file = "SQLAlchemy-2.0.28-cp39-cp39-macosx_10_9_x86_64.whl", hash = "sha256:fc4974d3684f28b61b9a90fcb4c41fb340fd4b6a50c04365704a4da5a9603b05"}, + {file = "SQLAlchemy-2.0.28-cp39-cp39-macosx_11_0_arm64.whl", hash = "sha256:87724e7ed2a936fdda2c05dbd99d395c91ea3c96f029a033a4a20e008dd876bf"}, + {file = "SQLAlchemy-2.0.28-cp39-cp39-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:68722e6a550f5de2e3cfe9da6afb9a7dd15ef7032afa5651b0f0c6b3adb8815d"}, + {file = "SQLAlchemy-2.0.28-cp39-cp39-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:328529f7c7f90adcd65aed06a161851f83f475c2f664a898af574893f55d9e53"}, + {file = "SQLAlchemy-2.0.28-cp39-cp39-musllinux_1_1_aarch64.whl", hash = 
"sha256:df40c16a7e8be7413b885c9bf900d402918cc848be08a59b022478804ea076b8"}, + {file = "SQLAlchemy-2.0.28-cp39-cp39-musllinux_1_1_x86_64.whl", hash = "sha256:426f2fa71331a64f5132369ede5171c52fd1df1bd9727ce621f38b5b24f48750"}, + {file = "SQLAlchemy-2.0.28-cp39-cp39-win32.whl", hash = "sha256:33157920b233bc542ce497a81a2e1452e685a11834c5763933b440fedd1d8e2d"}, + {file = "SQLAlchemy-2.0.28-cp39-cp39-win_amd64.whl", hash = "sha256:2f60843068e432311c886c5f03c4664acaef507cf716f6c60d5fde7265be9d7b"}, + {file = "SQLAlchemy-2.0.28-py3-none-any.whl", hash = "sha256:78bb7e8da0183a8301352d569900d9d3594c48ac21dc1c2ec6b3121ed8b6c986"}, + {file = "SQLAlchemy-2.0.28.tar.gz", hash = "sha256:dd53b6c4e6d960600fd6532b79ee28e2da489322fcf6648738134587faf767b6"}, ] [package.dependencies] @@ -5058,24 +5185,24 @@ files = [ [[package]] name = "types-docutils" -version = "0.20.0.20240227" +version = "0.20.0.20240304" description = "Typing stubs for docutils" optional = false python-versions = ">=3.8" files = [ - {file = "types-docutils-0.20.0.20240227.tar.gz", hash = "sha256:7f2dbb02356024b5db3efd9df26b236da050ad2eada89872e5284b4a394b7761"}, - {file = "types_docutils-0.20.0.20240227-py3-none-any.whl", hash = "sha256:51c139502ba0add871392cbc37200a3a64096e61eeb6396727443ba6d38ae579"}, + {file = "types-docutils-0.20.0.20240304.tar.gz", hash = "sha256:c35ae35ca835a5aeead758df411cd46cfb7e7f19f2b223c413dae7e069d5b0be"}, + {file = "types_docutils-0.20.0.20240304-py3-none-any.whl", hash = "sha256:ef02f9d05f2b61500638b1358cdf3fbf975cc5dedaa825a2eb5ea71b7318a760"}, ] [[package]] name = "types-protobuf" -version = "4.24.0.20240129" +version = "4.24.0.20240302" description = "Typing stubs for protobuf" optional = false python-versions = ">=3.8" files = [ - {file = "types-protobuf-4.24.0.20240129.tar.gz", hash = "sha256:8a83dd3b9b76a33e08d8636c5daa212ace1396418ed91837635fcd564a624891"}, - {file = "types_protobuf-4.24.0.20240129-py3-none-any.whl", hash = 
"sha256:23be68cc29f3f5213b5c5878ac0151706182874040e220cfb11336f9ee642ead"}, + {file = "types-protobuf-4.24.0.20240302.tar.gz", hash = "sha256:f22c00cc0cea9722e71e14d389bba429af9e35a74a949719c167203a5abbe2e4"}, + {file = "types_protobuf-4.24.0.20240302-py3-none-any.whl", hash = "sha256:5c607990f50f14606c2edaf379f8acc7418fef1451b227aa3c6a8a2cbc6ff14a"}, ] [[package]] @@ -5696,4 +5823,4 @@ testing = ["big-O", "jaraco.functools", "jaraco.itertools", "more-itertools", "p [metadata] lock-version = "2.0" python-versions = ">=3.8.1,<4.0" -content-hash = "7521296bc392c8bb14845d4f764faaaef668863f9442fd44a1bb5539d261d77c" +content-hash = "b3cad5844057965a829ca5df97dfcce50bf430eef20b0b69e7be04a0288acef9" diff --git a/pyproject.toml b/pyproject.toml index 466a97043e605..7ef492487c9b4 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -44,7 +44,7 @@ name = "llama-index" packages = [{from = "_llama-index", include = "llama_index"}] readme = "README.md" repository = "https://github.com/run-llama/llama_index" -version = "0.10.14" +version = "0.10.16" [tool.poetry.dependencies] python = ">=3.8.1,<4.0" @@ -57,7 +57,7 @@ llama-index-agent-openai = "^0.1.4" llama-index-readers-file = "^0.1.4" llama-index-readers-llama-parse = "^0.1.2" llama-index-indices-managed-llama-cloud = "^0.1.2" -llama-index-core = "^0.10.14" +llama-index-core = "^0.10.16" llama-index-multi-modal-llms-openai = "^0.1.3" llama-index-cli = "^0.1.2"