Update examples: standardize Epsilla env var names and placeholders, reformat long lines

eric-epsilla · eric-epsilla · commit f8c992cdeaa2 · 2024-11-28T10:22:03.000+08:00
diff --git a/examples/Question_Answering_Pipeline_with_LangChain_and_Epsilla.py b/examples/Question_Answering_Pipeline_with_LangChain_and_Epsilla.py
@@ -16,6 +16,7 @@
 
 # Step2. Configure the OpenAI API Key
 import os
+
 os.environ["OPENAI_API_KEY"] = "Your-OpenAI-API-Key"
 
 
@@ -24,9 +25,13 @@
 from langchain.text_splitter import CharacterTextSplitter
 from langchain_openai import OpenAIEmbeddings
 
-loader = WebBaseLoader("https://raw.githubusercontent.com/hwchase17/chat-your-data/master/state_of_the_union.txt")
+loader = WebBaseLoader(
+    "https://raw.githubusercontent.com/hwchase17/chat-your-data/master/state_of_the_union.txt"
+)
 documents = loader.load()
-documents = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0).split_documents(documents)
+documents = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0).split_documents(
+    documents
+)
 embeddings = OpenAIEmbeddings()
 
 
@@ -49,8 +54,6 @@
 )
 
 
-
-
 # Step4. Create the QA for Retrieval
 from langchain.chains import RetrievalQA
 from langchain_openai import OpenAI
diff --git a/examples/Question_Answering_Pipeline_with_LangChain_and_EpsillaCloud.py b/examples/Question_Answering_Pipeline_with_LangChain_and_EpsillaCloud.py
@@ -18,55 +18,61 @@
 import os
 
 os.environ["OPENAI_API_KEY"] = "Your-OpenAI-API-Key"
-epsilla_api_key = os.getenv("EPSILLA_API_KEY", "Your-Epsilla-API-Key")
-project_id = os.getenv("EPSILLA_PROJECT_ID", "Your-Project-ID")
-db_id = os.getenv("EPSILLA_DB_ID", "Your-DB-ID")
-db_sharding_id = os.getenv("EPSILLA_DB_SHARDING_ID", 0)
 
+EPSILLA_PROJECT_ID = os.getenv("EPSILLA_PROJECT_ID", "Your-Epsilla-Project-ID")
+EPSILLA_API_KEY = os.getenv("EPSILLA_API_KEY", "Your-Epsilla-API-Key")
+EPSILLA_DB_ID = os.getenv("EPSILLA_DB_ID", "Your-Epsilla-DB-ID")
+EPSILLA_DB_SHARDING_ID = os.getenv("EPSILLA_DB_SHARDING_ID", 0)
+
+TABLE_NAME = os.getenv("TABLE_NAME", "MyTable")
+
+db_name = f"db_{EPSILLA_DB_ID.replace('-', '_')}"
+db_path = f"/data/{EPSILLA_PROJECT_ID}/{db_name}/s{EPSILLA_DB_SHARDING_ID}"
+
+
+from langchain.text_splitter import CharacterTextSplitter
 
 # Step3. Load the documents
 from langchain_community.document_loaders import WebBaseLoader
-from langchain.text_splitter import CharacterTextSplitter
 from langchain_openai import OpenAIEmbeddings
 
-loader = WebBaseLoader("https://raw.githubusercontent.com/hwchase17/chat-your-data/master/state_of_the_union.txt")
+loader = WebBaseLoader(
+    "https://raw.githubusercontent.com/hwchase17/chat-your-data/master/state_of_the_union.txt"
+)
 documents = loader.load()
-documents = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0).split_documents(documents)
+documents = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0).split_documents(
+    documents
+)
 embeddings = OpenAIEmbeddings()
 
 
 # Step4. Load the vector store
 from langchain_community.vectorstores import Epsilla
 from pyepsilla import cloud
 
-db_name = f"db_{db_id.replace('-', '_')}"
-db_path = f"/data/{project_id}/{db_name}/s{db_sharding_id}"
-table_name = "MyCollection"
-
 # Step4.1 Connect to Epsilla Cloud
 cloud_client = cloud.Client(
-    project_id=project_id,
-    api_key=epsilla_api_key,
+    project_id=EPSILLA_PROJECT_ID,
+    api_key=EPSILLA_API_KEY,
 )
 
 # Step4.2 Connect to Vectordb
-db_client = cloud_client.vectordb(db_id)
+db_client = cloud_client.vectordb(EPSILLA_DB_ID)
 
 vector_store = Epsilla.from_documents(
     documents,
     embeddings,
     db_client,
     db_path=db_path,
     db_name=db_name,
-    collection_name=table_name,
+    collection_name=TABLE_NAME,
 )
 
 # query = "What did the president say about Ketanji Brown Jackson"
 # docs = vector_store.similarity_search(query)
 # print(docs[0].page_content)
 
 
-
 # Step5. Create the QA for Retrieval
 from langchain.chains import RetrievalQA
 from langchain_openai import OpenAI
diff --git a/examples/hello_epsilla_cloud.py b/examples/hello_epsilla_cloud.py
@@ -11,18 +11,18 @@
 
 from pyepsilla import cloud
 
-EPSILLA_PROJECT_ID = os.getenv("EPSILLA_PROJECT_ID", "Your-Project-ID")
+EPSILLA_PROJECT_ID = os.getenv("EPSILLA_PROJECT_ID", "Your-Epsilla-Project-ID")
 EPSILLA_API_KEY = os.getenv("EPSILLA_API_KEY", "Your-Epsilla-API-Key")
 
-DB_ID = os.getenv("DB_ID", "Your-DB-ID")
+DB_ID = os.getenv("EPSILLA_DB_ID", "Your-Epsilla-DB-ID")
 DB_NAME = os.getenv("DB_NAME", "MyDB")
 DB_PATH = os.getenv("DB_PATH", "/tmp/epsilla_demo")
 TABLE_NAME = os.getenv("TABLE_NAME", "MyTable")
 
 
 if not EPSILLA_PROJECT_ID or not EPSILLA_API_KEY or not DB_ID:
     print(
-        "Please set the environment variables: EPSILLA_PROJECT_ID, EPSILLA_API_KEY, DB_ID"
+        "Please set the environment variables: EPSILLA_PROJECT_ID, EPSILLA_API_KEY, EPSILLA_DB_ID"
     )
     sys.exit(1)
 
diff --git a/examples/hello_epsilla_rag.py b/examples/hello_epsilla_rag.py
@@ -10,7 +10,7 @@
 
 from pyepsilla import cloud
 
-EPSILLA_PROJECT_ID = os.getenv("EPSILLA_PROJECT_ID", "Your-Project-ID")
+EPSILLA_PROJECT_ID = os.getenv("EPSILLA_PROJECT_ID", "Your-Epsilla-Project-ID")
 EPSILLA_API_KEY = os.getenv("EPSILLA_API_KEY", "Your-Epsilla-API-Key")
 EPSILLA_RAGAPP_ID = os.getenv("EPSILLA_RAGAPP_ID", "Your-Epsilla-RAGAPP-ID")
 EPSILLA_CONVERSATION_ID = os.getenv("EPSILLA_CONVERSATION_ID", None)