1 | | -from elasticsearch import Elasticsearch |
2 | | -from lib.elasticsearch_chat_message_history import ElasticsearchChatMessageHistory |
3 | 1 | from flask import Flask, jsonify, request, Response |
4 | 2 | from flask_cors import CORS |
5 | | -from langchain.callbacks.base import BaseCallbackHandler |
6 | | -from langchain.chains import ConversationalRetrievalChain |
7 | | -from langchain.chat_models import ChatOpenAI |
8 | | -from langchain.prompts.chat import ( |
9 | | - HumanMessagePromptTemplate, |
10 | | - SystemMessagePromptTemplate, |
11 | | - ChatPromptTemplate, |
12 | | -) |
13 | | -from langchain.prompts.prompt import PromptTemplate |
14 | | -from langchain.vectorstores import ElasticsearchStore |
15 | 3 | from queue import Queue |
16 | 4 | from uuid import uuid4 |
17 | | -import json |
18 | | -import os |
| 5 | +from chat import chat, ask_question, parse_stream_message |
19 | 6 | import threading |
20 | 7 |
21 | | -INDEX = "workplace-app-docs" |
22 | | -INDEX_CHAT_HISTORY = "workplace-app-docs-chat-history" |
23 | | -ELASTIC_CLOUD_ID = os.getenv("ELASTIC_CLOUD_ID") |
24 | | -ELASTIC_USERNAME = os.getenv("ELASTIC_USERNAME") |
25 | | -ELASTIC_PASSWORD = os.getenv("ELASTIC_PASSWORD") |
26 | | -OPENAI_API_KEY = os.getenv("OPENAI_API_KEY") |
27 | | - |
28 | | -POISON_MESSAGE = "~~~END~~~" |
29 | | -SESSION_ID_TAG = "[SESSION_ID]" |
30 | | -SOURCE_TAG = "[SOURCE]" |
31 | | -DONE_TAG = "[DONE]" |
32 | | - |
33 | | - |
34 | | -class QueueCallbackHandler(BaseCallbackHandler): |
35 | | - def __init__( |
36 | | - self, |
37 | | - queue: Queue, |
38 | | - ): |
39 | | - self.queue = queue |
40 | | - self.in_human_prompt = True |
41 | | - |
42 | | - def on_retriever_end(self, documents, *, run_id, parent_run_id=None, **kwargs): |
43 | | - if len(documents) > 0: |
44 | | - for doc in documents: |
45 | | - source = { |
46 | | - "name": doc.metadata["name"], |
47 | | - "page_content": doc.page_content, |
48 | | - "url": doc.metadata["url"], |
49 | | - "icon": doc.metadata["category"], |
50 | | - "updated_at": doc.metadata.get("updated_at", None) |
51 | | - } |
52 | | - self.queue.put(f"{SOURCE_TAG} {json.dumps(source)}") |
53 | | - |
54 | | - def on_llm_new_token(self, token, **kwargs): |
55 | | - if not self.in_human_prompt: |
56 | | - self.queue.put(token) |
57 | | - |
58 | | - def on_llm_start( |
59 | | - self, |
60 | | - serialized, |
61 | | - prompts, |
62 | | - *, |
63 | | - run_id, |
64 | | - parent_run_id=None, |
65 | | - tags=None, |
66 | | - metadata=None, |
67 | | - **kwargs, |
68 | | - ): |
69 | | - self.in_human_prompt = prompts[0].startswith("Human:") |
70 | | - |
71 | | - def on_llm_end(self, response, *, run_id, parent_run_id=None, **kwargs): |
72 | | - if not self.in_human_prompt: |
73 | | - self.queue.put(POISON_MESSAGE) |
74 | | - |
75 | | - |
76 | | -elasticsearch_client = Elasticsearch( |
77 | | - cloud_id=ELASTIC_CLOUD_ID, basic_auth=(ELASTIC_USERNAME, ELASTIC_PASSWORD) |
78 | | -) |
79 | | - |
80 | | -store = ElasticsearchStore( |
81 | | - es_connection=elasticsearch_client, |
82 | | - index_name=INDEX, |
83 | | - strategy=ElasticsearchStore.SparseVectorRetrievalStrategy(), |
84 | | -) |
85 | | - |
86 | | -retriever = store.as_retriever() |
87 | | - |
88 | | -llm = ChatOpenAI(openai_api_key=OPENAI_API_KEY, streaming=True, temperature=0.2) |
89 | | - |
90 | | -general_system_template = """ |
91 | | -Use the following passages to answer the user's question. |
92 | | -Each passage has a SOURCE which is the title of the document. When answering, give the source name of the passages you are answering from, put them as an array of strings in here <script>[sources]</script>. |
93 | | -If you don't know the answer, just say that you don't know, don't try to make up an answer. |
94 | | -
95 | | ----- |
96 | | -{context} |
97 | | ----- |
98 | | -
99 | | -""" |
100 | | -general_user_template = "Question: {question}" |
101 | | -qa_prompt = ChatPromptTemplate.from_messages( |
102 | | - [ |
103 | | - SystemMessagePromptTemplate.from_template(general_system_template), |
104 | | - HumanMessagePromptTemplate.from_template(general_user_template), |
105 | | - ] |
106 | | -) |
107 | | - |
108 | | -document_prompt = PromptTemplate( |
109 | | - input_variables=["page_content", "name"], |
110 | | - template=""" |
111 | | ---- |
112 | | -NAME: "{name}" |
113 | | -PASSAGE: |
114 | | -{page_content} |
115 | | ---- |
116 | | -""", |
117 | | -) |
118 | | - |
119 | | -chat = ConversationalRetrievalChain.from_llm( |
120 | | - llm=llm, |
121 | | - retriever=store.as_retriever(), |
122 | | - return_source_documents=True, |
123 | | - combine_docs_chain_kwargs={"prompt": qa_prompt, "document_prompt": document_prompt}, |
124 | | - verbose=True, |
125 | | -) |
126 | | - |
127 | 8 | app = Flask(__name__, static_folder="../frontend/public") |
128 | 9 | CORS(app) |
129 | 10 |
130 | | - |
131 | 11 | @app.route("/") |
132 | 12 | def api_index(): |
133 | 13 | return app.send_static_file("index.html") |
134 | 14 |
135 | | - |
136 | | -def ask_question(question, queue, chat_history): |
137 | | - result = chat( |
138 | | - {"question": question, "chat_history": chat_history.messages}, |
139 | | - callbacks=[QueueCallbackHandler(queue)], |
140 | | - ) |
141 | | - |
142 | | - chat_history.add_user_message(result["question"]) |
143 | | - chat_history.add_ai_message(result["answer"]) |
144 | | - |
145 | | - |
146 | 15 | @app.route("/api/chat", methods=["POST"]) |
147 | 16 | def api_chat(): |
148 | | - stream_queue = Queue() |
149 | 17 | request_json = request.get_json() |
150 | 18 | question = request_json.get("question") |
151 | 19 | if question is None: |
152 | 20 | return jsonify({"msg": "Missing question from request JSON"}), 400 |
153 | 21 |
| 22 | + stream_queue = Queue() |
154 | 23 | session_id = request.args.get("session_id", str(uuid4())) |
155 | 24 |
156 | 25 | print("Chat session ID: ", session_id) |
157 | | - chat_history = ElasticsearchChatMessageHistory( |
158 | | - client=elasticsearch_client, index=INDEX_CHAT_HISTORY, session_id=session_id |
159 | | - ) |
160 | | - |
161 | | - def generate(queue: Queue): |
162 | | - yield f"data: {SESSION_ID_TAG} {session_id}\n\n" |
163 | | - |
164 | | - message = None |
165 | | - while True: |
166 | | - message = queue.get() |
167 | | - |
168 | | - if message == POISON_MESSAGE: # Poison message |
169 | | - break |
170 | | - yield f"data: {message}\n\n" |
171 | | - |
172 | | - yield f"data: {DONE_TAG}\n\n" |
173 | 26 |
174 | 27 | threading.Thread( |
175 | | - target=ask_question, args=(question, stream_queue, chat_history) |
| 28 | + target=ask_question, args=(question, stream_queue, session_id) |
176 | 29 | ).start() |
177 | 30 |
178 | | - return Response(generate(stream_queue), mimetype="text/event-stream") |
| 31 | + return Response(parse_stream_message(session_id, stream_queue), mimetype="text/event-stream") |
179 | 32 |
180 | 33 |
181 | 34 | if __name__ == "__main__": |
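
The new import in app.py (`from chat import chat, ask_question, parse_stream_message`) implies the deleted logic now lives in a `chat` module. Below is a minimal sketch of what that module might contain, reassembled from the removed lines above. The `chat.py` filename and exact signatures are assumptions (only the three imported names are confirmed by the diff), and the qa/document prompt templates are elided for brevity.

# chat.py -- sketch, assuming the deleted code moved here largely unchanged
import json
import os
from queue import Queue

from elasticsearch import Elasticsearch
from langchain.callbacks.base import BaseCallbackHandler
from langchain.chains import ConversationalRetrievalChain
from langchain.chat_models import ChatOpenAI
from langchain.vectorstores import ElasticsearchStore
from lib.elasticsearch_chat_message_history import ElasticsearchChatMessageHistory

INDEX = "workplace-app-docs"
INDEX_CHAT_HISTORY = "workplace-app-docs-chat-history"
POISON_MESSAGE = "~~~END~~~"
SESSION_ID_TAG = "[SESSION_ID]"
SOURCE_TAG = "[SOURCE]"
DONE_TAG = "[DONE]"

elasticsearch_client = Elasticsearch(
    cloud_id=os.getenv("ELASTIC_CLOUD_ID"),
    basic_auth=(os.getenv("ELASTIC_USERNAME"), os.getenv("ELASTIC_PASSWORD")),
)

store = ElasticsearchStore(
    es_connection=elasticsearch_client,
    index_name=INDEX,
    strategy=ElasticsearchStore.SparseVectorRetrievalStrategy(),
)

llm = ChatOpenAI(
    openai_api_key=os.getenv("OPENAI_API_KEY"), streaming=True, temperature=0.2
)


class QueueCallbackHandler(BaseCallbackHandler):
    """Pushes retrieved sources and streamed LLM tokens onto a queue."""

    def __init__(self, queue: Queue):
        self.queue = queue
        self.in_human_prompt = True

    def on_retriever_end(self, documents, **kwargs):
        for doc in documents:
            source = {
                "name": doc.metadata["name"],
                "page_content": doc.page_content,
                "url": doc.metadata["url"],
                "icon": doc.metadata["category"],
                "updated_at": doc.metadata.get("updated_at", None),
            }
            self.queue.put(f"{SOURCE_TAG} {json.dumps(source)}")

    def on_llm_start(self, serialized, prompts, **kwargs):
        # The chain's condense-question pass starts with "Human:";
        # its tokens must not be streamed to the client.
        self.in_human_prompt = prompts[0].startswith("Human:")

    def on_llm_new_token(self, token, **kwargs):
        if not self.in_human_prompt:
            self.queue.put(token)

    def on_llm_end(self, response, **kwargs):
        if not self.in_human_prompt:
            self.queue.put(POISON_MESSAGE)


# qa_prompt / document_prompt from the deleted lines would be rebuilt here and
# passed via combine_docs_chain_kwargs, as before; elided to keep this short.
chat = ConversationalRetrievalChain.from_llm(
    llm=llm,
    retriever=store.as_retriever(),
    return_source_documents=True,
)


def ask_question(question, queue, session_id):
    # app.py now passes only the session id across the thread boundary, so
    # the chat history is reconstructed here instead of in the request handler.
    chat_history = ElasticsearchChatMessageHistory(
        client=elasticsearch_client, index=INDEX_CHAT_HISTORY, session_id=session_id
    )
    result = chat(
        {"question": question, "chat_history": chat_history.messages},
        callbacks=[QueueCallbackHandler(queue)],
    )
    chat_history.add_user_message(result["question"])
    chat_history.add_ai_message(result["answer"])


def parse_stream_message(session_id, queue: Queue):
    # The old inline generate() from app.py, renamed; SSE framing is unchanged.
    yield f"data: {SESSION_ID_TAG} {session_id}\n\n"
    while True:
        message = queue.get()
        if message == POISON_MESSAGE:  # poison message ends the stream
            break
        yield f"data: {message}\n\n"
    yield f"data: {DONE_TAG}\n\n"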
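
On the wire, nothing changes: the endpoint still emits the tagged SSE frames the old inline generate() produced. A hypothetical client for illustration; the host, port, question, and use of the requests library are assumptions, not part of this diff.

# client_example.py -- hypothetical consumer of the /api/chat SSE stream
import json
import requests  # assumption: available in the client environment

resp = requests.post(
    "http://localhost:5000/api/chat",  # assumed default Flask host/port
    json={"question": "What is our vacation policy?"},
    stream=True,
)

for raw in resp.iter_lines(decode_unicode=True):
    if not raw or not raw.startswith("data: "):
        continue  # skip blank separator lines between SSE frames
    payload = raw[len("data: "):]
    if payload.startswith("[SESSION_ID]"):
        print("session:", payload.split(" ", 1)[1])
    elif payload.startswith("[SOURCE]"):
        source = json.loads(payload.split(" ", 1)[1])
        print("source:", source["name"])
    elif payload == "[DONE]":
        break  # server signals end of the answer
    else:
        print(payload, end="")  # streamed answer tokens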