Spaces:

lfoppiano
/

document-qa

Running

App Files Files Community

Luca Foppiano committed on Nov 1, 2023

Commit

9997b7b

•

1 Parent(s): fcde626

fix env variables (#9)

Browse files

* avoid writing API keys to environment variables

Files changed (4) hide show

README.md +3 -3
document_qa/document_qa_engine.py +1 -0
requirements.txt +0 -1
streamlit_app.py +28 -21

README.md CHANGED Viewed

@@ -1,6 +1,6 @@
 ---
-title: 📝 Scientific Document Insight QA
-emoji:
 colorFrom: yellow
 colorTo: pink
 sdk: streamlit
@@ -10,7 +10,7 @@ pinned: false
 license: apache-2.0
 ---
-# DocumentIQA: Scientific Document Insight QA
 **Work in progress** :construction_worker:

 ---
+title: Scientific Document Insights Q/A
+emoji: 📝
 colorFrom: yellow
 colorTo: pink
 sdk: streamlit
 license: apache-2.0
 ---
+# DocumentIQA: Scientific Document Insights Q/A
 **Work in progress** :construction_worker:

document_qa/document_qa_engine.py CHANGED Viewed

@@ -205,6 +205,7 @@ class DocumentQAEngine:
         if doc_id:
             hash = doc_id
         else:
             hash = metadata[0]['hash']
         if hash not in self.embeddings_dict.keys():

         if doc_id:
             hash = doc_id
         else:
             hash = metadata[0]['hash']
         if hash not in self.embeddings_dict.keys():

requirements.txt CHANGED Viewed

@@ -19,7 +19,6 @@ chromadb==0.4.15
 tiktoken==0.4.0
 openai==0.27.7
 langchain==0.0.314
-promptlayer==0.2.4
 typing-inspect==0.9.0
 typing_extensions==4.8.0
 pydantic==2.4.2

 tiktoken==0.4.0
 openai==0.27.7
 langchain==0.0.314
 typing-inspect==0.9.0
 typing_extensions==4.8.0
 pydantic==2.4.2

streamlit_app.py CHANGED Viewed

@@ -10,7 +10,7 @@ from langchain.llms.huggingface_hub import HuggingFaceHub
 dotenv.load_dotenv(override=True)
 import streamlit as st
-from langchain.chat_models import PromptLayerChatOpenAI
 from langchain.embeddings import OpenAIEmbeddings, HuggingFaceEmbeddings
 from document_qa.document_qa_engine import DocumentQAEngine
@@ -52,7 +52,7 @@ if 'uploaded' not in st.session_state:
     st.session_state['uploaded'] = False
 st.set_page_config(
-    page_title="Document Insights QA",
     page_icon="📝",
     initial_sidebar_state="expanded",
     menu_items={
@@ -70,13 +70,21 @@ def new_file():
 # @st.cache_resource
-def init_qa(model):
     if model == 'chatgpt-3.5-turbo':
-        chat = PromptLayerChatOpenAI(model_name="gpt-3.5-turbo",
-                                     temperature=0,
-                                     return_pl_id=True,
-                                     pl_tags=["streamlit", "chatgpt"])
-        embeddings = OpenAIEmbeddings()
     elif model == 'mistral-7b-instruct-v0.1':
         chat = HuggingFaceHub(repo_id="mistralai/Mistral-7B-Instruct-v0.1",
                               model_kwargs={"temperature": 0.01, "max_length": 4096, "max_new_tokens": 2048})
@@ -162,12 +170,11 @@ with st.sidebar:
     st.markdown(
         ":warning: Mistral is free to use, however requests might hit limits of the huggingface free API and fail. :warning: ")
-    if model == 'mistral-7b-instruct-v0.1' or model == 'llama-2-70b-chat':
         if 'HUGGINGFACEHUB_API_TOKEN' not in os.environ:
             api_key = st.text_input('Huggingface API Key', type="password")
-            st.markdown(
-                "Get it [here](https://huggingface.co/docs/hub/security-tokens)")
         else:
             api_key = os.environ['HUGGINGFACEHUB_API_TOKEN']
@@ -176,33 +183,33 @@ with st.sidebar:
             if model not in st.session_state['rqa'] or model not in st.session_state['api_keys']:
                 with st.spinner("Preparing environment"):
                     st.session_state['api_keys'][model] = api_key
-                    if 'HUGGINGFACEHUB_API_TOKEN' not in os.environ:
-                        os.environ["HUGGINGFACEHUB_API_TOKEN"] = api_key
                     st.session_state['rqa'][model] = init_qa(model)
-    elif model == 'chatgpt-3.5-turbo':
         if 'OPENAI_API_KEY' not in os.environ:
             api_key = st.text_input('OpenAI API Key', type="password")
-            st.markdown(
-                "Get it [here](https://platform.openai.com/account/api-keys)")
         else:
             api_key = os.environ['OPENAI_API_KEY']
         if api_key:
-            # st.session_state['api_key'] = is_api_key_provided = True
             if model not in st.session_state['rqa'] or model not in st.session_state['api_keys']:
                 with st.spinner("Preparing environment"):
                     st.session_state['api_keys'][model] = api_key
                     if 'OPENAI_API_KEY' not in os.environ:
-                        os.environ['OPENAI_API_KEY'] = api_key
-                    st.session_state['rqa'][model] = init_qa(model)
     # else:
     #     is_api_key_provided = st.session_state['api_key']
-st.title("📝 Scientific Document Insight QA")
 st.subheader("Upload a scientific article in PDF, ask questions, get insights.")
-st.markdown(":warning: Do not upload sensitive data. We **temporarily** store text from the uploaded PDF documents solely for the purpose of processing your request, and we **do not assume responsibility** for any subsequent use or handling of the data submitted to third parties LLMs.")
 uploaded_file = st.file_uploader("Upload an article", type=("pdf", "txt"), on_change=new_file,
                                  disabled=st.session_state['model'] is not None and st.session_state['model'] not in

 dotenv.load_dotenv(override=True)
 import streamlit as st
+from langchain.chat_models import ChatOpenAI
 from langchain.embeddings import OpenAIEmbeddings, HuggingFaceEmbeddings
 from document_qa.document_qa_engine import DocumentQAEngine
     st.session_state['uploaded'] = False
 st.set_page_config(
+    page_title="Scientific Document Insights Q/A",
     page_icon="📝",
     initial_sidebar_state="expanded",
     menu_items={
 # @st.cache_resource
+def init_qa(model, api_key=None):
     if model == 'chatgpt-3.5-turbo':
+        if api_key:
+            chat = ChatOpenAI(model_name="gpt-3.5-turbo",
+                              temperature=0,
+                              openai_api_key=api_key,
+                              frequency_penalty=0.1)
+            embeddings = OpenAIEmbeddings(openai_api_key=api_key)
+        else:
+            chat = ChatOpenAI(model_name="gpt-3.5-turbo",
+                              temperature=0,
+                              frequency_penalty=0.1)
+            embeddings = OpenAIEmbeddings()
     elif model == 'mistral-7b-instruct-v0.1':
         chat = HuggingFaceHub(repo_id="mistralai/Mistral-7B-Instruct-v0.1",
                               model_kwargs={"temperature": 0.01, "max_length": 4096, "max_new_tokens": 2048})
     st.markdown(
         ":warning: Mistral is free to use, however requests might hit limits of the huggingface free API and fail. :warning: ")
+    if model == 'mistral-7b-instruct-v0.1' and model not in st.session_state['api_keys']:
         if 'HUGGINGFACEHUB_API_TOKEN' not in os.environ:
             api_key = st.text_input('Huggingface API Key', type="password")
+            st.markdown("Get it [here](https://huggingface.co/docs/hub/security-tokens)")
         else:
             api_key = os.environ['HUGGINGFACEHUB_API_TOKEN']
             if model not in st.session_state['rqa'] or model not in st.session_state['api_keys']:
                 with st.spinner("Preparing environment"):
                     st.session_state['api_keys'][model] = api_key
+                    # if 'HUGGINGFACEHUB_API_TOKEN' not in os.environ:
+                    #     os.environ["HUGGINGFACEHUB_API_TOKEN"] = api_key
                     st.session_state['rqa'][model] = init_qa(model)
+    elif model == 'chatgpt-3.5-turbo' and model not in st.session_state['api_keys']:
         if 'OPENAI_API_KEY' not in os.environ:
             api_key = st.text_input('OpenAI API Key', type="password")
+            st.markdown("Get it [here](https://platform.openai.com/account/api-keys)")
         else:
             api_key = os.environ['OPENAI_API_KEY']
         if api_key:
             if model not in st.session_state['rqa'] or model not in st.session_state['api_keys']:
                 with st.spinner("Preparing environment"):
                     st.session_state['api_keys'][model] = api_key
                     if 'OPENAI_API_KEY' not in os.environ:
+                        st.session_state['rqa'][model] = init_qa(model, api_key)
+                    else:
+                        st.session_state['rqa'][model] = init_qa(model)
     # else:
     #     is_api_key_provided = st.session_state['api_key']
+st.title("📝 Scientific Document Insights Q/A")
 st.subheader("Upload a scientific article in PDF, ask questions, get insights.")
+st.markdown(
+    ":warning: Do not upload sensitive data. We **temporarily** store text from the uploaded PDF documents solely for the purpose of processing your request, and we **do not assume responsibility** for any subsequent use or handling of the data submitted to third parties LLMs.")
 uploaded_file = st.file_uploader("Upload an article", type=("pdf", "txt"), on_change=new_file,
                                  disabled=st.session_state['model'] is not None and st.session_state['model'] not in