shreyasiv committed
Commit 7ac0c16 • 1 Parent(s): 77482e0

Upload 7 files

Files changed (7)
  1. app.py +62 -0
  2. data.csv +0 -0
  3. emb.py +80 -0
  4. get-pip.py +0 -0
  5. requirements.txt +77 -0
  6. setup.sh +38 -0
  7. tempfile +0 -0
app.py ADDED
@@ -0,0 +1,62 @@
+ from tempfile import NamedTemporaryFile
+ from langchain.agents import create_csv_agent
+ from langchain.llms import OpenAI
+ from dotenv import load_dotenv
+ import os
+ import streamlit as st
+ import pandas as pd
+ from streamlit_chat import message
+ from langchain.embeddings.openai import OpenAIEmbeddings
+ from langchain.chat_models import ChatOpenAI
+ from langchain.chains import ConversationalRetrievalChain
+ from langchain.document_loaders.csv_loader import CSVLoader
+ from langchain.vectorstores import FAISS
+
+ def main():
+     load_dotenv()
+
+     # Load the OpenAI API key from the environment variable
+     api_key = os.getenv("OPENAI_API_KEY")
+     if api_key is None or api_key == "":
+         st.error("OPENAI_API_KEY is not set")
+         return
+
+     st.set_page_config(page_title="Insightly")
+     st.sidebar.image("/home/oem/Downloads/insightly_wbg.png", use_column_width=True)
+     st.header("Data Analysis 📈")
+
+     csv_files = st.file_uploader("Upload CSV files", type="csv", accept_multiple_files=True)
+     if csv_files:
+         llm = OpenAI(temperature=0)
+         user_input = st.text_input("Question here:")
+
+         # Iterate over each CSV file
+         for csv_file in csv_files:
+             with NamedTemporaryFile(delete=False) as f:
+                 f.write(csv_file.getvalue())
+                 f.flush()
+                 df = pd.read_csv(f.name)
+
+                 # Perform any necessary data preprocessing or feature engineering here
+                 # You can modify the code based on your specific requirements
+
+                 # Example: Accessing columns from the DataFrame
+                 # column_data = df["column_name"]
+
+                 # Example: Applying transformations or calculations to the data
+                 # transformed_data = column_data.apply(lambda x: x * 2)
+
+                 # Example: Using the preprocessed data with the OpenAI API
+                 # llm_response = llm.predict(transformed_data)
+
+                 if user_input:
+                     # Pass the user input to the OpenAI agent for processing
+                     agent = create_csv_agent(llm, f.name, verbose=True)
+                     response = agent.run(user_input)
+
+                     st.write(f"CSV File: {csv_file.name}")
+                     st.write("Response:")
+                     st.write(response)
+
+ if __name__ == "__main__":
+     main()
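
For reference, the agent flow that app.py wraps in Streamlit can be exercised on its own. The sketch below is not part of the commit; it assumes langchain==0.0.219 and python-dotenv from requirements.txt, an OPENAI_API_KEY in a local .env file, the data.csv shipped in this commit, and a hypothetical question string.

from dotenv import load_dotenv
from langchain.agents import create_csv_agent
from langchain.llms import OpenAI

load_dotenv()                # picks up OPENAI_API_KEY from .env
llm = OpenAI(temperature=0)  # deterministic answers for data questions
agent = create_csv_agent(llm, "data.csv", verbose=True)
print(agent.run("How many rows does this file have?"))  # hypothetical question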
data.csv ADDED
The diff for this file is too large to render. See raw diff
 
emb.py ADDED
@@ -0,0 +1,80 @@
+ import os
+
+ import openai
+
+ # Set up the OpenAI API credentials (read from the environment rather than
+ # hardcoding a secret key in the source)
+ openai.api_key = os.getenv("OPENAI_API_KEY")
+
+ # Code snippet
+ code = """
+ from tempfile import NamedTemporaryFile
+ from langchain.agents import create_csv_agent
+ from langchain.llms import OpenAI
+ from dotenv import load_dotenv
+ import os
+ import streamlit as st
+ import pandas as pd
+
+ def main():
+     load_dotenv()
+
+     # Load the OpenAI API key from the environment variable
+     api_key = os.getenv("OPENAI_API_KEY")
+     if api_key is None or api_key == "":
+         st.error("OPENAI_API_KEY is not set")
+         return
+
+     st.set_page_config(page_title="Insightly")
+     st.sidebar.image("/home/oem/Downloads/insightly_wbg.png", use_column_width=True)
+     st.header("Data Analysis 📈")
+
+     csv_files = st.file_uploader("Upload CSV files", type="csv", accept_multiple_files=True)
+     if csv_files:
+         llm = OpenAI(temperature=0)
+         user_input = st.text_input("Question here:")
+
+         # Iterate over each CSV file
+         for csv_file in csv_files:
+             with NamedTemporaryFile(delete=False) as f:
+                 f.write(csv_file.getvalue())
+                 f.flush()
+                 df = pd.read_csv(f.name)
+
+                 # Perform any necessary data preprocessing or feature engineering here
+                 # You can modify the code based on your specific requirements
+
+                 # Example: Accessing columns from the DataFrame
+                 # column_data = df["column_name"]
+
+                 # Example: Applying transformations or calculations to the data
+                 # transformed_data = column_data.apply(lambda x: x * 2)
+
+                 # Example: Using the preprocessed data with the OpenAI API
+                 # llm_response = llm.predict(transformed_data)
+
+                 if user_input:
+                     # Pass the user input to the OpenAI agent for processing
+                     agent = create_csv_agent(llm, f.name, verbose=True)
+                     response = agent.run(user_input)
+
+                     st.write(f"CSV File: {csv_file.name}")
+                     st.write("Response:")
+                     st.write(response)
+
+ if __name__ == "__main__":
+     main()
+ """
+
+ # Retrieve the embeddings. The Completion endpoint does not return embeddings,
+ # so use the Embedding endpoint with an embedding model instead.
+ response = openai.Embedding.create(
+     model="text-embedding-ada-002",
+     input=[code],
+ )
+
+ # Extract the embeddings from the response
+ embeddings = response["data"][0]["embedding"]
+
+ # Print the embeddings
+ print(embeddings)
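
One way to use the vector emb.py prints is a similarity comparison between two snippets. The sketch below is not part of the commit; it assumes openai==0.27.8 and numpy==1.25.0 from requirements.txt, an OPENAI_API_KEY in the environment, and hypothetical example strings.

import numpy as np
import openai

def embed(text):
    # Embedding endpoint of openai==0.27.8; ada-002 returns a 1536-dim vector
    resp = openai.Embedding.create(model="text-embedding-ada-002", input=[text])
    return np.array(resp["data"][0]["embedding"])

a = embed("load a CSV into pandas")            # hypothetical snippets
b = embed("read a CSV file with pd.read_csv")
cosine = float(a @ b / (np.linalg.norm(a) * np.linalg.norm(b)))
print(cosine)  # closer to 1.0 means more similar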
get-pip.py ADDED
The diff for this file is too large to render. See raw diff
 
requirements.txt ADDED
@@ -0,0 +1,77 @@
+ aiohttp==3.8.4
+ aiosignal==1.3.1
+ altair==5.0.1
+ async-timeout==4.0.2
+ attrs==23.1.0
+ blinker==1.6.2
+ cachetools==5.3.1
+ certifi==2023.5.7
+ charset-normalizer==3.1.0
+ click==8.1.3
+ Cython==0.29.35
+ dataclasses-json==0.5.8
+ decorator==5.1.1
+ filelock==3.12.2
+ frozenlist==1.3.3
+ fsspec==2023.6.0
+ gitdb==4.0.10
+ GitPython==3.1.31
+ greenlet==2.0.2
+ huggingface==0.0.1
+ huggingface-hub==0.15.1
+ idna==3.4
+ importlib-metadata==6.7.0
+ Jinja2==3.1.2
+ jsonschema==4.17.3
+ langchain==0.0.219
+ langchainplus-sdk==0.0.17
+ markdown-it-py==3.0.0
+ MarkupSafe==2.1.3
+ marshmallow==3.19.0
+ marshmallow-enum==1.5.1
+ mdurl==0.1.2
+ multidict==6.0.4
+ mypy-extensions==1.0.0
+ numexpr==2.8.4
+ numpy==1.25.0
+ openai==0.27.8
+ openapi-schema-pydantic==1.2.4
+ packaging==23.1
+ pandas==2.0.3
+ Pillow==9.5.0
+ protobuf==4.23.3
+ pyarrow==12.0.1
+ pydantic==1.10.9
+ pydeck==0.8.1b0
+ Pygments==2.15.1
+ Pympler==1.0.1
+ pyrsistent==0.19.3
+ python-dateutil==2.8.2
+ python-dotenv==1.0.0
+ pytz==2023.3
+ pytz-deprecation-shim==0.1.0.post0
+ PyYAML==6.0
+ regex==2023.6.3
+ requests==2.31.0
+ rich==13.4.2
+ safetensors==0.3.1
+ six==1.16.0
+ smmap==5.0.0
+ SQLAlchemy==2.0.17
+ streamlit==1.24.0
+ streamlit-chat==0.1.1
+ tabulate==0.9.0
+ tenacity==8.2.2
+ toml==0.10.2
+ toolz==0.12.0
+ tornado==6.3.2
+ tqdm==4.65.0
+ typing-inspect==0.9.0
+ typing_extensions==4.6.3
+ tzdata==2023.3
+ tzlocal==4.3.1
+ urllib3==2.0.3
+ validators==0.20.0
+ watchdog==3.0.0
+ yarl==1.9.2
+ zipp==3.15.0
setup.sh ADDED
@@ -0,0 +1,38 @@
+ from tempfile import NamedTemporaryFile
+
+ import pandas as pd
+ import streamlit as st
+ from langchain.agents import create_csv_agent
+ from langchain.llms import OpenAI
+
+ def display_ui():
+     st.sidebar.image("/home/oem/Downloads/insightly_wbg.png", use_column_width=True)
+     st.header("Data Analysis 📈")
+
+     csv_files = st.file_uploader("Upload CSV files", type="csv", accept_multiple_files=True)
+     if csv_files:
+         llm = OpenAI(temperature=0)
+         user_input = st.text_input("Question here:")
+
+         # Iterate over each CSV file
+         for csv_file in csv_files:
+             with NamedTemporaryFile(delete=False) as f:
+                 f.write(csv_file.getvalue())
+                 f.flush()
+                 df = pd.read_csv(f.name)
+
+                 # Perform any necessary data preprocessing or feature engineering here
+                 # You can modify the code based on your specific requirements
+
+                 # Example: Accessing columns from the DataFrame
+                 # column_data = df["column_name"]
+
+                 # Example: Applying transformations or calculations to the data
+                 # transformed_data = column_data.apply(lambda x: x * 2)
+
+                 # Example: Using the preprocessed data with the OpenAI API
+                 # llm_response = llm.predict(transformed_data)
+
+                 if user_input:
+                     # Pass the user input to the OpenAI agent for processing
+                     agent = create_csv_agent(llm, f.name, verbose=True)
+                     response = agent.run(user_input)
+
+                     st.write(f"CSV File: {csv_file.name}")
+                     st.write("Response:")
+                     st.write(response)
tempfile ADDED
The diff for this file is too large to render. See raw diff