mr

Build error

App Files Community

JPBianchi committed on May 16

Commit

0a6f805

•

1 Parent(s): 88ae985

renamed method in processing

Browse files

Files changed (3) hide show

app/engine/processing.py +1 -1
app/engine/vectorstore.py +0 -1
app/main.py +1 -42

app/engine/processing.py CHANGED Viewed

@@ -42,7 +42,7 @@ def process_pdf(filepath:str) -> dict:
     logger.info(f"Successfully vectorized PDF content")
     return new_content
-def process_question(question:str) -> List[str]:
     ans = finrag_vectorstore.hybrid_search(query=question, limit=3, alpha=0.8)
     return ans

     logger.info(f"Successfully vectorized PDF content")
     return new_content
+def vector_search(question:str) -> List[str]:
     ans = finrag_vectorstore.hybrid_search(query=question, limit=3, alpha=0.8)
     return ans

app/engine/vectorstore.py CHANGED Viewed

@@ -62,7 +62,6 @@ class VectorStore:
             self.client = WeaviateWCS(endpoint=self.url,
                                       api_key=self.api_key,
                                       model_name_or_path=self.model_path)
-            print('After client creation')
         except Exception as e:
             # raise Exception(f"Could not create Weaviate client: {e}")

             self.client = WeaviateWCS(endpoint=self.url,
                                       api_key=self.api_key,
                                       model_name_or_path=self.model_path)
         except Exception as e:
             # raise Exception(f"Could not create Weaviate client: {e}")

app/main.py CHANGED Viewed

@@ -32,8 +32,6 @@ if environment == "dev":
     )
 try:
-    # will not work on HuggingFace
-    # and Liquidity dont' have the env anyway
     load_dotenv(find_dotenv('env'))
 except Exception as e:
@@ -56,7 +54,7 @@ def read_root():
 def ping():
     """ Testing """
     logger.info("Someone is pinging the server")
-    return {"answer": str(random.random() * 100)}
 @app.delete("/erase_data/")
@@ -168,14 +166,6 @@ async def ragit(question: Question):
     except Exception as e:
         raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e))
-# TODO
-#   rejects searches with a search score below a threshold
-#   scrape the tables (and find a way to reject them from the text search -> LLamaparse)
-#   see why the filename in search results is always empty
-#       -> add it to the search results to avoid confusion Google-Amazon for instance
-#   add python scripts to create index, rag etc
 if __name__ == '__main__':
     import uvicorn
     from os import getenv
@@ -198,34 +188,3 @@ if __name__ == '__main__':
 # curl -X POST http://localhost:80/ask/ -H "Content-Type: application/json" -d '{"question": "what is Amazon loss"}'
 # curl -X POST http://localhost:80/ragit/ -H "Content-Type: application/json" -d '{"question": "Does ATT have postpaid phone customers?"}'
-# TODO
-# import unittest
-# from unitesting_utils import load_impact_theory_data
-# class TestSplitContents(unittest.TestCase):
-#     '''
-#     Unit test to ensure proper functionality of split_contents function
-#     '''
-#     def test_split_contents(self):
-#         import tiktoken
-#         from llama_index.text_splitter import SentenceSplitter
-#         data = load_impact_theory_data()
-#         subset = data[:3]
-#         chunk_size = 256
-#         chunk_overlap = 0
-#         encoding = tiktoken.encoding_for_model('gpt-3.5-turbo-0613')
-#         gpt35_txt_splitter = SentenceSplitter(chunk_size=chunk_size, tokenizer=encoding.encode, chunk_overlap=chunk_overlap)
-#         results = split_contents(subset, gpt35_txt_splitter)
-#         self.assertEqual(len(results), 3)
-#         self.assertEqual(len(results[0]), 83)
-#         self.assertEqual(len(results[1]), 178)
-#         self.assertEqual(len(results[2]), 144)
-#         self.assertTrue(isinstance(results, list))
-#         self.assertTrue(isinstance(results[0], list))
-#         self.assertTrue(isinstance(results[0][0], str))
-# unittest.TextTestRunner().run(unittest.TestLoader().loadTestsFromTestCase(TestSplitContents))

     )
 try:
     load_dotenv(find_dotenv('env'))
 except Exception as e:
 def ping():
     """ Testing """
     logger.info("Someone is pinging the server")
+    return {"answer": str(int(random.random() * 100))}
 @app.delete("/erase_data/")
     except Exception as e:
         raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=str(e))
 if __name__ == '__main__':
     import uvicorn
     from os import getenv
 # curl -X POST http://localhost:80/ask/ -H "Content-Type: application/json" -d '{"question": "what is Amazon loss"}'
 # curl -X POST http://localhost:80/ragit/ -H "Content-Type: application/json" -d '{"question": "Does ATT have postpaid phone customers?"}'