gkrishnan committed on
Commit
b9578f7
1 Parent(s): 7a31d3e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +8 -0
app.py CHANGED
@@ -6,6 +6,14 @@ from langchain.chains import RetrievalQA
6
  from transformers import AutoTokenizer
7
  import pickle
8
  import os
 
 
 
 
 
 
 
 
9
 
10
  with open('shakespeare.pkl', 'rb') as fp:
11
  data = pickle.load(fp)
 
6
  from transformers import AutoTokenizer
7
  import pickle
8
  import os
9
+ from langchain.document_loaders import BSHTMLLoader, DirectoryLoader
10
+
11
+ bshtml_dir_loader = DirectoryLoader('./data/', loader_cls = BSHTMLLoader)
12
+
13
+ data = bshtml_dir_loader.load()
14
+
15
+ with open("shakespeare.pkl", "wb") as fp:
16
+ pickle.dump(data, fp)
17
 
18
  with open('shakespeare.pkl', 'rb') as fp:
19
  data = pickle.load(fp)