Spaces:

dammy
/

chatPDF

Runtime error

dammy committed on Nov 17, 2023

Commit

2a5a407

1 Parent(s): cc385c2

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -45,40 +45,33 @@ def local_query(query, context):
 def run_query(btn, history, query):
-    global count
-    count = 1
-    if count ==1:
-        print('inside')
-        print(count)
-        file_name = btn.name
-        loader = PDFMinerLoader(file_name)
-        doc = loader.load()
-        text_splitter = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0)
-        texts = text_splitter.split_documents(doc)
-        texts = [i.page_content for i in texts]
-        doc_emb = st_model.encode(texts)
-        doc_emb = doc_emb.tolist()
-        ids = [str(uuid.uuid1()) for _ in doc_emb]
-        client = chromadb.Client()
-        collection = client.create_collection("test_db")
-        collection.add(
-            embeddings=doc_emb,
-            documents=texts,
-            ids=ids
-        )
-        count+=1
-        print(count)
     context = get_context(query, collection)

 def run_query(btn, history, query):
+    # file_name = btn.name
+    # loader = PDFMinerLoader(file_name)
+    # doc = loader.load()
+    # text_splitter = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0)
+    # texts = text_splitter.split_documents(doc)
+    # texts = [i.page_content for i in texts]
+    # doc_emb = st_model.encode(texts)
+    # doc_emb = doc_emb.tolist()
+    # ids = [str(uuid.uuid1()) for _ in doc_emb]
+    # client = chromadb.Client()
+    # collection = client.create_collection("test_db")
+    # collection.add(
+    #     embeddings=doc_emb,
+    #     documents=texts,
+    #     ids=ids
+    # )
     context = get_context(query, collection)