Spaces:
Running on T4
Update auditqa/doc_process.py
Browse files
- auditqa/doc_process.py +3 -2
auditqa/doc_process.py
CHANGED
|
@@ -14,7 +14,8 @@ path_to_data = "./data/"
|
|
| 14 |
|
| 15 |
def process_pdf():
|
| 16 |
files = {'MWTS2021':'./data/MWTS2021.pdf',
|
| 17 |
-
'MWTS2022':'./data/MWTS2022.pdf'}
|
|
|
|
| 18 |
docs = {}
|
| 19 |
for file,value in files.items():
|
| 20 |
try:
|
|
@@ -46,7 +47,7 @@ def process_pdf():
|
|
| 46 |
|
| 47 |
|
| 48 |
embeddings = HuggingFaceEmbeddings(
|
| 49 |
-
model_name="
|
| 50 |
)
|
| 51 |
|
| 52 |
qdrant_collections = {}
|
|
|
|
| 14 |
|
| 15 |
def process_pdf():
|
| 16 |
files = {'MWTS2021':'./data/MWTS2021.pdf',
|
| 17 |
+
'MWTS2022':'./data/MWTS2022.pdf',
|
| 18 |
+
'Consolidated2021':'./data/Consolidated2021.pdf'}
|
| 19 |
docs = {}
|
| 20 |
for file,value in files.items():
|
| 21 |
try:
|
|
|
|
| 47 |
|
| 48 |
|
| 49 |
embeddings = HuggingFaceEmbeddings(
|
| 50 |
+
model_name="BAAI/bge-small-en-v1.5"
|
| 51 |
)
|
| 52 |
|
| 53 |
qdrant_collections = {}
|