Spaces: Running on T4
Update auditqa/doc_process.py
Browse files
- auditqa/doc_process.py +2 -2
auditqa/doc_process.py
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
import glob
|
| 2 |
import os
|
| 3 |
-
from langchain_text_splitters import MarkdownHeaderTextSplitter
|
| 4 |
-
from langchain_community.document_loaders import UnstructuredMarkdownLoader
|
| 5 |
from langchain.text_splitter import RecursiveCharacterTextSplitter, SentenceTransformersTokenTextSplitter
|
| 6 |
from transformers import AutoTokenizer
|
| 7 |
from langchain_community.document_loaders import PyMuPDFLoader
|
|
|
|
| 1 |
import glob
|
| 2 |
import os
|
| 3 |
+
#from langchain_text_splitters import MarkdownHeaderTextSplitter
|
| 4 |
+
#from langchain_community.document_loaders import UnstructuredMarkdownLoader
|
| 5 |
from langchain.text_splitter import RecursiveCharacterTextSplitter, SentenceTransformersTokenTextSplitter
|
| 6 |
from transformers import AutoTokenizer
|
| 7 |
from langchain_community.document_loaders import PyMuPDFLoader
|