Commit
·
c7743de
1
Parent(s):
6381fc9
Revert "Thử giảm kích thước image"
Browse files
This reverts commit 1be45942019dda8848ed2e743a57394275ca0b37.
- data_processing.py +1 -1
- requirements.txt +4 -2
data_processing.py
CHANGED
|
@@ -17,7 +17,7 @@ import docling
|
|
| 17 |
from docling.document_converter import DocumentConverter, PdfFormatOption
|
| 18 |
from docling.datamodel.base_models import InputFormat
|
| 19 |
from docling.datamodel.pipeline_options import PdfPipelineOptions
|
| 20 |
-
|
| 21 |
import pandas as pd
|
| 22 |
import gradio as gr
|
| 23 |
from pymongo import MongoClient, UpdateOne
|
|
|
|
| 17 |
from docling.document_converter import DocumentConverter, PdfFormatOption
|
| 18 |
from docling.datamodel.base_models import InputFormat
|
| 19 |
from docling.datamodel.pipeline_options import PdfPipelineOptions
|
| 20 |
+
from docling.backend.pypdfium2_backend import PyPdfiumDocumentBackend
|
| 21 |
import pandas as pd
|
| 22 |
import gradio as gr
|
| 23 |
from pymongo import MongoClient, UpdateOne
|
requirements.txt
CHANGED
|
@@ -1,4 +1,4 @@
|
|
| 1 |
-
|
| 2 |
transformers
|
| 3 |
sentence-transformers
|
| 4 |
FlagEmbedding
|
|
@@ -11,4 +11,6 @@ requests
|
|
| 11 |
gradio
|
| 12 |
python-dotenv
|
| 13 |
docling
|
| 14 |
-
|
|
|
|
|
|
|
|
|
| 1 |
+
torch
|
| 2 |
transformers
|
| 3 |
sentence-transformers
|
| 4 |
FlagEmbedding
|
|
|
|
| 11 |
gradio
|
| 12 |
python-dotenv
|
| 13 |
docling
|
| 14 |
+
pandas
|
| 15 |
+
openpyxl
|
| 16 |
+
pypdfium2
|