Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
wangsen
MinerU
Commits
07eaa2d7
Unverified
Commit
07eaa2d7
authored
Mar 20, 2025
by
Xiaomeng Zhao
Committed by
GitHub
Mar 20, 2025
Browse files
Merge pull request #1959 from myhloli/dev
Dev push
parents
132c16ad
2f40fa7d
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
16 additions
and
7 deletions
+16
-7
magic_pdf/model/doc_analyze_by_custom_model.py
magic_pdf/model/doc_analyze_by_custom_model.py
+4
-4
magic_pdf/pdf_parse_union_core_v2.py
magic_pdf/pdf_parse_union_core_v2.py
+12
-3
No files found.
magic_pdf/model/doc_analyze_by_custom_model.py
View file @
07eaa2d7
...
...
@@ -257,13 +257,13 @@ def may_batch_image_analyze(
if
str
(
device
).
startswith
(
'npu'
)
or
str
(
device
).
startswith
(
'cuda'
):
gpu_memory
=
int
(
os
.
getenv
(
'VIRTUAL_VRAM_SIZE'
,
round
(
get_vram
(
device
))))
if
gpu_memory
is
not
None
:
if
gpu_memory
>=
20
:
if
gpu_memory
>=
16
:
batch_ratio
=
16
elif
gpu_memory
>=
1
5
:
elif
gpu_memory
>=
1
2
:
batch_ratio
=
8
elif
gpu_memory
>=
10
:
elif
gpu_memory
>=
8
:
batch_ratio
=
4
elif
gpu_memory
>=
7
:
elif
gpu_memory
>=
6
:
batch_ratio
=
2
else
:
batch_ratio
=
1
...
...
magic_pdf/pdf_parse_union_core_v2.py
View file @
07eaa2d7
...
...
@@ -333,8 +333,14 @@ def txt_spans_extract_v2(pdf_page, spans, all_bboxes, all_discarded_blocks, lang
def
model_init
(
model_name
:
str
):
from
transformers
import
LayoutLMv3ForTokenClassification
device
=
torch
.
device
(
get_device
())
device_name
=
get_device
()
bf_16_support
=
False
if
device_name
.
startswith
(
"cuda"
):
bf_16_support
=
torch
.
cuda
.
is_bf16_supported
()
elif
device_name
.
startswith
(
"mps"
):
bf_16_support
=
True
device
=
torch
.
device
(
device_name
)
if
model_name
==
'layoutreader'
:
# 检测modelscope的缓存目录是否存在
layoutreader_model_dir
=
get_local_layoutreader_model_dir
()
...
...
@@ -349,7 +355,10 @@ def model_init(model_name: str):
model
=
LayoutLMv3ForTokenClassification
.
from_pretrained
(
'hantian/layoutreader'
)
model
.
to
(
device
).
eval
()
if
bf_16_support
:
model
.
to
(
device
).
eval
().
bfloat16
()
else
:
model
.
to
(
device
).
eval
()
else
:
logger
.
error
(
'model name not allow'
)
exit
(
1
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment