Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
wangsen
paddle_dbnet
Commits
8e05d54c
Commit
8e05d54c
authored
Dec 20, 2021
by
WenmuZhou
Browse files
fix win train bug
parent
dc51469b
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
36 additions
and
14 deletions
+36
-14
ppstructure/vqa/eval_ser.py
ppstructure/vqa/eval_ser.py
+1
-1
ppstructure/vqa/train_ser.py
ppstructure/vqa/train_ser.py
+2
-2
ppstructure/vqa/xfun.py
ppstructure/vqa/xfun.py
+33
-11
No files found.
ppstructure/vqa/eval_ser.py
View file @
8e05d54c
...
...
@@ -61,7 +61,7 @@ def eval(args):
eval_dataloader
=
paddle
.
io
.
DataLoader
(
eval_dataset
,
batch_size
=
args
.
per_gpu_eval_batch_size
,
num_workers
=
0
,
num_workers
=
8
,
use_shared_memory
=
True
,
collate_fn
=
None
,
)
...
...
ppstructure/vqa/train_ser.py
View file @
8e05d54c
...
...
@@ -94,14 +94,14 @@ def train(args):
train_dataloader
=
paddle
.
io
.
DataLoader
(
train_dataset
,
batch_sampler
=
train_sampler
,
num_workers
=
0
,
num_workers
=
8
,
use_shared_memory
=
True
,
collate_fn
=
None
,
)
eval_dataloader
=
paddle
.
io
.
DataLoader
(
eval_dataset
,
batch_size
=
args
.
per_gpu_eval_batch_size
,
num_workers
=
0
,
num_workers
=
8
,
use_shared_memory
=
True
,
collate_fn
=
None
,
)
...
...
ppstructure/vqa/xfun.py
View file @
8e05d54c
...
...
@@ -79,14 +79,36 @@ class XFUNDataset(Dataset):
self
.
entities_labels
=
{
'HEADER'
:
0
,
'QUESTION'
:
1
,
'ANSWER'
:
2
}
self
.
return_keys
=
{
'bbox'
:
'np'
,
'input_ids'
:
'np'
,
'labels'
:
'np'
,
'attention_mask'
:
'np'
,
'image'
:
'np'
,
'token_type_ids'
:
'np'
,
'entities'
:
'dict'
,
'relations'
:
'dict'
,
'bbox'
:
{
'type'
:
'np'
,
'dtype'
:
'int64'
},
'input_ids'
:
{
'type'
:
'np'
,
'dtype'
:
'int64'
},
'labels'
:
{
'type'
:
'np'
,
'dtype'
:
'int64'
},
'attention_mask'
:
{
'type'
:
'np'
,
'dtype'
:
'int64'
},
'image'
:
{
'type'
:
'np'
,
'dtype'
:
'float32'
},
'token_type_ids'
:
{
'type'
:
'np'
,
'dtype'
:
'int64'
},
'entities'
:
{
'type'
:
'dict'
},
'relations'
:
{
'type'
:
'dict'
}
}
if
load_mode
==
"all"
:
...
...
@@ -103,7 +125,7 @@ class XFUNDataset(Dataset):
return_special_tokens_mask
=
False
):
# Padding
needs_to_be_padded
=
pad_to_max_seq_len
and
\
max_seq_len
and
len
(
encoded_inputs
[
"input_ids"
])
<
max_seq_len
max_seq_len
and
len
(
encoded_inputs
[
"input_ids"
])
<
max_seq_len
if
needs_to_be_padded
:
difference
=
max_seq_len
-
len
(
encoded_inputs
[
"input_ids"
])
...
...
@@ -412,8 +434,8 @@ class XFUNDataset(Dataset):
return_data
=
{}
for
k
,
v
in
data
.
items
():
if
k
in
self
.
return_keys
:
if
self
.
return_keys
[
k
]
==
'np'
:
v
=
np
.
array
(
v
)
if
self
.
return_keys
[
k
]
[
'type'
]
==
'np'
:
v
=
np
.
array
(
v
,
dtype
=
self
.
return_keys
[
k
][
'dtype'
]
)
return_data
[
k
]
=
v
return
return_data
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment