Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
opencompass
Commits
14fdecfe
Unverified
Commit
14fdecfe
authored
Sep 27, 2023
by
Kevin Wang
Committed by
GitHub
Sep 27, 2023
Browse files
[Dataset] add GLUE QQP dataset (#438)
parent
d8354fe5
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
55 additions
and
0 deletions
+55
-0
configs/datasets/GLUE_QQP/GLUE_QQP_ppl.py
configs/datasets/GLUE_QQP/GLUE_QQP_ppl.py
+4
-0
configs/datasets/GLUE_QQP/GLUE_QQP_ppl_250d00.py
configs/datasets/GLUE_QQP/GLUE_QQP_ppl_250d00.py
+51
-0
No files found.
configs/datasets/GLUE_QQP/GLUE_QQP_ppl.py
0 → 100644
View file @
14fdecfe
from
mmengine.config
import
read_base
# Bring QQP_datasets from the hash-suffixed sibling config into this module's
# namespace. The import is deliberately placed inside mmengine's read_base()
# context manager, and the name is intentionally unused here (hence the noqa).
with read_base():
    from .GLUE_QQP_ppl_250d00 import QQP_datasets  # noqa: F401, F403
configs/datasets/GLUE_QQP/GLUE_QQP_ppl_250d00.py
0 → 100644
View file @
14fdecfe
from
opencompass.openicl.icl_prompt_template
import
PromptTemplate
from
opencompass.openicl.icl_retriever
import
FixKRetriever
from
opencompass.openicl.icl_inferencer
import
PPLInferencer
from
opencompass.openicl.icl_evaluator
import
AccEvaluator
from
opencompass.datasets
import
HFDataset
# Instruction header that is interpolated at the front of every QQP prompt
# built in QQP_infer_cfg.
# NOTE(review): this text was recovered from a token-per-line extraction that
# drops whitespace adjacent to escape sequences -- confirm against the
# upstream file whether a space precedes the first "\n".
_hint = (
    "The following are semantic matching questions.\n"
    "Please determine whether the following two sentences are semantically duplicate: "
    "0 means not duplicate, 1 means duplicate.\n"
)
# Inference settings for QQP: templates for in-context examples and for the
# scored prompts, plus the retriever and inferencer classes to use.
QQP_infer_cfg = {
    # Rendering of a single in-context example, with its label filled in.
    'ice_template': {
        'type': PromptTemplate,
        'template': "Sentence one: {question1}\nSentence two: {question2}\nResult: {label}",
    },
    # One prompt per candidate label (0 and 1), keyed by that label.
    # '</E>' is registered as the ice_token; presumably it marks where the
    # in-context examples are spliced in -- confirm against PromptTemplate.
    'prompt_template': {
        'type': PromptTemplate,
        'template': {
            candidate: (
                f"{_hint}</E>Sentence one: {{question1}}\n"
                f"Sentence two: {{question2}}\n"
                f"Result: {candidate}"
            )
            for candidate in (0, 1)
        },
        'ice_token': '</E>',
    },
    'retriever': {'type': FixKRetriever},
    # fix_id_list names the example indices 0-4.
    'inferencer': {
        'type': PPLInferencer,
        'fix_id_list': [0, 1, 2, 3, 4],
    },
}
# Evaluation settings for QQP: predictions are scored with AccEvaluator.
QQP_eval_cfg = {
    'evaluator': {'type': AccEvaluator},
}
# Assemble one dataset entry per evaluated split of the `glue` / `qqp` dataset.
# Every entry shares the same inference and evaluation configs; only the
# reader's test_split (and the abbreviation derived from it) differs.
# NOTE(review): the public GLUE test split is usually distributed without gold
# labels -- confirm that accuracy on 'QQP-test' is meaningful.
QQP_datasets = []
for _split in ("validation", "test"):
    # A fresh reader config is created on each iteration, so entries do not
    # share this dict.
    QQP_reader_cfg = {
        'input_columns': ['question1', 'question2'],
        'output_column': 'label',
        'train_split': "train",
        'test_split': _split,
    }

    QQP_datasets.append({
        'abbr': 'QQP-' + _split,
        'type': HFDataset,
        'path': 'glue',
        'name': 'qqp',
        'reader_cfg': QQP_reader_cfg,
        'infer_cfg': QQP_infer_cfg,
        'eval_cfg': QQP_eval_cfg,
    })
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment