Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
chenpangpang
transformers
Commits
795b3e76
Commit
795b3e76
authored
Sep 27, 2019
by
Agrin Hilmkil
Browse files
Add docstring for processor method
parent
e31a4728
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
18 additions
and
0 deletions
+18
-0
transformers/data/processors/glue.py
transformers/data/processors/glue.py
+9
-0
transformers/data/processors/utils.py
transformers/data/processors/utils.py
+9
-0
No files found.
transformers/data/processors/glue.py
View file @
795b3e76
...
...
@@ -155,6 +155,7 @@ class MrpcProcessor(DataProcessor):
"""Processor for the MRPC data set (GLUE version)."""
def
get_example_from_tensor_dict
(
self
,
tensor_dict
):
"""See base class."""
return
InputExample
(
tensor_dict
[
'idx'
].
numpy
(),
tensor_dict
[
'sentence1'
].
numpy
().
decode
(
'utf-8'
),
tensor_dict
[
'sentence2'
].
numpy
().
decode
(
'utf-8'
),
...
...
@@ -194,6 +195,7 @@ class MnliProcessor(DataProcessor):
"""Processor for the MultiNLI data set (GLUE version)."""
def
get_example_from_tensor_dict
(
self
,
tensor_dict
):
"""See base class."""
return
InputExample
(
tensor_dict
[
'idx'
].
numpy
(),
tensor_dict
[
'premise'
].
numpy
().
decode
(
'utf-8'
),
tensor_dict
[
'hypothesis'
].
numpy
().
decode
(
'utf-8'
),
...
...
@@ -243,6 +245,7 @@ class ColaProcessor(DataProcessor):
"""Processor for the CoLA data set (GLUE version)."""
def
get_example_from_tensor_dict
(
self
,
tensor_dict
):
"""See base class."""
return
InputExample
(
tensor_dict
[
'idx'
].
numpy
(),
tensor_dict
[
'sentence'
].
numpy
().
decode
(
'utf-8'
),
None
,
...
...
@@ -278,6 +281,7 @@ class Sst2Processor(DataProcessor):
"""Processor for the SST-2 data set (GLUE version)."""
def
get_example_from_tensor_dict
(
self
,
tensor_dict
):
"""See base class."""
return
InputExample
(
tensor_dict
[
'idx'
].
numpy
(),
tensor_dict
[
'sentence'
].
numpy
().
decode
(
'utf-8'
),
None
,
...
...
@@ -315,6 +319,7 @@ class StsbProcessor(DataProcessor):
"""Processor for the STS-B data set (GLUE version)."""
def
get_example_from_tensor_dict
(
self
,
tensor_dict
):
"""See base class."""
return
InputExample
(
tensor_dict
[
'idx'
].
numpy
(),
tensor_dict
[
'sentence1'
].
numpy
().
decode
(
'utf-8'
),
tensor_dict
[
'sentence2'
].
numpy
().
decode
(
'utf-8'
),
...
...
@@ -353,6 +358,7 @@ class QqpProcessor(DataProcessor):
"""Processor for the QQP data set (GLUE version)."""
def
get_example_from_tensor_dict
(
self
,
tensor_dict
):
"""See base class."""
return
InputExample
(
tensor_dict
[
'idx'
].
numpy
(),
tensor_dict
[
'question1'
].
numpy
().
decode
(
'utf-8'
),
tensor_dict
[
'question2'
].
numpy
().
decode
(
'utf-8'
),
...
...
@@ -394,6 +400,7 @@ class QnliProcessor(DataProcessor):
"""Processor for the QNLI data set (GLUE version)."""
def
get_example_from_tensor_dict
(
self
,
tensor_dict
):
"""See base class."""
return
InputExample
(
tensor_dict
[
'idx'
].
numpy
(),
tensor_dict
[
'question'
].
numpy
().
decode
(
'utf-8'
),
tensor_dict
[
'sentence'
].
numpy
().
decode
(
'utf-8'
),
...
...
@@ -433,6 +440,7 @@ class RteProcessor(DataProcessor):
"""Processor for the RTE data set (GLUE version)."""
def
get_example_from_tensor_dict
(
self
,
tensor_dict
):
"""See base class."""
return
InputExample
(
tensor_dict
[
'idx'
].
numpy
(),
tensor_dict
[
'sentence1'
].
numpy
().
decode
(
'utf-8'
),
tensor_dict
[
'sentence2'
].
numpy
().
decode
(
'utf-8'
),
...
...
@@ -471,6 +479,7 @@ class WnliProcessor(DataProcessor):
"""Processor for the WNLI data set (GLUE version)."""
def
get_example_from_tensor_dict
(
self
,
tensor_dict
):
"""See base class."""
return
InputExample
(
tensor_dict
[
'idx'
].
numpy
(),
tensor_dict
[
'sentence1'
].
numpy
().
decode
(
'utf-8'
),
tensor_dict
[
'sentence2'
].
numpy
().
decode
(
'utf-8'
),
...
...
transformers/data/processors/utils.py
View file @
795b3e76
...
...
@@ -86,6 +86,15 @@ class InputFeatures(object):
class
DataProcessor
(
object
):
"""Base class for data converters for sequence classification data sets."""
def get_example_from_tensor_dict(self, tensor_dict):
    """Get an example from a dict of TensorFlow tensors.

    This base-class version is only a placeholder: it performs no
    conversion and unconditionally raises.

    Args:
        tensor_dict: Keys and values should match the corresponding Glue
            tensorflow_dataset examples.

    Raises:
        NotImplementedError: Always, in this base implementation.
    """
    # Raising the class lets Python instantiate it with no arguments,
    # which is equivalent to raising ``NotImplementedError()``.
    raise NotImplementedError
def get_train_examples(self, data_dir):
    """Get a collection of `InputExample`s for the train set.

    This base-class version is only a placeholder: it ignores its
    argument and unconditionally raises.

    Args:
        data_dir: Not used here; presumably the location of the data set
            files (TODO confirm against concrete processors).

    Raises:
        NotImplementedError: Always, in this base implementation.
    """
    # Raising the class lets Python instantiate it with no arguments,
    # which is equivalent to raising ``NotImplementedError()``.
    raise NotImplementedError
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment