paddlenlp.data.vocab.po 9.49 KB
Newer Older
yuguo-Jack's avatar
yuguo-Jack committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
# Translation catalog for the PaddleNLP documentation page paddlenlp.data.vocab.
# Copyright (C) 2021, PaddleNLP
# This file is distributed under the same license as the PaddleNLP package.
# FIRST AUTHOR <EMAIL@ADDRESS>, 2022.
#
#, fuzzy
msgid ""
msgstr ""
"Project-Id-Version: PaddleNLP \n"
"Report-Msgid-Bugs-To: \n"
"POT-Creation-Date: 2022-03-18 21:31+0800\n"
"PO-Revision-Date: YEAR-MO-DA HO:MI+ZONE\n"
"Last-Translator: FULL NAME <EMAIL@ADDRESS>\n"
"Language-Team: LANGUAGE <LL@li.org>\n"
"MIME-Version: 1.0\n"
"Content-Type: text/plain; charset=utf-8\n"
"Content-Transfer-Encoding: 8bit\n"
"Generated-By: Babel 2.9.0\n"

#: ../source/paddlenlp.data.vocab.rst:2
msgid "vocab"
msgstr ""

#: of paddlenlp.data.vocab.Vocab:1
msgid "基类::class:`object`"
msgstr ""

#: of paddlenlp.data.vocab.Vocab:1
msgid ""
"The class used to convert between tokens and ids. It also includes some "
"store/load functions."
msgstr ""

#: of paddlenlp.data.vocab.Vocab paddlenlp.data.vocab.Vocab.build_vocab
#: paddlenlp.data.vocab.Vocab.from_dict paddlenlp.data.vocab.Vocab.from_json
#: paddlenlp.data.vocab.Vocab.load_vocabulary
#: paddlenlp.data.vocab.Vocab.to_indices paddlenlp.data.vocab.Vocab.to_json
#: paddlenlp.data.vocab.Vocab.to_tokens
msgid "参数"
msgstr ""

#: of paddlenlp.data.vocab.Vocab:4
msgid ""
"A Counter intance describes the tokens and their frequencies. Its keys "
"will be indexed accroding to the order of frequency sorting to construct "
"mapping relationship. If None, `token_to_idx` must be provided as the "
"mapping relationship. Default: None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab:10
msgid "Max size of vocab, not including special tokens. Default: None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab:13 paddlenlp.data.vocab.Vocab.build_vocab:11
msgid "Ignore tokens whose frequencies are less than `min_freq`. Default: 1."
msgstr ""

#: of paddlenlp.data.vocab.Vocab:16 paddlenlp.data.vocab.Vocab.build_vocab:14
msgid ""
"A dict specifies the mapping relationship between tokens and indices to "
"be used. If provided, adjust the tokens and indices mapping according to "
"it. If None, counter must be provided. Default: None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab:21
msgid ""
"Special token for unknow token. If no need, it also could be None. "
"Default: None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab:24
msgid ""
"Special token for padding token. If no need, it also could be None. "
"Default: None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab:27
msgid ""
"Special token for bos token. If no need, it also could be None. Default: "
"None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab:30
msgid ""
"Special token for eos token. If no need, it lso could be None. Default: "
"None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab:33 paddlenlp.data.vocab.Vocab.build_vocab:31
#: paddlenlp.data.vocab.Vocab.from_dict:18
#: paddlenlp.data.vocab.Vocab.load_vocabulary:19
msgid ""
"Keyword arguments ending with `_token`. It can be used to specify further"
" special tokens that will be exposed as attribute of the vocabulary and "
"associated with an index."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.to_tokens:1
msgid "Maps the input indices to token list."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.to_tokens:3
msgid ""
"The input indice(s) for mapping. Must be an `int` or 1D "
"`list[int]`|`tuple[int]`|`numpy.ndarray`."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.build_vocab
#: paddlenlp.data.vocab.Vocab.from_dict paddlenlp.data.vocab.Vocab.from_json
#: paddlenlp.data.vocab.Vocab.load_vocabulary
#: paddlenlp.data.vocab.Vocab.to_indices paddlenlp.data.vocab.Vocab.to_json
#: paddlenlp.data.vocab.Vocab.to_tokens
msgid "返回"
msgstr ""

#: of paddlenlp.data.vocab.Vocab.to_tokens:7
msgid ""
"Obtained token(s). If `indices` is an integer, it will return a str. If "
"`indices` is a list/tuple of integers, it will return a list of str."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.build_vocab
#: paddlenlp.data.vocab.Vocab.from_dict paddlenlp.data.vocab.Vocab.from_json
#: paddlenlp.data.vocab.Vocab.load_vocabulary
#: paddlenlp.data.vocab.Vocab.to_indices paddlenlp.data.vocab.Vocab.to_json
#: paddlenlp.data.vocab.Vocab.to_tokens
msgid "返回类型"
msgstr ""

#: of paddlenlp.data.vocab.Vocab.build_vocab:41
#: paddlenlp.data.vocab.Vocab.from_dict:28
#: paddlenlp.data.vocab.Vocab.from_json:12
#: paddlenlp.data.vocab.Vocab.load_vocabulary:28
#: paddlenlp.data.vocab.Vocab.to_indices:13
#: paddlenlp.data.vocab.Vocab.to_json:14
#: paddlenlp.data.vocab.Vocab.to_tokens:13
msgid "示例"
msgstr ""

#: of paddlenlp.data.vocab.Vocab.to_indices:1
msgid "Maps the input tokens into indices."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.to_indices:3
msgid "The input token(s) for mapping."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.to_indices:7
msgid ""
"Obationed indice(s). If `tokens` is a str, it will return an integer. If "
"`tokens` is a list/tuple of str, it will return a list of integers."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.__call__:1
msgid ""
"Maps the input tokens into indices. Its function is the same as the "
":meth:`to_indices` method."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.__call__:4
msgid "See detail at `to_indices`."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.to_json:1
msgid ""
"Summarizes some information of vocab as JSON string. If path is gaven, "
"the JSON string will be saved into files. The JSON string and the saved "
"file all can be used to reconstruct the :class:`Vocab` by calling "
":meth:`from_json` method."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.to_json:6
msgid ""
"The path to save JSON string. If None, the JSON will not be saved. "
"Default: None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.to_json:10
msgid "The JSON string including information of vocab."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.from_json:1
msgid ""
"Loads :class:`Vocab` from JSON string or JSON file, which is gotten by "
"calling :meth:`to_json` method."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.from_json:4
msgid "JSON string or file path of JSON string."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.from_json:7
msgid ""
"An instance of :class:`Vocab` generated from information contained in "
"JSON string."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.from_dict:1
msgid "Builds the :class:`Vocab` from a dict."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.from_dict:3
msgid "A dict describes the mapping relationship between tokens and indices."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.from_dict:6
msgid ""
"The special token for unknow token. If no need, it also could be None. "
"Default: None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.from_dict:9
msgid ""
"The special token for padding token. If no need, it also could be None. "
"Default: None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.from_dict:12
msgid ""
"The special token for bos token. If no need, it also could be None. "
"Default: None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.from_dict:15
msgid ""
"The special token for eos token. If no need, it also could be None. "
"Default: None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.from_dict:23
msgid ""
"An instance of :class:`Vocab` generated from the given dict and special "
"tokens."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.build_vocab:1
msgid ""
"Builds the :class:`Vocab` accoring to given iterator and other "
"information. Firstly, iterate over the `iterator` to construct a "
":class:`collections.Counter` and used to init the as  :class:`Vocab`."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.build_vocab:5
msgid ""
"Iterator of tokens. Each element should be a list of tokens if wordlevel "
"vocab is needed."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.build_vocab:8
msgid "The max size of vocab, not including special tokens. Default: None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.build_vocab:19
msgid ""
"The special token for unknow token '<unk>'. If no need, it also could be "
"None. Default: None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.build_vocab:22
msgid ""
"The special token for padding token '<pad>'. If no need, it also could be"
" None. Default: None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.build_vocab:25
msgid ""
"The special token for bos token '<bos>'. If no need, it also could be "
"None. Default: None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.build_vocab:28
msgid ""
"The special token for eos token '<eos>'. If no need, it also could be "
"None. Default: None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.build_vocab:36
msgid ""
"An instance of :class:`Vocab` generated from given iterator and other "
"informations."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.load_vocabulary:1
msgid ""
"Builds the :class:`Vocab` from a file reserving all tokens by calling "
":meth:`Vocab.from_dict` method. The file contains a token per line, and "
"the line index would be the index of corresponding token."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.load_vocabulary:5
msgid "the path of file to construct vocabulary."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.load_vocabulary:7
msgid ""
"special token for unknown token. If no need, it also could be None. "
"Default: None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.load_vocabulary:10
msgid ""
"special token for padding token. If no need, it also could be None. "
"Default: None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.load_vocabulary:13
msgid ""
"special token for bos token. If no need, it also could be None. Default: "
"None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.load_vocabulary:16
msgid ""
"special token for eos token. If no need, it also could be None. Default: "
"None."
msgstr ""

#: of paddlenlp.data.vocab.Vocab.load_vocabulary:24
msgid "An instance of :class:`Vocab` generated from the given file."
msgstr ""