Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
tianlh
LightGBM-DCU
Commits
5af7eb7a
Unverified
Commit
5af7eb7a
authored
Jun 15, 2021
by
Frank Fineis
Committed by
GitHub
Jun 15, 2021
Browse files
[dask] Dask Vector types for group, init_score, sample_weights (fixes #4375) (#4380)
parent
9d9e9b87
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
26 additions
and
25 deletions
+26
-25
python-package/lightgbm/dask.py
python-package/lightgbm/dask.py
+26
-25
No files found.
python-package/lightgbm/dask.py
View file @
5af7eb7a
...
@@ -22,6 +22,7 @@ from .sklearn import LGBMClassifier, LGBMModel, LGBMRanker, LGBMRegressor, _lgbm
...
@@ -22,6 +22,7 @@ from .sklearn import LGBMClassifier, LGBMModel, LGBMRanker, LGBMRegressor, _lgbm
_DaskCollection
=
Union
[
dask_Array
,
dask_DataFrame
,
dask_Series
]
_DaskCollection
=
Union
[
dask_Array
,
dask_DataFrame
,
dask_Series
]
_DaskMatrixLike
=
Union
[
dask_Array
,
dask_DataFrame
]
_DaskMatrixLike
=
Union
[
dask_Array
,
dask_DataFrame
]
_DaskVectorLike
=
Union
[
dask_Array
,
dask_Series
]
_DaskPart
=
Union
[
np
.
ndarray
,
pd_DataFrame
,
pd_Series
,
ss
.
spmatrix
]
_DaskPart
=
Union
[
np
.
ndarray
,
pd_DataFrame
,
pd_Series
,
ss
.
spmatrix
]
_PredictionDtype
=
Union
[
Type
[
np
.
float32
],
Type
[
np
.
float64
],
Type
[
np
.
int32
],
Type
[
np
.
int64
]]
_PredictionDtype
=
Union
[
Type
[
np
.
float32
],
Type
[
np
.
float64
],
Type
[
np
.
int32
],
Type
[
np
.
int64
]]
...
@@ -214,9 +215,9 @@ def _train(
...
@@ -214,9 +215,9 @@ def _train(
label
:
_DaskCollection
,
label
:
_DaskCollection
,
params
:
Dict
[
str
,
Any
],
params
:
Dict
[
str
,
Any
],
model_factory
:
Type
[
LGBMModel
],
model_factory
:
Type
[
LGBMModel
],
sample_weight
:
Optional
[
_Dask
Collection
]
=
None
,
sample_weight
:
Optional
[
_Dask
VectorLike
]
=
None
,
init_score
:
Optional
[
_Dask
Collection
]
=
None
,
init_score
:
Optional
[
_Dask
VectorLike
]
=
None
,
group
:
Optional
[
_Dask
Collection
]
=
None
,
group
:
Optional
[
_Dask
VectorLike
]
=
None
,
**
kwargs
:
Any
**
kwargs
:
Any
)
->
LGBMModel
:
)
->
LGBMModel
:
"""Inner train routine.
"""Inner train routine.
...
@@ -233,11 +234,11 @@ def _train(
...
@@ -233,11 +234,11 @@ def _train(
Parameters passed to constructor of the local underlying model.
Parameters passed to constructor of the local underlying model.
model_factory : lightgbm.LGBMClassifier, lightgbm.LGBMRegressor, or lightgbm.LGBMRanker class
model_factory : lightgbm.LGBMClassifier, lightgbm.LGBMRegressor, or lightgbm.LGBMRanker class
Class of the local underlying model.
Class of the local underlying model.
sample_weight : Dask Array
, Dask DataFrame,
Dask Series of shape = [n_samples] or None, optional (default=None)
sample_weight : Dask Array
or
Dask Series of shape = [n_samples] or None, optional (default=None)
Weights of training data.
Weights of training data.
init_score : Dask Array
, Dask DataFrame,
Dask Series of shape = [n_samples] or None, optional (default=None)
init_score : Dask Array
or
Dask Series of shape = [n_samples] or None, optional (default=None)
Init score of training data.
Init score of training data.
group : Dask Array
, Dask DataFrame, Dask Series of shape = [n_samples]
or None, optional (default=None)
group : Dask Array
or Dask Series
or None, optional (default=None)
Group/query data.
Group/query data.
Only used in the learning-to-rank task.
Only used in the learning-to-rank task.
sum(group) = n_samples.
sum(group) = n_samples.
...
@@ -603,9 +604,9 @@ class _DaskLGBMModel:
...
@@ -603,9 +604,9 @@ class _DaskLGBMModel:
model_factory
:
Type
[
LGBMModel
],
model_factory
:
Type
[
LGBMModel
],
X
:
_DaskMatrixLike
,
X
:
_DaskMatrixLike
,
y
:
_DaskCollection
,
y
:
_DaskCollection
,
sample_weight
:
Optional
[
_Dask
Collection
]
=
None
,
sample_weight
:
Optional
[
_Dask
VectorLike
]
=
None
,
init_score
:
Optional
[
_Dask
Collection
]
=
None
,
init_score
:
Optional
[
_Dask
VectorLike
]
=
None
,
group
:
Optional
[
_Dask
Collection
]
=
None
,
group
:
Optional
[
_Dask
VectorLike
]
=
None
,
**
kwargs
:
Any
**
kwargs
:
Any
)
->
"_DaskLGBMModel"
:
)
->
"_DaskLGBMModel"
:
if
not
all
((
DASK_INSTALLED
,
PANDAS_INSTALLED
,
SKLEARN_INSTALLED
)):
if
not
all
((
DASK_INSTALLED
,
PANDAS_INSTALLED
,
SKLEARN_INSTALLED
)):
...
@@ -721,8 +722,8 @@ class DaskLGBMClassifier(LGBMClassifier, _DaskLGBMModel):
...
@@ -721,8 +722,8 @@ class DaskLGBMClassifier(LGBMClassifier, _DaskLGBMModel):
self
,
self
,
X
:
_DaskMatrixLike
,
X
:
_DaskMatrixLike
,
y
:
_DaskCollection
,
y
:
_DaskCollection
,
sample_weight
:
Optional
[
_Dask
Collection
]
=
None
,
sample_weight
:
Optional
[
_Dask
VectorLike
]
=
None
,
init_score
:
Optional
[
_Dask
Collection
]
=
None
,
init_score
:
Optional
[
_Dask
VectorLike
]
=
None
,
**
kwargs
:
Any
**
kwargs
:
Any
)
->
"DaskLGBMClassifier"
:
)
->
"DaskLGBMClassifier"
:
"""Docstring is inherited from the lightgbm.LGBMClassifier.fit."""
"""Docstring is inherited from the lightgbm.LGBMClassifier.fit."""
...
@@ -738,9 +739,9 @@ class DaskLGBMClassifier(LGBMClassifier, _DaskLGBMModel):
...
@@ -738,9 +739,9 @@ class DaskLGBMClassifier(LGBMClassifier, _DaskLGBMModel):
_base_doc
=
_lgbmmodel_doc_fit
.
format
(
_base_doc
=
_lgbmmodel_doc_fit
.
format
(
X_shape
=
"Dask Array or Dask DataFrame of shape = [n_samples, n_features]"
,
X_shape
=
"Dask Array or Dask DataFrame of shape = [n_samples, n_features]"
,
y_shape
=
"Dask Array, Dask DataFrame or Dask Series of shape = [n_samples]"
,
y_shape
=
"Dask Array, Dask DataFrame or Dask Series of shape = [n_samples]"
,
sample_weight_shape
=
"Dask Array
, Dask DataFrame,
Dask Series of shape = [n_samples] or None, optional (default=None)"
,
sample_weight_shape
=
"Dask Array
or
Dask Series of shape = [n_samples] or None, optional (default=None)"
,
init_score_shape
=
"Dask Array
, Dask DataFrame,
Dask Series of shape = [n_samples] or None, optional (default=None)"
,
init_score_shape
=
"Dask Array
or
Dask Series of shape = [n_samples] or None, optional (default=None)"
,
group_shape
=
"Dask Array
, Dask DataFrame, Dask Series of shape = [n_samples]
or None, optional (default=None)"
group_shape
=
"Dask Array
or Dask Series
or None, optional (default=None)"
)
)
# DaskLGBMClassifier does not support evaluation data, or early stopping
# DaskLGBMClassifier does not support evaluation data, or early stopping
...
@@ -871,8 +872,8 @@ class DaskLGBMRegressor(LGBMRegressor, _DaskLGBMModel):
...
@@ -871,8 +872,8 @@ class DaskLGBMRegressor(LGBMRegressor, _DaskLGBMModel):
self
,
self
,
X
:
_DaskMatrixLike
,
X
:
_DaskMatrixLike
,
y
:
_DaskCollection
,
y
:
_DaskCollection
,
sample_weight
:
Optional
[
_Dask
Collection
]
=
None
,
sample_weight
:
Optional
[
_Dask
VectorLike
]
=
None
,
init_score
:
Optional
[
_Dask
Collection
]
=
None
,
init_score
:
Optional
[
_Dask
VectorLike
]
=
None
,
**
kwargs
:
Any
**
kwargs
:
Any
)
->
"DaskLGBMRegressor"
:
)
->
"DaskLGBMRegressor"
:
"""Docstring is inherited from the lightgbm.LGBMRegressor.fit."""
"""Docstring is inherited from the lightgbm.LGBMRegressor.fit."""
...
@@ -888,9 +889,9 @@ class DaskLGBMRegressor(LGBMRegressor, _DaskLGBMModel):
...
@@ -888,9 +889,9 @@ class DaskLGBMRegressor(LGBMRegressor, _DaskLGBMModel):
_base_doc
=
_lgbmmodel_doc_fit
.
format
(
_base_doc
=
_lgbmmodel_doc_fit
.
format
(
X_shape
=
"Dask Array or Dask DataFrame of shape = [n_samples, n_features]"
,
X_shape
=
"Dask Array or Dask DataFrame of shape = [n_samples, n_features]"
,
y_shape
=
"Dask Array, Dask DataFrame or Dask Series of shape = [n_samples]"
,
y_shape
=
"Dask Array, Dask DataFrame or Dask Series of shape = [n_samples]"
,
sample_weight_shape
=
"Dask Array
, Dask DataFrame,
Dask Series of shape = [n_samples] or None, optional (default=None)"
,
sample_weight_shape
=
"Dask Array
or
Dask Series of shape = [n_samples] or None, optional (default=None)"
,
init_score_shape
=
"Dask Array
, Dask DataFrame,
Dask Series of shape = [n_samples] or None, optional (default=None)"
,
init_score_shape
=
"Dask Array
or
Dask Series of shape = [n_samples] or None, optional (default=None)"
,
group_shape
=
"Dask Array
, Dask DataFrame, Dask Series of shape = [n_samples]
or None, optional (default=None)"
group_shape
=
"Dask Array
or Dask Series
or None, optional (default=None)"
)
)
# DaskLGBMRegressor does not support evaluation data, or early stopping
# DaskLGBMRegressor does not support evaluation data, or early stopping
...
@@ -1003,9 +1004,9 @@ class DaskLGBMRanker(LGBMRanker, _DaskLGBMModel):
...
@@ -1003,9 +1004,9 @@ class DaskLGBMRanker(LGBMRanker, _DaskLGBMModel):
self
,
self
,
X
:
_DaskMatrixLike
,
X
:
_DaskMatrixLike
,
y
:
_DaskCollection
,
y
:
_DaskCollection
,
sample_weight
:
Optional
[
_Dask
Collection
]
=
None
,
sample_weight
:
Optional
[
_Dask
VectorLike
]
=
None
,
init_score
:
Optional
[
_Dask
Collection
]
=
None
,
init_score
:
Optional
[
_Dask
VectorLike
]
=
None
,
group
:
Optional
[
_Dask
Collection
]
=
None
,
group
:
Optional
[
_Dask
VectorLike
]
=
None
,
**
kwargs
:
Any
**
kwargs
:
Any
)
->
"DaskLGBMRanker"
:
)
->
"DaskLGBMRanker"
:
"""Docstring is inherited from the lightgbm.LGBMRanker.fit."""
"""Docstring is inherited from the lightgbm.LGBMRanker.fit."""
...
@@ -1022,9 +1023,9 @@ class DaskLGBMRanker(LGBMRanker, _DaskLGBMModel):
...
@@ -1022,9 +1023,9 @@ class DaskLGBMRanker(LGBMRanker, _DaskLGBMModel):
_base_doc
=
_lgbmmodel_doc_fit
.
format
(
_base_doc
=
_lgbmmodel_doc_fit
.
format
(
X_shape
=
"Dask Array or Dask DataFrame of shape = [n_samples, n_features]"
,
X_shape
=
"Dask Array or Dask DataFrame of shape = [n_samples, n_features]"
,
y_shape
=
"Dask Array, Dask DataFrame or Dask Series of shape = [n_samples]"
,
y_shape
=
"Dask Array, Dask DataFrame or Dask Series of shape = [n_samples]"
,
sample_weight_shape
=
"Dask Array
, Dask DataFrame,
Dask Series of shape = [n_samples] or None, optional (default=None)"
,
sample_weight_shape
=
"Dask Array
or
Dask Series of shape = [n_samples] or None, optional (default=None)"
,
init_score_shape
=
"Dask Array
, Dask DataFrame,
Dask Series of shape = [n_samples] or None, optional (default=None)"
,
init_score_shape
=
"Dask Array
or
Dask Series of shape = [n_samples] or None, optional (default=None)"
,
group_shape
=
"Dask Array
, Dask DataFrame, Dask Series of shape = [n_samples]
or None, optional (default=None)"
group_shape
=
"Dask Array
or Dask Series
or None, optional (default=None)"
)
)
# DaskLGBMRanker does not support evaluation data, or early stopping
# DaskLGBMRanker does not support evaluation data, or early stopping
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment