Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
tianlh
LightGBM-DCU
Commits
bc9d34e4
Unverified
Commit
bc9d34e4
authored
Jul 04, 2021
by
Nikita Titov
Committed by
GitHub
Jul 04, 2021
Browse files
[python] migrate to pathlib in python examples (#4428)
parent
035a6cd5
Changes
7
Hide whitespace changes
Inline
Side-by-side
Showing
7 changed files
with
39 additions
and
20 deletions
+39
-20
examples/python-guide/advanced_example.py
examples/python-guide/advanced_example.py
+6
-4
examples/python-guide/dask/ranking.py
examples/python-guide/dask/ranking.py
+4
-5
examples/python-guide/dataset_from_multi_hdf5.py
examples/python-guide/dataset_from_multi_hdf5.py
+7
-1
examples/python-guide/notebooks/interactive_plot_example.ipynb
...les/python-guide/notebooks/interactive_plot_example.ipynb
+7
-4
examples/python-guide/plot_example.py
examples/python-guide/plot_example.py
+5
-2
examples/python-guide/simple_example.py
examples/python-guide/simple_example.py
+5
-2
examples/python-guide/sklearn_example.py
examples/python-guide/sklearn_example.py
+5
-2
No files found.
examples/python-guide/advanced_example.py
View file @
bc9d34e4
# coding: utf-8
# coding: utf-8
import
json
import
json
import
pickle
import
pickle
from
pathlib
import
Path
import
numpy
as
np
import
numpy
as
np
import
pandas
as
pd
import
pandas
as
pd
...
@@ -10,10 +11,11 @@ import lightgbm as lgb
...
@@ -10,10 +11,11 @@ import lightgbm as lgb
print
(
'Loading data...'
)
print
(
'Loading data...'
)
# load or create your dataset
# load or create your dataset
df_train
=
pd
.
read_csv
(
'../binary_classification/binary.train'
,
header
=
None
,
sep
=
'
\t
'
)
binary_example_dir
=
Path
(
__file__
).
absolute
().
parents
[
1
]
/
'binary_classification'
df_test
=
pd
.
read_csv
(
'../binary_classification/binary.test'
,
header
=
None
,
sep
=
'
\t
'
)
df_train
=
pd
.
read_csv
(
str
(
binary_example_dir
/
'binary.train'
),
header
=
None
,
sep
=
'
\t
'
)
W_train
=
pd
.
read_csv
(
'../binary_classification/binary.train.weight'
,
header
=
None
)[
0
]
df_test
=
pd
.
read_csv
(
str
(
binary_example_dir
/
'binary.test'
),
header
=
None
,
sep
=
'
\t
'
)
W_test
=
pd
.
read_csv
(
'../binary_classification/binary.test.weight'
,
header
=
None
)[
0
]
W_train
=
pd
.
read_csv
(
str
(
binary_example_dir
/
'binary.train.weight'
),
header
=
None
)[
0
]
W_test
=
pd
.
read_csv
(
str
(
binary_example_dir
/
'binary.test.weight'
),
header
=
None
)[
0
]
y_train
=
df_train
[
0
]
y_train
=
df_train
[
0
]
y_test
=
df_test
[
0
]
y_test
=
df_test
[
0
]
...
...
examples/python-guide/dask/ranking.py
View file @
bc9d34e4
import
os
from
pathlib
import
Path
import
dask.array
as
da
import
dask.array
as
da
import
numpy
as
np
import
numpy
as
np
...
@@ -10,10 +10,9 @@ import lightgbm as lgb
...
@@ -10,10 +10,9 @@ import lightgbm as lgb
if
__name__
==
"__main__"
:
if
__name__
==
"__main__"
:
print
(
"loading data"
)
print
(
"loading data"
)
X
,
y
=
load_svmlight_file
(
os
.
path
.
join
(
os
.
path
.
dirname
(
os
.
path
.
realpath
(
__file__
)),
rank_example_dir
=
Path
(
__file__
).
absolute
().
parents
[
2
]
/
'lambdarank'
'../../lambdarank/rank.train'
))
X
,
y
=
load_svmlight_file
(
str
(
rank_example_dir
/
'rank.train'
))
group
=
np
.
loadtxt
(
os
.
path
.
join
(
os
.
path
.
dirname
(
os
.
path
.
realpath
(
__file__
)),
group
=
np
.
loadtxt
(
str
(
rank_example_dir
/
'rank.train.query'
))
'../../lambdarank/rank.train.query'
))
print
(
"initializing a Dask cluster"
)
print
(
"initializing a Dask cluster"
)
...
...
examples/python-guide/dataset_from_multi_hdf5.py
View file @
bc9d34e4
from
pathlib
import
Path
import
h5py
import
h5py
import
numpy
as
np
import
numpy
as
np
import
pandas
as
pd
import
pandas
as
pd
...
@@ -97,7 +99,11 @@ def generate_hdf(input_fname, output_basename, batch_size):
...
@@ -97,7 +99,11 @@ def generate_hdf(input_fname, output_basename, batch_size):
def
main
():
def
main
():
batch_size
=
64
batch_size
=
64
output_basename
=
'regression'
output_basename
=
'regression'
hdf_files
=
generate_hdf
(
'../regression/regression.train'
,
output_basename
,
batch_size
)
hdf_files
=
generate_hdf
(
str
(
Path
(
__file__
).
absolute
().
parents
[
1
]
/
'regression'
/
'regression.train'
),
output_basename
,
batch_size
)
create_dataset_from_multiple_hdf
(
hdf_files
,
batch_size
=
batch_size
)
create_dataset_from_multiple_hdf
(
hdf_files
,
batch_size
=
batch_size
)
...
...
examples/python-guide/notebooks/interactive_plot_example.ipynb
View file @
bc9d34e4
...
@@ -18,10 +18,12 @@
...
@@ -18,10 +18,12 @@
},
},
"outputs": [],
"outputs": [],
"source": [
"source": [
"import pandas as pd\n",
"from pathlib import Path\n",
"import lightgbm as lgb\n",
"\n",
"\n",
"import matplotlib.pyplot as plt\n",
"import matplotlib.pyplot as plt\n",
"import pandas as pd\n",
"\n",
"import lightgbm as lgb\n",
"\n",
"\n",
"%matplotlib inline\n",
"%matplotlib inline\n",
"\n",
"\n",
...
@@ -52,8 +54,9 @@
...
@@ -52,8 +54,9 @@
},
},
"outputs": [],
"outputs": [],
"source": [
"source": [
"df_train = pd.read_csv('../../regression/regression.train', header=None, sep='\\t')\n",
"regression_example_dir = Path().absolute().parents[1] / 'regression'\n",
"df_test = pd.read_csv('../../regression/regression.test', header=None, sep='\\t')\n",
"df_train = pd.read_csv(str(regression_example_dir / 'regression.train'), header=None, sep='\\t')\n",
"df_test = pd.read_csv(str(regression_example_dir / 'regression.test'), header=None, sep='\\t')\n",
"\n",
"\n",
"y_train = df_train[0]\n",
"y_train = df_train[0]\n",
"y_test = df_test[0]\n",
"y_test = df_test[0]\n",
...
...
examples/python-guide/plot_example.py
View file @
bc9d34e4
# coding: utf-8
# coding: utf-8
from
pathlib
import
Path
import
pandas
as
pd
import
pandas
as
pd
import
lightgbm
as
lgb
import
lightgbm
as
lgb
...
@@ -10,8 +12,9 @@ else:
...
@@ -10,8 +12,9 @@ else:
print
(
'Loading data...'
)
print
(
'Loading data...'
)
# load or create your dataset
# load or create your dataset
df_train
=
pd
.
read_csv
(
'../regression/regression.train'
,
header
=
None
,
sep
=
'
\t
'
)
regression_example_dir
=
Path
(
__file__
).
absolute
().
parents
[
1
]
/
'regression'
df_test
=
pd
.
read_csv
(
'../regression/regression.test'
,
header
=
None
,
sep
=
'
\t
'
)
df_train
=
pd
.
read_csv
(
str
(
regression_example_dir
/
'regression.train'
),
header
=
None
,
sep
=
'
\t
'
)
df_test
=
pd
.
read_csv
(
str
(
regression_example_dir
/
'regression.test'
),
header
=
None
,
sep
=
'
\t
'
)
y_train
=
df_train
[
0
]
y_train
=
df_train
[
0
]
y_test
=
df_test
[
0
]
y_test
=
df_test
[
0
]
...
...
examples/python-guide/simple_example.py
View file @
bc9d34e4
# coding: utf-8
# coding: utf-8
from
pathlib
import
Path
import
pandas
as
pd
import
pandas
as
pd
from
sklearn.metrics
import
mean_squared_error
from
sklearn.metrics
import
mean_squared_error
...
@@ -6,8 +8,9 @@ import lightgbm as lgb
...
@@ -6,8 +8,9 @@ import lightgbm as lgb
print
(
'Loading data...'
)
print
(
'Loading data...'
)
# load or create your dataset
# load or create your dataset
df_train
=
pd
.
read_csv
(
'../regression/regression.train'
,
header
=
None
,
sep
=
'
\t
'
)
regression_example_dir
=
Path
(
__file__
).
absolute
().
parents
[
1
]
/
'regression'
df_test
=
pd
.
read_csv
(
'../regression/regression.test'
,
header
=
None
,
sep
=
'
\t
'
)
df_train
=
pd
.
read_csv
(
str
(
regression_example_dir
/
'regression.train'
),
header
=
None
,
sep
=
'
\t
'
)
df_test
=
pd
.
read_csv
(
str
(
regression_example_dir
/
'regression.test'
),
header
=
None
,
sep
=
'
\t
'
)
y_train
=
df_train
[
0
]
y_train
=
df_train
[
0
]
y_test
=
df_test
[
0
]
y_test
=
df_test
[
0
]
...
...
examples/python-guide/sklearn_example.py
View file @
bc9d34e4
# coding: utf-8
# coding: utf-8
from
pathlib
import
Path
import
numpy
as
np
import
numpy
as
np
import
pandas
as
pd
import
pandas
as
pd
from
sklearn.metrics
import
mean_squared_error
from
sklearn.metrics
import
mean_squared_error
...
@@ -8,8 +10,9 @@ import lightgbm as lgb
...
@@ -8,8 +10,9 @@ import lightgbm as lgb
print
(
'Loading data...'
)
print
(
'Loading data...'
)
# load or create your dataset
# load or create your dataset
df_train
=
pd
.
read_csv
(
'../regression/regression.train'
,
header
=
None
,
sep
=
'
\t
'
)
regression_example_dir
=
Path
(
__file__
).
absolute
().
parents
[
1
]
/
'regression'
df_test
=
pd
.
read_csv
(
'../regression/regression.test'
,
header
=
None
,
sep
=
'
\t
'
)
df_train
=
pd
.
read_csv
(
str
(
regression_example_dir
/
'regression.train'
),
header
=
None
,
sep
=
'
\t
'
)
df_test
=
pd
.
read_csv
(
str
(
regression_example_dir
/
'regression.test'
),
header
=
None
,
sep
=
'
\t
'
)
y_train
=
df_train
[
0
]
y_train
=
df_train
[
0
]
y_test
=
df_test
[
0
]
y_test
=
df_test
[
0
]
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment