Unverified Commit bc9d34e4 authored by Nikita Titov's avatar Nikita Titov Committed by GitHub
Browse files

[python] migrate to pathlib in python examples (#4428)

parent 035a6cd5
# coding: utf-8 # coding: utf-8
import json import json
import pickle import pickle
from pathlib import Path
import numpy as np import numpy as np
import pandas as pd import pandas as pd
...@@ -10,10 +11,11 @@ import lightgbm as lgb ...@@ -10,10 +11,11 @@ import lightgbm as lgb
print('Loading data...') print('Loading data...')
# load or create your dataset # load or create your dataset
df_train = pd.read_csv('../binary_classification/binary.train', header=None, sep='\t') binary_example_dir = Path(__file__).absolute().parents[1] / 'binary_classification'
df_test = pd.read_csv('../binary_classification/binary.test', header=None, sep='\t') df_train = pd.read_csv(str(binary_example_dir / 'binary.train'), header=None, sep='\t')
W_train = pd.read_csv('../binary_classification/binary.train.weight', header=None)[0] df_test = pd.read_csv(str(binary_example_dir / 'binary.test'), header=None, sep='\t')
W_test = pd.read_csv('../binary_classification/binary.test.weight', header=None)[0] W_train = pd.read_csv(str(binary_example_dir / 'binary.train.weight'), header=None)[0]
W_test = pd.read_csv(str(binary_example_dir / 'binary.test.weight'), header=None)[0]
y_train = df_train[0] y_train = df_train[0]
y_test = df_test[0] y_test = df_test[0]
......
import os from pathlib import Path
import dask.array as da import dask.array as da
import numpy as np import numpy as np
...@@ -10,10 +10,9 @@ import lightgbm as lgb ...@@ -10,10 +10,9 @@ import lightgbm as lgb
if __name__ == "__main__": if __name__ == "__main__":
print("loading data") print("loading data")
X, y = load_svmlight_file(os.path.join(os.path.dirname(os.path.realpath(__file__)), rank_example_dir = Path(__file__).absolute().parents[2] / 'lambdarank'
'../../lambdarank/rank.train')) X, y = load_svmlight_file(str(rank_example_dir / 'rank.train'))
group = np.loadtxt(os.path.join(os.path.dirname(os.path.realpath(__file__)), group = np.loadtxt(str(rank_example_dir / 'rank.train.query'))
'../../lambdarank/rank.train.query'))
print("initializing a Dask cluster") print("initializing a Dask cluster")
......
from pathlib import Path
import h5py import h5py
import numpy as np import numpy as np
import pandas as pd import pandas as pd
...@@ -97,7 +99,11 @@ def generate_hdf(input_fname, output_basename, batch_size): ...@@ -97,7 +99,11 @@ def generate_hdf(input_fname, output_basename, batch_size):
def main(): def main():
batch_size = 64 batch_size = 64
output_basename = 'regression' output_basename = 'regression'
hdf_files = generate_hdf('../regression/regression.train', output_basename, batch_size) hdf_files = generate_hdf(
str(Path(__file__).absolute().parents[1] / 'regression' / 'regression.train'),
output_basename,
batch_size
)
create_dataset_from_multiple_hdf(hdf_files, batch_size=batch_size) create_dataset_from_multiple_hdf(hdf_files, batch_size=batch_size)
......
...@@ -18,10 +18,12 @@ ...@@ -18,10 +18,12 @@
}, },
"outputs": [], "outputs": [],
"source": [ "source": [
"import pandas as pd\n", "from pathlib import Path\n",
"import lightgbm as lgb\n",
"\n", "\n",
"import matplotlib.pyplot as plt\n", "import matplotlib.pyplot as plt\n",
"import pandas as pd\n",
"\n",
"import lightgbm as lgb\n",
"\n", "\n",
"%matplotlib inline\n", "%matplotlib inline\n",
"\n", "\n",
...@@ -52,8 +54,9 @@ ...@@ -52,8 +54,9 @@
}, },
"outputs": [], "outputs": [],
"source": [ "source": [
"df_train = pd.read_csv('../../regression/regression.train', header=None, sep='\\t')\n", "regression_example_dir = Path().absolute().parents[1] / 'regression'\n",
"df_test = pd.read_csv('../../regression/regression.test', header=None, sep='\\t')\n", "df_train = pd.read_csv(str(regression_example_dir / 'regression.train'), header=None, sep='\\t')\n",
"df_test = pd.read_csv(str(regression_example_dir / 'regression.test'), header=None, sep='\\t')\n",
"\n", "\n",
"y_train = df_train[0]\n", "y_train = df_train[0]\n",
"y_test = df_test[0]\n", "y_test = df_test[0]\n",
......
# coding: utf-8 # coding: utf-8
from pathlib import Path
import pandas as pd import pandas as pd
import lightgbm as lgb import lightgbm as lgb
...@@ -10,8 +12,9 @@ else: ...@@ -10,8 +12,9 @@ else:
print('Loading data...') print('Loading data...')
# load or create your dataset # load or create your dataset
df_train = pd.read_csv('../regression/regression.train', header=None, sep='\t') regression_example_dir = Path(__file__).absolute().parents[1] / 'regression'
df_test = pd.read_csv('../regression/regression.test', header=None, sep='\t') df_train = pd.read_csv(str(regression_example_dir / 'regression.train'), header=None, sep='\t')
df_test = pd.read_csv(str(regression_example_dir / 'regression.test'), header=None, sep='\t')
y_train = df_train[0] y_train = df_train[0]
y_test = df_test[0] y_test = df_test[0]
......
# coding: utf-8 # coding: utf-8
from pathlib import Path
import pandas as pd import pandas as pd
from sklearn.metrics import mean_squared_error from sklearn.metrics import mean_squared_error
...@@ -6,8 +8,9 @@ import lightgbm as lgb ...@@ -6,8 +8,9 @@ import lightgbm as lgb
print('Loading data...') print('Loading data...')
# load or create your dataset # load or create your dataset
df_train = pd.read_csv('../regression/regression.train', header=None, sep='\t') regression_example_dir = Path(__file__).absolute().parents[1] / 'regression'
df_test = pd.read_csv('../regression/regression.test', header=None, sep='\t') df_train = pd.read_csv(str(regression_example_dir / 'regression.train'), header=None, sep='\t')
df_test = pd.read_csv(str(regression_example_dir / 'regression.test'), header=None, sep='\t')
y_train = df_train[0] y_train = df_train[0]
y_test = df_test[0] y_test = df_test[0]
......
# coding: utf-8 # coding: utf-8
from pathlib import Path
import numpy as np import numpy as np
import pandas as pd import pandas as pd
from sklearn.metrics import mean_squared_error from sklearn.metrics import mean_squared_error
...@@ -8,8 +10,9 @@ import lightgbm as lgb ...@@ -8,8 +10,9 @@ import lightgbm as lgb
print('Loading data...') print('Loading data...')
# load or create your dataset # load or create your dataset
df_train = pd.read_csv('../regression/regression.train', header=None, sep='\t') regression_example_dir = Path(__file__).absolute().parents[1] / 'regression'
df_test = pd.read_csv('../regression/regression.test', header=None, sep='\t') df_train = pd.read_csv(str(regression_example_dir / 'regression.train'), header=None, sep='\t')
df_test = pd.read_csv(str(regression_example_dir / 'regression.test'), header=None, sep='\t')
y_train = df_train[0] y_train = df_train[0]
y_test = df_test[0] y_test = df_test[0]
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment