Skip to content

Commit a23b6fa

Browse files
remove unneeded code and dependencies
1 parent 399d9eb commit a23b6fa

File tree

5 files changed

+4
-29
lines changed

5 files changed

+4
-29
lines changed

envs/conda-env-rapids.yml

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -10,8 +10,7 @@ dependencies:
1010
# sklbench dependencies
1111
- scikit-learn
1212
- pandas
13-
- tabulate
14-
- fastparquet
13+
- pyarrow
1514
- h5py
1615
- openpyxl
1716
- tqdm

envs/conda-env-sklearn.yml

Lines changed: 1 addition & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -6,14 +6,11 @@ dependencies:
66
- xgboost
77
- catboost
88
- lightgbm
9-
- faiss-cpu
10-
- modin-all
119
- scikit-learn-intelex
1210
# sklbench dependencies
1311
- scikit-learn
1412
- pandas
15-
- tabulate
16-
- fastparquet
13+
- pyarrow
1714
- h5py
1815
- openpyxl
1916
- tqdm

envs/requirements-sklearn.txt

Lines changed: 1 addition & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -2,16 +2,13 @@
22
xgboost
33
catboost
44
lightgbm
5-
faiss-cpu
6-
modin[all]
75
scikit-learn-intelex
86
dpctl
97
dpnp
108
# sklbench dependencies
119
scikit-learn
1210
pandas
13-
tabulate
14-
fastparquet
11+
pyarrow
1512
h5py
1613
openpyxl
1714
tqdm

sklbench/datasets/common.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -101,7 +101,7 @@ def save_data_to_cache(data: Dict, data_cache: str, data_name: str):
101101
for column in list(data_compoment.columns)
102102
]
103103
data_compoment.to_parquet(
104-
component_filepath, engine="fastparquet", compression="snappy"
104+
component_filepath
105105
)
106106
elif isinstance(data_compoment, csr_matrix):
107107
component_filepath += ".csr.npz"

sklbench/datasets/transformer.py

Lines changed: 0 additions & 18 deletions
Original file line numberDiff line numberDiff line change
@@ -57,24 +57,6 @@ def convert_data(data, dformat: str, order: str, dtype: str, device: str = None)
5757
import dpctl.tensor
5858

5959
return dpctl.tensor.asarray(data, dtype=dtype, order=order, device=device)
60-
elif dformat.startswith("modin"):
61-
if dformat.endswith("ray"):
62-
os.environ["MODIN_ENGINE"] = "ray"
63-
elif dformat.endswith("dask"):
64-
os.environ["MODIN_ENGINE"] = "dask"
65-
elif dformat.endswith("unidist"):
66-
os.environ["MODIN_ENGINE"] = "unidist"
67-
os.environ["UNIDIST_BACKEND"] = "mpi"
68-
else:
69-
logger.info(
70-
"Modin engine is unknown or not specified. Default engine will be used."
71-
)
72-
73-
import modin.pandas as modin_pd
74-
75-
if data.ndim == 1:
76-
return modin_pd.Series(data)
77-
return modin_pd.DataFrame(data)
7860
elif dformat == "cudf":
7961
import cudf
8062

0 commit comments

Comments
 (0)