microsoft · StrikerRUS · Jun 5, 2022 · May 30, 2022 · Jun 1, 2022 · jameslamb
@@ -537,7 +537,7 @@ def _data_from_pandas(data, feature_name, categorical_feature, pandas_categorica
         if len(data.shape) != 2 or data.shape[0] < 1:
             raise ValueError('Input data must be 2 dimensional and non empty.')
         if feature_name == 'auto' or feature_name is None:
-            data = data.rename(columns=str)
+            data = data.rename(columns=str, copy=False)
         cat_cols = [col for col, dtype in zip(data.columns, data.dtypes) if isinstance(dtype, pd_CategoricalDtype)]
         cat_cols_not_ordered = [col for col in cat_cols if not data[col].cat.ordered]
         if pandas_categorical is None:  # train dataset

@@ -648,9 +648,7 @@ def test_no_copy_when_single_float_dtype_dataframe(dtype):
     pd = pytest.importorskip('pandas')
     X = np.random.rand(10, 2).astype(dtype)
     df = pd.DataFrame(X)
-    # feature names are required to not make a copy (rename makes a copy)
-    feature_name = ['x1', 'x2']
-    built_data = lgb.basic._data_from_pandas(df, feature_name, None, None)[0]
+    built_data = lgb.basic._data_from_pandas(df, 'auto', None, None)[0]
     assert built_data.dtype == dtype
     assert np.shares_memory(X, built_data)
 
@@ -659,7 +657,7 @@ def test_categorical_code_conversion_doesnt_modify_original_data():
     pd = pytest.importorskip('pandas')
     X = np.random.choice(['a', 'b'], 100).reshape(-1, 1)
     df = pd.DataFrame(X.copy(), columns=['x1'], dtype='category')
-    data = lgb.basic._data_from_pandas(df, ['x1'], None, None)[0]
+    data = lgb.basic._data_from_pandas(df, 'auto', None, None)[0]
     # check that the original data wasn't modified
     np.testing.assert_equal(df['x1'], X[:, 0])
     # check that the built data has the codes