|
@@ -92,8 +92,9 @@ class DataProcess():
|
|
|
|
|
|
|
|
# 去除重复值和填补缺失值
|
|
# 去除重复值和填补缺失值
|
|
|
self._order_data.drop_duplicates(inplace=True)
|
|
self._order_data.drop_duplicates(inplace=True)
|
|
|
- self._order_data[remaining_cols.drop(col_all_missing)].fillna(0, inplace=True)
|
|
|
|
|
- self._order_data = self._order_data.infer_objects(copy=False)
|
|
|
|
|
|
|
+ self._order_data[remaining_cols.drop(col_all_missing)] = self._order_data[remaining_cols.drop(col_all_missing)].fillna(0)
|
|
|
|
|
+ self._order_data = self._order_data.infer_objects(copy=False)
|
|
|
|
|
+
|
|
|
|
|
|
|
|
def _clean_shopping_data(self):
|
|
def _clean_shopping_data(self):
|
|
|
"""处理商圈数据缺省值"""
|
|
"""处理商圈数据缺省值"""
|
|
@@ -122,7 +123,7 @@ class DataProcess():
|
|
|
def _generate_pos_train_data(self):
|
|
def _generate_pos_train_data(self):
|
|
|
pos_data = self._generate_original_train_data(is_pos=True)
|
|
pos_data = self._generate_original_train_data(is_pos=True)
|
|
|
pos_data.dropna(subset=['YLT_TURNOVER_RATE'], inplace=True)
|
|
pos_data.dropna(subset=['YLT_TURNOVER_RATE'], inplace=True)
|
|
|
- pos_data[OrderConfig.POSFEATURES].fillna(0, inplace=True)
|
|
|
|
|
|
|
+ pos_data[OrderConfig.POSFEATURES] = pos_data[OrderConfig.POSFEATURES].fillna(0)
|
|
|
pos_data = pos_data.infer_objects(copy=False)
|
|
pos_data = pos_data.infer_objects(copy=False)
|
|
|
return pos_data
|
|
return pos_data
|
|
|
|
|
|