|
@@ -24,9 +24,9 @@ class CustConfig:
|
|
|
]
|
|
]
|
|
|
# 数据清洗规则
|
|
# 数据清洗规则
|
|
|
CLEANING_RULES = {
|
|
CLEANING_RULES = {
|
|
|
- "BB_RTL_CUST_POSITION_TYPE_NAME": {"method": "fillna", "opt": "fill", "value": "其它", "type": "str"},
|
|
|
|
|
- "BB_RTL_CUST_MARKET_TYPE_NAME": {"method": "fillna", "opt": "fill", "value": "其它", "type": "str"},
|
|
|
|
|
- "BB_RTL_CUST_SUB_BUSI_PLACE_NAME": {"method": "fillna", "opt": "fill", "value": "其它", "type": "str"},
|
|
|
|
|
|
|
+ "BB_RTL_CUST_POSITION_TYPE_NAME": {"method": "fillna", "opt": "fill", "value": "其他", "type": "str"},
|
|
|
|
|
+ "BB_RTL_CUST_SUB_BUSI_PLACE_NAME": {"method": "fillna", "opt": "fill", "value": "其他", "type": "str"},
|
|
|
|
|
+ "BB_RTL_CUST_GRADE_NAME": {"method": "fillna", "opt": "fill", "value": "其他", "type": "str"},
|
|
|
# "BB_RTL_CUST_TERMINALEVEL_NAME": {"method": "fillna", "opt": "replace", "value": "BB_RTL_CUST_TERMINAL_LEVEL_NAME", "type": "str"},
|
|
# "BB_RTL_CUST_TERMINALEVEL_NAME": {"method": "fillna", "opt": "replace", "value": "BB_RTL_CUST_TERMINAL_LEVEL_NAME", "type": "str"},
|
|
|
# "MD04_MG_RTL_CUST_CREDITCLASS_NAME": {"method": "fillna", "opt": "fill", "value": "未评价", "type": "str"},
|
|
# "MD04_MG_RTL_CUST_CREDITCLASS_NAME": {"method": "fillna", "opt": "fill", "value": "未评价", "type": "str"},
|
|
|
# "MD04_MG_SAMPLE_CUST_FLAG": {"method": "fillna", "value": "N", "opt": "fill"},
|
|
# "MD04_MG_SAMPLE_CUST_FLAG": {"method": "fillna", "value": "N", "opt": "fill"},
|
|
@@ -40,7 +40,15 @@ class CustConfig:
|
|
|
"OPERATOR_EDU_LEVEL": {"method": "fillna", "opt": "fill", "value": "00", "type": "str"},
|
|
"OPERATOR_EDU_LEVEL": {"method": "fillna", "opt": "fill", "value": "00", "type": "str"},
|
|
|
}
|
|
}
|
|
|
# one-hot编码
|
|
# one-hot编码
|
|
|
-
|
|
|
|
|
|
|
+ ONEHOT = [
|
|
|
|
|
+ "BB_RTL_CUST_POSITION_TYPE_NAME",
|
|
|
|
|
+ "BB_RTL_CUST_MARKET_TYPE_NAME",
|
|
|
|
|
+ "BB_RTL_CUST_SUB_BUSI_PLACE_NAME",
|
|
|
|
|
+ "BB_RTL_CUST_GRADE_NAME",
|
|
|
|
|
+ "BB_RTL_CUST_CHAIN_FLAG",
|
|
|
|
|
+ "MD04_DIR_SAL_STORE_FLAG",
|
|
|
|
|
+ "OPERATOR_EDU_LEVEL",
|
|
|
|
|
+ ]
|
|
|
|
|
|
|
|
class ProductConfig:
|
|
class ProductConfig:
|
|
|
FEATURE_COLUMNS = [
|
|
FEATURE_COLUMNS = [
|
|
@@ -106,4 +114,27 @@ class ProductConfig:
|
|
|
"product_style_code_name": {"method": "fillna", "opt": "fill", "type": "str", "value": "其他"},
|
|
"product_style_code_name": {"method": "fillna", "opt": "fill", "type": "str", "value": "其他"},
|
|
|
"chinese_mix": {"method": "fillna", "opt": "fill", "type": "str", "value": "否"},
|
|
"chinese_mix": {"method": "fillna", "opt": "fill", "type": "str", "value": "否"},
|
|
|
"sub_price_type_name": {"method": "fillna", "opt": "fill", "type": "str", "value": "其他"},
|
|
"sub_price_type_name": {"method": "fillna", "opt": "fill", "type": "str", "value": "其他"},
|
|
|
- }
|
|
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ ONEHOT = [
|
|
|
|
|
+ "price_type_name", # 卷烟价类名称
|
|
|
|
|
+ "gear_type_name", # 卷烟档位名称
|
|
|
|
|
+ "category_type_name", # 卷烟品类名称
|
|
|
|
|
+ "is_key_brand", # 是否重点品牌
|
|
|
|
|
+ "is_high_level", # 是否高端烟
|
|
|
|
|
+ "is_upscale_level", # 是否高端烟不含高价
|
|
|
|
|
+ "is_high_price", # 是否高价烟
|
|
|
|
|
+ "is_low_price", # 是否低价烟
|
|
|
|
|
+ "is_low_tar", # 是否低焦油烟
|
|
|
|
|
+ "is_encourage", # 是否全国鼓励品牌
|
|
|
|
|
+ "is_abnormity", # 是否异形包装
|
|
|
|
|
+ "is_intake", # 是否进口烟
|
|
|
|
|
+ "is_short", # 是否紧俏品牌
|
|
|
|
|
+ "is_medium", # 是否中支烟
|
|
|
|
|
+ "is_shortbranch", # 是否短支烟
|
|
|
|
|
+ "is_ordinary_price_type", # 是否普一类烟
|
|
|
|
|
+ "source_type", # 来源类型
|
|
|
|
|
+ "product_style_code_name", # 包装类型名称
|
|
|
|
|
+ "chinese_mix", # 中式混合
|
|
|
|
|
+ "sub_price_type_name", # 细分卷烟价类名称
|
|
|
|
|
+ ]
|