# mysql_dao.py (5.1 KB)

  1. from database import MySqlDatabaseHelper
  2. from sqlalchemy import text
  3. import pandas as pd
  4. class MySqlDao:
  5. _instance = None
  6. def __new__(cls):
  7. if not cls._instance:
  8. cls._instance = super(MySqlDao, cls).__new__(cls)
  9. cls._instance._initialized = False
  10. return cls._instance
  11. def __init__(self):
  12. if self._initialized:
  13. return
  14. self.db_helper = MySqlDatabaseHelper()
  15. self._product_tablename = "tads_brandcul_product_info"
  16. self._cust_tablename = "tads_brandcul_cust_info"
  17. self._order_tablename = "tads_brandcul_cust_order"
  18. self._mock_order_tablename = "yunfu_mock_data"
  19. self._shopping_tablename = "tads_brandcul_cust_info_lbs"
  20. self._initialized = True
  21. def load_product_data(self, city_uuid):
  22. """从数据库中读取商品信息"""
  23. query = f"SELECT * FROM {self._product_tablename} WHERE city_uuid = :city_uuid"
  24. params = {"city_uuid": city_uuid}
  25. data = self.db_helper.load_data_with_page(query, params)
  26. return data
  27. def load_cust_data(self, city_uuid):
  28. """从数据库中读取商户信息"""
  29. query = f"SELECT * FROM {self._cust_tablename} WHERE BA_CITY_ORG_CODE = :city_uuid"
  30. params = {"city_uuid": city_uuid}
  31. data = self.db_helper.load_data_with_page(query, params)
  32. return data
  33. def load_order_data(self, city_uuid):
  34. """从数据库中读取订单信息"""
  35. query = f"SELECT * FROM {self._order_tablename} WHERE city_uuid = :city_uuid"
  36. params = {"city_uuid": city_uuid}
  37. data = self.db_helper.load_data_with_page(query, params)
  38. data.drop('stat_month', axis=1, inplace=True)
  39. data.drop('city_uuid', axis=1, inplace=True)
  40. # 去除重复值和填补缺失值
  41. data.drop_duplicates(inplace=True)
  42. data.fillna(0, inplace=True)
  43. data = data.infer_objects(copy=False)
  44. return data
  45. def load_mock_order_data(self):
  46. """从数据库中读取mock的订单信息"""
  47. query = f"SELECT * FROM {self._mock_order_tablename}"
  48. data = self.db_helper.load_data_with_page(query, {})
  49. # 去除重复值和填补缺失值
  50. data.drop_duplicates(inplace=True)
  51. data.fillna(0, inplace=True)
  52. data = data.infer_objects(copy=False)
  53. return data
  54. def load_shopping_data(self, city_uuid):
  55. """从数据库中读取商圈数据"""
  56. query = f"SELECT * FROM {self._shopping_tablename} WHERE city_uuid = :city_uuid"
  57. params = {"city_uuid": city_uuid}
  58. data = self.db_helper.load_data_with_page(query, params)
  59. return data
  60. def get_cust_list(self, city_uuid):
  61. """获取商户列表"""
  62. data = self.load_cust_data(city_uuid)
  63. cust_list = data["BB_RETAIL_CUSTOMER_CODE"].to_list()
  64. if len(cust_list) == 0:
  65. return []
  66. return cust_list
  67. def get_product_by_id(self, city_uuid, product_id):
  68. """根据city_uuid 和 product_id 从表中获取拼柜信息"""
  69. query = text(f"""
  70. SELECT *
  71. FROM {self._product_tablename}
  72. WHERE city_uuid = :city_uuid
  73. AND product_code = :product_id
  74. """)
  75. params = {"city_uuid": city_uuid, "product_id": product_id}
  76. data = self.db_helper.fetch_one(query, params)
  77. return data
  78. def get_cust_by_ids(self, city_uuid, cust_id_list):
  79. """根据零售户列表查询其信息"""
  80. if not cust_id_list:
  81. return None
  82. cust_id_str = ",".join([f"'{cust_id}'" for cust_id in cust_id_list])
  83. query = text(f"""
  84. SELECT *
  85. FROM {self._cust_tablename}
  86. WHERE BA_CITY_ORG_CODE = :city_uuid
  87. AND BB_RETAIL_CUSTOMER_CODE IN ({cust_id_str})
  88. """)
  89. params = {"city_uuid": city_uuid}
  90. data = self.db_helper.fetch_all(query, params)
  91. return data
  92. def data_preprocess(self, data: pd.DataFrame):
  93. data.drop(["cust_uuid", "longitude", "latitude", "range_radius"], axis=1, inplace=True)
  94. remaining_cols = data.columns.drop(["city_uuid", "cust_code"])
  95. col_with_missing = remaining_cols[data[remaining_cols].isnull().any()].tolist() # 判断有缺失的字段
  96. col_all_missing = remaining_cols[data[remaining_cols].isnull().all()].to_list() # 全部缺失的字段
  97. col_partial_missing = list(set(col_with_missing) - set(col_all_missing)) # 部分缺失的字段
  98. for col in col_partial_missing:
  99. data[col] = data[col].fillna(data[col].mean())
  100. for col in col_all_missing:
  101. data[col] = data[col].fillna(0).infer_objects(copy=False)
  102. if __name__ == "__main__":
  103. dao = MySqlDao()
  104. city_uuid = "00000000000000000000000011445301"
  105. # city_uuid = "00000000000000000000000011441801"
  106. cust_id_list = ["441800100006", "441800100051", "441800100811"]
  107. cust_list = dao.load_mock_order_data()