file_stream.py 3.3 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980
  1. import time
  2. from core import get_logger, settings
  3. from io import BytesIO
  4. import os
  5. import pandas as pd
  6. import requests
  7. logger = get_logger("utils.file_stream")
  class FileStreamUtils:
      """Static helpers for uploading report files and downloading them as DataFrames.

      Both helpers log failures and return ``None`` instead of raising, so
      callers must check the return value.
      """

      # Endpoints are read from project settings once, when the class is defined.
      upload_url = settings.file_upload_url
      download_url = settings.file_download_url
      # Headers sent with every upload and download request.
      headers = {
          "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36",
          "Accept": "*/*",
      }
      # Default (connect, read) timeout in seconds. Without a timeout, requests
      # waits forever on a stalled server. Override per call via ``timeout=``.
      request_timeout = (10, 120)

      @staticmethod
      def upload_files(reports_dir, files, timeout=None):
          """Upload ``<reports_dir>/<name>.xlsx`` for every name in ``files``.

          Args:
              reports_dir: Directory containing the ``.xlsx`` files.
              files: Iterable of file names without the ``.xlsx`` extension.
              timeout: Optional requests timeout (seconds or ``(connect, read)``
                  tuple). Defaults to ``FileStreamUtils.request_timeout``.

          Returns:
              A dict mapping each name to the ``fileid`` reported by the server,
              or ``None`` as soon as any single upload fails (ids of files
              uploaded before the failure are not returned).
          """
          if timeout is None:
              timeout = FileStreamUtils.request_timeout

          files_id = {}
          for filename in files:
              file_path = os.path.join(reports_dir, f"{filename}.xlsx")
              start_time = time.perf_counter()
              try:
                  with open(file_path, "rb") as f:
                      response = requests.post(
                          FileStreamUtils.upload_url,
                          headers=FileStreamUtils.headers,
                          files={"file": (os.path.basename(file_path), f)},
                          verify=True,
                          timeout=timeout,
                      )
                  duration_ms = (time.perf_counter() - start_time) * 1000

                  # Parse the body once; a non-JSON body raises and is handled
                  # by the except clauses below.
                  payload = response.json()
                  if not payload.get("success"):
                      logger.error(f"Upload failed for {filename}: {response.text}")
                      return None

                  file_id = payload["data"]["file_info"]["fileid"]
                  files_id[filename] = file_id
                  logger.info(f"File uploaded: {filename} -> {file_id} ({duration_ms:.0f}ms)")
              except requests.exceptions.RequestException as e:
                  logger.error(f"Upload request error for {filename}: {e}", exc_info=True)
                  return None
              except Exception as e:
                  # Covers a missing local file, an unexpected response shape, etc.
                  logger.error(f"Upload error for {filename}: {e}", exc_info=True)
                  return None
          return files_id

      @staticmethod
      def download_file(file_id, file_type="xlsx", timeout=None):
          """Download a file by ``file_id`` and parse it into a pandas object.

          The original note describes the backend as the Alibaba Cloud file
          database.

          Args:
              file_id: Identifier appended to ``download_url``.
              file_type: ``"xlsx"`` (read with openpyxl) or ``"csv"``.
              timeout: Optional requests timeout (seconds or ``(connect, read)``
                  tuple). Defaults to ``FileStreamUtils.request_timeout``.

          Returns:
              The result of ``pd.read_excel`` / ``pd.read_csv`` on success, or
              ``None`` on a non-200 status, an unsupported ``file_type``, a
              request error, or a parse error (all are logged).
          """
          if timeout is None:
              timeout = FileStreamUtils.request_timeout

          start_time = time.perf_counter()
          try:
              # Reject unsupported types before the request so nothing is
              # downloaded only to be thrown away. The error is raised inside
              # the try so it is logged and turned into None like other failures.
              if file_type not in ("xlsx", "csv"):
                  raise ValueError(f"不支持的文件类型:{file_type}")

              response = requests.get(
                  f"{FileStreamUtils.download_url}/{file_id}",
                  headers=FileStreamUtils.headers,
                  verify=True,
                  timeout=timeout,
              )
              duration_ms = (time.perf_counter() - start_time) * 1000

              if response.status_code != 200:
                  logger.error(f"Download failed: file_id={file_id}, status={response.status_code}")
                  return None

              file_content = BytesIO(response.content)
              if file_type == "xlsx":
                  data = pd.read_excel(file_content, engine="openpyxl")
              else:
                  data = pd.read_csv(file_content)
              logger.info(f"File downloaded: {file_id} ({duration_ms:.0f}ms, {len(response.content)} bytes)")
              return data
          except requests.exceptions.RequestException as e:
              logger.error(f"Download request error: file_id={file_id}, error={e}", exc_info=True)
              return None
          except Exception as e:
              logger.error(f"Download error: file_id={file_id}, error={e}", exc_info=True)
              return None