test_api.py 1.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657
  1. import requests
  2. from io import BytesIO
  3. import base64
  4. import json
  5. from PIL import Image, ImageFilter, ImageEnhance
  6. def image_to_base64(pil_image, image_format="JPEG"):
  7. """将PIL Image图像转换为Base64编码"""
  8. buffered = BytesIO()
  9. pil_image.save(buffered, format=image_format)
  10. img_byte_array = buffered.getvalue()
  11. encode_image = base64.b64encode(img_byte_array).decode('utf-8')
  12. return encode_image
  13. def resize_image(image, max_size=512):
  14. """缩放图像尺寸,保持 OCR 质量"""
  15. width, height = image.size
  16. max_dim = max(width, height)
  17. # 如果图像不需要缩小,直接返回
  18. if max_dim <= max_size:
  19. return image
  20. scaling_factor = max_size / max_dim
  21. new_width = int(width * scaling_factor)
  22. new_height = int(height * scaling_factor)
  23. resized = image.resize((new_width, new_height), Image.Resampling.LANCZOS)
  24. resized = resized.filter(ImageFilter.UnsharpMask(radius=1, percent=120, threshold=3))
  25. enhancer = ImageEnhance.Contrast(resized)
  26. resized = enhancer.enhance(1.1)
  27. return resized
  28. image = Image.open('./test1.jpg')
  29. image = resize_image(image)
  30. image_base64 = image_to_base64(image)
  31. # response = requests.post(
  32. # "http://127.0.0.1:8000/api/v1/ocr",
  33. # json={
  34. # "image": image_base64,
  35. # "text": PROMPT_EXTRACT_NAME
  36. # }
  37. # )
  38. response = requests.post(
  39. "https://749757254390085-http-7080.edge-proxy.gpugeek.com:8443/api/v1/agent_ocr",
  40. json={
  41. "image": image_base64,
  42. }
  43. )
  44. result = response.json()
  45. print(result)