img.py 1.0 KB

1234567891011121314151617181920212223242526272829
  1. # -*- coding: utf-8 -*-
  2. from .__load__ import *
  3. from langchain_community.document_loaders import UnstructuredImageLoader
  4. from langchain.schema import Document
  5. from aip import AipOcr
  6. #from PIL import Image
  7. #from cnocr import CnOcr
  8. #from pix2text import Pix2Text, merge_line_texts
  9. class Img(object):
  10. def run(self, file, param = {}):
  11. #loader = UnstructuredImageLoader(file, mode='single', **param)
  12. #return loader.load()
  13. with open(file, 'rb') as image_file:
  14. image_data = image_file.read()
  15. # 初始化AipOcr对象
  16. client = AipOcr(Demeter.config['baiduocr']['app_id'], Demeter.config['baiduocr']['api_key'], Demeter.config['baiduocr']['secret_key'])
  17. # 调用百度OCR接口识别文字
  18. result = client.basicGeneral(image_data)
  19. text = ''
  20. if 'words_result' in result:
  21. for item in result['words_result']:
  22. text += item['words'] + '\n'
  23. data = Document(page_content=text, metadata={"source": "ocr"})
  24. return data