ocr_tesseract.py 1.8 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243
  1. # -*- coding:utf-8 -*-
  2. from ssat_sdk import sat_environment
  3. from ssat_sdk.utils.LoggingUtil import DebugLogger
  4. import os, sys, time
  5. import pytesseract as tes
  6. import cv2 as cv
  7. try:
  8. from PIL import Image
  9. except ImportError:
  10. import Image
  11. Lan_Default = ""
  12. Tes_LanDIC = {"chineseprc+english": "chi_eng", "chinesetaiwan+english": "",
  13. "spanish": "",
  14. "chineseprc": "chi_sim", "chinesetaiwan": "chi_tra", "russian": "", "french": "",
  15. "english": "eng", "vietnamese": "", "hebrew": "", "thai": "",
  16. "arabic":""
  17. }
  18. class OCRTes():
  19. def __init__(self):
  20. self.logger = DebugLogger()
  21. self.uiStyle = sat_environment.getMenuTreeSelectedStyle()
  22. self.chip = sat_environment.getMenuTreeSelectedChip()
  23. self.tesData_proj = self.chip + "." + self.uiStyle
  24. self.logger.info(__file__, "OCRTes", "__init__", "tesData:" + self.tesData_proj)
  25. # print "getMenuTreeRootDir:",sat_environment.getMenuTreeRootDir()
  26. # print "getMenuTreeSelectedProjectCfgPath:",sat_environment.getMenuTreeSelectedProjectCfgPath()
  27. # print "getMenuTreeSelectedChip:",sat_environment.getMenuTreeSelectedChip()
  28. # print "getMenuTreeSelectedTVUI:",sat_environment.getMenuTreeSelectedTVUI()
  29. # print "getSATMenuTreeDIR:",sat_environment.getSATMenuTreeDIR()
  30. def getStr(self,picPath, lan, type ):
  31. tesdata = self.tesData_proj #+ "." + Lan_Default #每个项目,暂时只放一个字库,不区分语言
  32. print "OCRTes.getStr,params:",picPath, tesdata, type
  33. startTime = time.time()
  34. strArr = tes.image_to_string(picPath, lang=tesdata)
  35. print "OCRTes,getStr cost:", time.time() - startTime
  36. # strArr = tes.image_to_data(img, lang=lan)
  37. # print strArr
  38. return strArr