From b6e199096d33769f580d6aeb283ca85c67013156 Mon Sep 17 00:00:00 2001 From: wvivi2023 Date: Mon, 22 Apr 2024 13:34:14 +0800 Subject: [PATCH] first commit --- OCRPython/logs/ocr_reconginition.log | 12 +++ OCRPython/main.py | 6 +- OCRPython/maincopy.py | 95 +++++++++++----------- OCRTool/.idea/.gitignore | 3 - OCRTool/src/main/resources/application.yml | 8 +- 5 files changed, 67 insertions(+), 57 deletions(-) delete mode 100644 OCRTool/.idea/.gitignore diff --git a/OCRPython/logs/ocr_reconginition.log b/OCRPython/logs/ocr_reconginition.log index c30d500..63bdcec 100644 --- a/OCRPython/logs/ocr_reconginition.log +++ b/OCRPython/logs/ocr_reconginition.log @@ -201,3 +201,15 @@ 2024-04-21 15:25:57,306 - main.py[line:119] - INFO: 0 2024-04-21 15:25:57,483 - ocr.py[line:19] - INFO: from rapidocr_onnxruntime import RapidOCR 2024-04-21 15:26:00,173 - main.py[line:42] - INFO: extractIdCardInfo 耗时2.866658926010132秒 +2024-04-22 11:01:10,204 - ocr.py[line:19] - INFO: from rapidocr_onnxruntime import RapidOCR +2024-04-22 11:01:14,447 - main.py[line:42] - INFO: extractIdCardInfo 耗时4.689878702163696秒 +2024-04-22 11:01:54,639 - main.py[line:96] - INFO: main.py len of parameter: 2 +2024-04-22 11:01:54,640 - main.py[line:104] - INFO: python 脚本里的接收到的参数是: +2024-04-22 11:01:54,640 - main.py[line:105] - INFO: 0 +2024-04-22 11:01:54,640 - main.py[line:106] - INFO: 开始执行sys.stdin.read +2024-04-22 11:01:54,640 - main.py[line:108] - INFO: +2024-04-22 11:01:54,640 - main.py[line:109] - INFO: 55 +2024-04-22 11:01:54,640 - main.py[line:118] - INFO: 55 +2024-04-22 11:01:54,640 - main.py[line:119] - INFO: 0 +2024-04-22 11:01:54,819 - ocr.py[line:19] - INFO: from rapidocr_onnxruntime import RapidOCR +2024-04-22 11:01:57,426 - main.py[line:42] - INFO: extractIdCardInfo 耗时2.785860061645508秒 diff --git a/OCRPython/main.py b/OCRPython/main.py index d6df214..0489c63 100644 --- a/OCRPython/main.py +++ b/OCRPython/main.py @@ -95,12 +95,12 @@ if __name__ == "__main__": try: logger.info(f"main.py len of parameter: {len(sys.argv)}") jsonString = "" - if len(sys.argv) > 3: + if len(sys.argv) > 3: logger.info(f"{sys.argv[1]}") logger.info(f"{sys.argv[2]}") logger.info(f"{sys.argv[3]}") jsonString = extractIdCardInfo(int(sys.argv[1]), sys.argv[2], sys.argv[3]) - elif len(sys.argv) > 1: + elif len(sys.argv) > 1: logger.info(f"python 脚本里的接收到的参数是:") logger.info(f"{sys.argv[1]}") logger.info(f"开始执行sys.stdin.read") @@ -117,7 +117,7 @@ if __name__ == "__main__": data1 = split_data[0] logger.info(f"{len(data1)}") logger.info(f"{len(data2)}") - + jsonString = extractIdCardInfo(int(sys.argv[1]), data1, data2) print(jsonString) diff --git a/OCRPython/maincopy.py b/OCRPython/maincopy.py index 3a56b2d..edb49d6 100644 --- a/OCRPython/maincopy.py +++ b/OCRPython/maincopy.py @@ -37,6 +37,7 @@ def extractIdCardInfoByPath(filePath1: str, filePath2: str)->str: except Exception as e: logger.error(e) + logger.info(f"text:{text}") extractor = IdentityCardExtractor() jsonString = extractor.extract_textbyPaddle(text) end_time = time.time() # 记录结束时间 @@ -86,59 +87,59 @@ def extractIdCardInfoByBase64Data(base64data1:str, base64Data2: str)->str: # with open('/Users/wangvivi/Desktop/Code/ocrtest/images/id_card.JPG', 'rb') as image_file: # base64_image_string = base64.b64encode(image_file.read()).decode('utf-8') - +# # jsonString = extractIdCardInfoByBase64Data(base64_image_string,"") # print(jsonString) - -jsonString = extractIdCardInfoByPath("/Users/wangvivi/Desktop/Code/ocrtest/images/id_card.JPG","") -print(jsonString) +# +# jsonString = extractIdCardInfoByPath("/Users/wangvivi/Desktop/Code/ocrtest/images/id_card.JPG","") +# print(jsonString) -# if __name__ == "__main__": -# try: -# logger.info(f"main.py len of parameter: {len(sys.argv)}") -# jsonString = "" -# if len(sys.argv) > 3: -# logger.info(f"{sys.argv[1]}") -# logger.info(f"{sys.argv[2]}") -# logger.info(f"{sys.argv[3]}") -# jsonString = extractIdCardInfo(int(sys.argv[1]), sys.argv[2], sys.argv[3]) -# elif len(sys.argv) > 1: -# logger.info(f"python 脚本里的接收到的参数是:") -# logger.info(f"{sys.argv[1]}") -# logger.info(f"开始执行sys.stdin.read") -# input_data = sys.stdin.read() -# logger.info("") -# logger.info(f"{len(input_data)}") -# split_data = input_data.split(os.linesep) -# data1 = "" -# data2 = "" -# if 2 == len(split_data): -# data1 = split_data[0] -# data2 = split_data[1] -# elif 1 == len(split_data): -# data1 = split_data[0] -# logger.info(f"{len(data1)}") -# logger.info(f"{len(data2)}") - -# jsonString = extractIdCardInfo(int(sys.argv[1]), data1, data2) -# print(jsonString) -# except KeyboardInterrupt: -# logger.error("KeyboardInterrupt") +if __name__ == "__main__": + try: + logger.info(f"main.py len of parameter: {len(sys.argv)}") + jsonString = "" + if len(sys.argv) > 3: + logger.info(f"{sys.argv[1]}") + logger.info(f"{sys.argv[2]}") + logger.info(f"{sys.argv[3]}") + jsonString = extractIdCardInfo(int(sys.argv[1]), sys.argv[2], sys.argv[3]) + elif len(sys.argv) > 1: + logger.info(f"python 脚本里的接收到的参数是:") + logger.info(f"{sys.argv[1]}") + logger.info(f"开始执行sys.stdin.read") + input_data = sys.stdin.read() + logger.info("") + logger.info(f"len(input_data):{len(input_data)}") + split_data = input_data.split(os.linesep) + data1 = "" + data2 = "" + if 2 == len(split_data): + data1 = split_data[0] + data2 = split_data[1] + elif 1 == len(split_data): + data1 = split_data[0] + logger.info(f"{data1}") + logger.info(f"{data2}") -# except IndexError: -# # 如果参数过长,捕获 IndexError 异常并进行处理 -# logger.error("参数过长,未指定足够的参数") + jsonString = extractIdCardInfo(int(sys.argv[1]), data1, data2) + print(jsonString) + except KeyboardInterrupt: + logger.error("KeyboardInterrupt") -# except OverflowError: -# # 如果发生了 OverflowError 异常,捕获并进行相应的处理 -# logger.error("命令行参数过长,导致溢出错误") + except IndexError: + # 如果参数过长,捕获 IndexError 异常并进行处理 + logger.error("参数过长,未指定足够的参数") -# except EOFError: -# # 如果达到输入流的末尾,捕获 EOFError 异常并进行处理 -# logger.error("已经到达输入流的末尾") + except OverflowError: + # 如果发生了 OverflowError 异常,捕获并进行相应的处理 + logger.error("命令行参数过长,导致溢出错误") -# except Exception as e: -# # 如果发生了其他异常,捕获并进行相应的处理 -# logger.error("发生了异常:", e) + except EOFError: + # 如果达到输入流的末尾,捕获 EOFError 异常并进行处理 + logger.error("已经到达输入流的末尾") + + except Exception as e: + # 如果发生了其他异常,捕获并进行相应的处理 + logger.error("发生了异常:", e) diff --git a/OCRTool/.idea/.gitignore b/OCRTool/.idea/.gitignore deleted file mode 100644 index 26d3352..0000000 --- a/OCRTool/.idea/.gitignore +++ /dev/null @@ -1,3 +0,0 @@ -# Default ignored files -/shelf/ -/workspace.xml diff --git a/OCRTool/src/main/resources/application.yml b/OCRTool/src/main/resources/application.yml index 24ae826..2423790 100644 --- a/OCRTool/src/main/resources/application.yml +++ b/OCRTool/src/main/resources/application.yml @@ -3,8 +3,8 @@ spring: active=dev: recognition: - pythonEnv: /Users/wangvivi/Desktop/MySelf/myenv/bin/python - scriptEnv: /Users/wangvivi/Desktop/Code/Component/OCR/main.py - #pythonEnv: /Users/wangvivi/miniconda3/envs/ocr/bin/python - #scriptEnv: /Users/wangvivi/Desktop/Code/Component/OCR/maincopy.py +# pythonEnv: /Users/wangvivi/Desktop/MySelf/myenv/bin/python +# scriptEnv: /Users/wangvivi/Desktop/Code/Component/OCRPython/main.py + pythonEnv: /Users/wangvivi/miniconda3/envs/ocr/bin/python + scriptEnv: /Users/wangvivi/Desktop/Code/Component/OCRPython/maincopy.py