Commit 88e16305 authored by zhougaofeng
Browse files

Update pdf_client.py

parent bf156ede
# -*- coding: utf-8 -*- # -*- coding: utf-8 -*-
import configparser
import time import time
import requests import requests
...@@ -12,14 +13,15 @@ class ocrPdfClient: ...@@ -12,14 +13,15 @@ class ocrPdfClient:
def __init__(self, api_url): def __init__(self, api_url):
self.api_url = api_url self.api_url = api_url
def ocr_pdf_client(self, path,output_dir): def ocr_pdf_client(self, path,output_dir,config_path):
payload = { payload = {
"path": str(path), "path": str(path),
"output_dir": str(output_dir), "output_dir": str(output_dir),
'config_path': str(config_path)
} }
logger.info(f'pdf路径:{path},输出路径{output_dir}') logger.info(f'pdf_server:{self.api_url},pdf路径:{path},输出路径{output_dir},配置文件在{config_path}')
response = requests.post(f"{self.api_url}/pdf_ocr", json=payload) response = requests.post(f"{self.api_url}/pdf_ocr", json=payload)
logger.info(f'response:{response}') #logger.info(f'response:{response}')
if response.status_code == 200: if response.status_code == 200:
return output_dir return output_dir
...@@ -29,10 +31,6 @@ class ocrPdfClient: ...@@ -29,10 +31,6 @@ class ocrPdfClient:
def parse_args(): def parse_args():
parser = argparse.ArgumentParser() parser = argparse.ArgumentParser()
parser.add_argument(
'--url',
default='http://0.0.0.0:6030',
)
parser.add_argument( parser.add_argument(
'--path', '--path',
'-p', '-p',
...@@ -43,14 +41,21 @@ def parse_args(): ...@@ -43,14 +41,21 @@ def parse_args():
'-o', '-o',
required=True required=True
) )
parser.add_argument(
'--config_path',
default='/home/practice/magic_pdf-main/magic_pdf/config.ini',
)
args = parser.parse_args() args = parser.parse_args()
return args return args
def main(): def main():
args = parse_args() args = parse_args()
config = configparser.ConfigParser()
embedder = ocrPdfClient(args.url) config.read(args.config_path)
pdf_server = config.get('server', 'pdf_server')
embedder = ocrPdfClient(pdf_server)
doc_analyze_start = time.time() doc_analyze_start = time.time()
if not os.path.isabs(args.output_dir): if not os.path.isabs(args.output_dir):
...@@ -79,4 +84,3 @@ def main(): ...@@ -79,4 +84,3 @@ def main():
if __name__ == "__main__": if __name__ == "__main__":
main() main()
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment