quyuan 1 жил өмнө
parent
commit
b7a2f547bb

+ 3 - 3
tests/test_cli/test_cli.py

@@ -23,7 +23,7 @@ class TestCli:
         """
         输入jsonl, 默认方式解析
         """
-        cmd = "cd %s && export PYTHONPATH=. && python magic_pdf/cli/magicpdf.py  json-command --json 's3://llm-process-pperf/ebook_index_textbook_40k/中高考&竞赛知识点/part-663f1ef5e7c1-009416.jsonl?bytes=0,1133972'"
+        cmd = "cd %s && export PYTHONPATH=. && python magic_pdf/cli/magicpdf.py  json-command --json 's3://llm-process-pperf/ebook_index_textbook_40k/中高考&竞赛知识点/part-663f1ef5e7c1-009416.jsonl?bytes=0,1133972'" % (code_path)
         logging.info(cmd)
         common.check_shell(cmd)
         common.count_folders_and_check_contents(pdf_res_path)
@@ -32,7 +32,7 @@ class TestCli:
         """
         输入jsonl, txt方式解析  
         """
-        cmd = "cd %s && export PYTHONPATH=. && python magic_pdf/cli/magicpdf.py  json-command --json 's3://llm-process-pperf/ebook_index_textbook_40k/中高考&竞赛知识点/part-663f1ef5e7c1-009416.jsonl?bytes=0,1133972' --method txt"
+        cmd = "cd %s && export PYTHONPATH=. && python magic_pdf/cli/magicpdf.py  json-command --json 's3://llm-process-pperf/ebook_index_textbook_40k/中高考&竞赛知识点/part-663f1ef5e7c1-009416.jsonl?bytes=0,1133972' --method txt" % (code_path)
         logging.info(cmd)
         common.check_shell(cmd)
         common.count_folders_and_check_contents(pdf_res_path)
@@ -41,7 +41,7 @@ class TestCli:
         """
         输入jsonl, ocr方式解析
         """
-        cmd = "cd %s && export PYTHONPATH=. && python magic_pdf/cli/magicpdf.py  json-command --json 's3://llm-process-pperf/ebook_index_textbook_40k/中高考&竞赛知识点/part-663f1ef5e7c1-009416.jsonl?bytes=0,1133972' --method ocr"
+        cmd = "cd %s && export PYTHONPATH=. && python magic_pdf/cli/magicpdf.py  json-command --json 's3://llm-process-pperf/ebook_index_textbook_40k/中高考&竞赛知识点/part-663f1ef5e7c1-009416.jsonl?bytes=0,1133972' --method ocr" % (code_path)
         logging.info(cmd)
         common.check_shell(cmd)
         common.count_folders_and_check_contents(pdf_res_path)