Commit 2e487cac authored by 赵小蒙

修复目录重构导致的引用异常

parent 846dbecf
...@@ -2,7 +2,7 @@ import json ...@@ -2,7 +2,7 @@ import json
import os import os
from tqdm import tqdm from tqdm import tqdm
from magic_pdf.libs import join_path from magic_pdf.libs.commons import join_path
with open('/mnt/petrelfs/share_data/ouyanglinke/OCR/OCR_validation_dataset.json', 'r') as f: with open('/mnt/petrelfs/share_data/ouyanglinke/OCR/OCR_validation_dataset.json', 'r') as f:
samples = json.load(f) samples = json.load(f)
......
from magic_pdf.libs import fitz # PyMuPDF from magic_pdf.libs.commons import fitz # PyMuPDF
# PDF文件路径 # PDF文件路径
pdf_path = "D:\\project\\20231108code-clean\\code-clean\\tmp\\unittest\\download-pdfs\\scihub\\scihub_53700000\\libgen.scimag53724000-53724999.zip_10.1097\\00129191-200509000-00018.pdf" pdf_path = "D:\\project\\20231108code-clean\\code-clean\\tmp\\unittest\\download-pdfs\\scihub\\scihub_53700000\\libgen.scimag53724000-53724999.zip_10.1097\\00129191-200509000-00018.pdf"
......
...@@ -5,7 +5,7 @@ from pathlib import Path ...@@ -5,7 +5,7 @@ from pathlib import Path
import click import click
from loguru import logger from loguru import logger
from magic_pdf.libs import join_path from magic_pdf.libs.commons import join_path
from magic_pdf.dict2md.mkcontent import mk_mm_markdown from magic_pdf.dict2md.mkcontent import mk_mm_markdown
from magic_pdf.pipeline import parse_pdf_by_model from magic_pdf.pipeline import parse_pdf_by_model
......
import io import io
import json import json
import os import os
from magic_pdf.libs import fitz from magic_pdf.libs.commons import fitz
from app.common.s3 import get_s3_config, get_s3_client from app.common.s3 import get_s3_config, get_s3_client
from magic_pdf.libs import join_path, json_dump_path, read_file, parse_bucket_key from magic_pdf.libs.commons import join_path, json_dump_path, read_file, parse_bucket_key
from loguru import logger from loguru import logger
test_pdf_dir_path = "s3://llm-pdf-text/unittest/pdf/" test_pdf_dir_path = "s3://llm-pdf-text/unittest/pdf/"
......
...@@ -2,10 +2,10 @@ import os ...@@ -2,10 +2,10 @@ import os
import pytest import pytest
from magic_pdf.filter import classify_by_area, classify_by_text_len, classify_by_avg_words, \ from magic_pdf.filter.pdf_classify_by_type import classify_by_area, classify_by_text_len, classify_by_avg_words, \
classify_by_img_num, classify_by_text_layout, classify_by_img_narrow_strips classify_by_img_num, classify_by_text_layout, classify_by_img_narrow_strips
from magic_pdf.filter.pdf_meta_scan import get_pdf_page_size_pts, get_pdf_textlen_per_page, get_imgs_per_page from magic_pdf.filter.pdf_meta_scan import get_pdf_page_size_pts, get_pdf_textlen_per_page, get_imgs_per_page
from test.test_commons import get_docs_from_test_pdf, get_test_json_data from tests.test_commons import get_docs_from_test_pdf, get_test_json_data
# 获取当前目录 # 获取当前目录
current_directory = os.path.dirname(os.path.abspath(__file__)) current_directory = os.path.dirname(os.path.abspath(__file__))
......
...@@ -2,7 +2,7 @@ import os ...@@ -2,7 +2,7 @@ import os
import pytest import pytest
from magic_pdf.filter.pdf_meta_scan import get_pdf_page_size_pts, get_image_info, get_pdf_text_layout_per_page, get_language from magic_pdf.filter.pdf_meta_scan import get_pdf_page_size_pts, get_image_info, get_pdf_text_layout_per_page, get_language
from test.test_commons import get_docs_from_test_pdf, get_test_json_data from tests.test_commons import get_docs_from_test_pdf, get_test_json_data
# 获取当前目录 # 获取当前目录
current_directory = os.path.dirname(os.path.abspath(__file__)) current_directory = os.path.dirname(os.path.abspath(__file__))
......
...@@ -11,21 +11,21 @@ Execute the following command to run the tests under directory code-clean: ...@@ -11,21 +11,21 @@ Execute the following command to run the tests under directory code-clean:
""" """
from test.test_para.test_pdf2text_recogPara_Common import ( from tests.test_para.test_pdf2text_recogPara_Common import (
TestIsBboxOverlap, TestIsBboxOverlap,
TestIsInBbox, TestIsInBbox,
TestIsBboxOverlap, TestIsBboxOverlap,
TestIsLineLeftAlignedFromNeighbors, TestIsLineLeftAlignedFromNeighbors,
TestIsLineRightAlignedFromNeighbors, TestIsLineRightAlignedFromNeighbors,
) )
from test.test_para.test_pdf2text_recogPara_EquationsProcessor import TestCalcOverlapPct from tests.test_para.test_pdf2text_recogPara_EquationsProcessor import TestCalcOverlapPct
from test.test_para.test_pdf2text_recogPara_BlockInnerParasProcessor import TestIsConsistentLines from tests.test_para.test_pdf2text_recogPara_BlockInnerParasProcessor import TestIsConsistentLines
from test.test_para.test_pdf2text_recogPara_BlockContinuationProcessor import ( from tests.test_para.test_pdf2text_recogPara_BlockContinuationProcessor import (
TestIsAlphabetChar, TestIsAlphabetChar,
TestIsChineseChar, TestIsChineseChar,
TestIsOtherLetterChar, TestIsOtherLetterChar,
) )
from test.test_para.test_pdf2text_recogPara_TitleProcessor import TestTitleProcessor from tests.test_para.test_pdf2text_recogPara_TitleProcessor import TestTitleProcessor
# Test suite # Test suite
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment