Commit ec96c4ad authored by myhloli

Merge remote-tracking branch 'origin/master'

parents 81260a22 ab1ec002
...@@ -32,8 +32,6 @@ jobs: ...@@ -32,8 +32,6 @@ jobs:
- name: check-requirements - name: check-requirements
run: | run: |
source ~/.bashrc source ~/.bashrc
conda init
conda activate QA
pip install magic-pdf[full-cpu]==0.6.1 -i https://pypi.tuna.tsinghua.edu.cn/simple pip install magic-pdf[full-cpu]==0.6.1 -i https://pypi.tuna.tsinghua.edu.cn/simple
pip install https://raw.githubusercontent.com/myhloli/wheels/main/assets/whl/detectron2/detectron2-0.6-cp310-cp310-linux_x86_64.whl pip install https://raw.githubusercontent.com/myhloli/wheels/main/assets/whl/detectron2/detectron2-0.6-cp310-cp310-linux_x86_64.whl
......
<div id="top"></div> <div id="top">
<p align="center">
<img src="docs/images/datalab_logo.png" width="160px" style="vertical-align:middle;">
<span style="font-size: 28px; vertical-align: middle;">MinerU</span>
</p>
</div>
<div align="center"> <div align="center">
[![stars](https://img.shields.io/github/stars/opendatalab/MinerU.svg)](https://github.com/opendatalab/MinerU) [![stars](https://img.shields.io/github/stars/opendatalab/MinerU.svg)](https://github.com/opendatalab/MinerU)
...@@ -17,7 +24,14 @@ ...@@ -17,7 +24,14 @@
</div> </div>
<div align="center"> <div align="center">
<p align="center">
<a href="https://github.com/opendatalab/MinerU">MinerU: An end-to-end PDF parsing tool based on PDF-Extract-Kit, supporting conversion from PDF to Markdown.</a>🚀🚀🚀<br>
<a href="https://github.com/opendatalab/PDF-Extract-Kit">PDF-Extract-Kit: A Comprehensive Toolkit for High-Quality PDF Content Extraction</a>🔥🔥🔥
</p>
<p align="center">
👋 join us on <a href="https://discord.gg/AsQMhuMN" target="_blank">Discord</a> and <a href="https://cdn.vansin.top/internlm/mineru.jpg" target="_blank">WeChat</a>
</p>
</div> </div>
# MinerU # MinerU
......
<div id="top"></div> <div id="top">
<p align="center">
<img src="docs/images/datalab_logo.png" width="160px" style="vertical-align:middle;">
<span style="font-size: 28px; vertical-align: middle;">MinerU</span>
</p>
</div>
<div align="center"> <div align="center">
[![stars](https://img.shields.io/github/stars/opendatalab/MinerU.svg)](https://github.com/opendatalab/MinerU) [![stars](https://img.shields.io/github/stars/opendatalab/MinerU.svg)](https://github.com/opendatalab/MinerU)
...@@ -14,7 +19,14 @@ ...@@ -14,7 +19,14 @@
</div> </div>
<div align="center"> <div align="center">
<p align="center">
<a href="https://github.com/opendatalab/MinerU">MinerU: 端到端的PDF解析工具(基于PDF-Extract-Kit)支持PDF转Markdown</a>🚀🚀🚀<br>
<a href="https://github.com/opendatalab/PDF-Extract-Kit">PDF-Extract-Kit: 高质量PDF解析工具箱</a>🔥🔥🔥
</p>
<p align="center">
👋 join us on <a href="https://discord.gg/AsQMhuMN" target="_blank">Discord</a> and <a href="https://cdn.vansin.top/internlm/mineru.jpg" target="_blank">WeChat</a>
</p>
</div> </div>
# MinerU # MinerU
......
...@@ -6,7 +6,7 @@ import json ...@@ -6,7 +6,7 @@ import json
from magic_pdf.pipe.UNIPipe import UNIPipe from magic_pdf.pipe.UNIPipe import UNIPipe
from magic_pdf.rw.DiskReaderWriter import DiskReaderWriter from magic_pdf.rw.DiskReaderWriter import DiskReaderWriter
from lib import calculate_score from lib import calculate_score
import shutil
pdf_res_path = conf.conf["pdf_res_path"] pdf_res_path = conf.conf["pdf_res_path"]
code_path = conf.conf["code_path"] code_path = conf.conf["code_path"]
pdf_dev_path = conf.conf["pdf_dev_path"] pdf_dev_path = conf.conf["pdf_dev_path"]
...@@ -58,8 +58,8 @@ def pdf_to_markdown(): ...@@ -58,8 +58,8 @@ def pdf_to_markdown():
if not os.path.exists(dir_path): if not os.path.exists(dir_path):
os.makedirs(dir_path, exist_ok=True) os.makedirs(dir_path, exist_ok=True)
res_path = os.path.join(dir_path, f"{demo_name}.md") res_path = os.path.join(dir_path, f"{demo_name}.md")
#src_path = os.path.join(pdf_res_path, "pdf", f"{demo_name}.pdf") src_path = os.path.join(pdf_res_path, demo_name, "auto", f"{demo_name}.md")
#shutil.copy(src_path, res_path) shutil.copy(src_path, res_path)
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment