Spaces:
Sleeping
Sleeping
Update README.md (#1)
Browse files- Update README.md (52351f5b6abfe52798f5df04518a16b64831c96c)
README.md
CHANGED
|
@@ -1,15 +1,12 @@
|
|
| 1 |
---
|
| 2 |
title: parser2md - PDF & HTML parser to markdown
|
| 3 |
emoji: π
|
| 4 |
-
title: parser2md - PDF & HTML parser to markdown
|
| 5 |
-
emoji: π
|
| 6 |
colorFrom: yellow
|
| 7 |
colorTo: purple
|
| 8 |
sdk: gradio
|
| 9 |
command: python main.py
|
| 10 |
app_file: main.py
|
| 11 |
python_version: 3.12
|
| 12 |
-
python_version: 3.12
|
| 13 |
license: mit
|
| 14 |
pinned: true
|
| 15 |
short_description: PDF & HTML parser to markdown
|
|
@@ -40,6 +37,35 @@ owner: research-semmyk
|
|
| 40 |
#short_description: PDF & HTML parser to markdown
|
| 41 |
version: 0.1.0
|
| 42 |
readme: README.md
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 43 |
requires-python: ">=3.12"
|
| 44 |
dependencies: []
|
| 45 |
#owner: research-semmyk
|
|
@@ -48,6 +74,12 @@ dependencies: []
|
|
| 48 |
# - https://huggingface.co/datalab-to/surya_tablerec
|
| 49 |
# - huggingface.co/datalab-to/line_detector0
|
| 50 |
# - https://huggingface.co/tarun-menta/ocr_error_detection/blob/main/config.json
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 51 |
---
|
| 52 |
|
| 53 |
# parserPDF
|
|
@@ -208,6 +240,4 @@ MIT License. See [LICENSE](LICENSE) for details.
|
|
| 208 |
- PDF parsing via [Marker](https://github.com/VikParuchuri/marker).
|
| 209 |
- LLM integrations using Hugging Face Transformers and OpenAI APIs.
|
| 210 |
- HuggingFace Spaces Configuration Reference [HF Spaces Configuration Reference](https://huggingface.co/docs/hub/en/spaces-config-reference)
|
| 211 |
-
- IBM Research: [HF Spaces Guide](https://huggingface.co/spaces/ibm-granite/granite-vision-demo/blob/main/DEVELOPMENT.md)
|
| 212 |
-
- HuggingFace Spaces Configuration Reference [HF Spaces Configuration Reference](https://huggingface.co/docs/hub/en/spaces-config-reference)
|
| 213 |
- IBM Research: [HF Spaces Guide](https://huggingface.co/spaces/ibm-granite/granite-vision-demo/blob/main/DEVELOPMENT.md)
|
|
|
|
| 1 |
---
|
| 2 |
title: parser2md - PDF & HTML parser to markdown
|
| 3 |
emoji: π
|
|
|
|
|
|
|
| 4 |
colorFrom: yellow
|
| 5 |
colorTo: purple
|
| 6 |
sdk: gradio
|
| 7 |
command: python main.py
|
| 8 |
app_file: main.py
|
| 9 |
python_version: 3.12
|
|
|
|
| 10 |
license: mit
|
| 11 |
pinned: true
|
| 12 |
short_description: PDF & HTML parser to markdown
|
|
|
|
| 37 |
#short_description: PDF & HTML parser to markdown
|
| 38 |
version: 0.1.0
|
| 39 |
readme: README.md
|
| 40 |
+
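#pinned: true  # duplicate key: already set earlier in this front matter
|
| 41 |
+
#short_description: PDF & HTML parser to markdown  # duplicate key: already set earlier in this front matter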
|
| 42 |
+
models: [meta-llama/Llama-4-Maverick-17B-128E-Instruct, openai/gpt-oss-120b, openai/gpt-oss-20b]
|
| 43 |
+
tags: [markdown, PDF, parser, converter, extractor]
|
| 44 |
+
#hf_oauth: true
|
| 45 |
+
preload_from_hub: [datalab-to/surya_layout, datalab-to/surya_tablerec, datalab-to/line_detector0, "tarun-menta/ocr_error_detection config.json"]
|
| 46 |
+
owner: research-semmyk
|
| 47 |
+
#---
|
| 48 |
+
#
|
| 49 |
+
#[Project]
|
| 50 |
+
#---
|
| 51 |
+
#title: parser2md - PDF & HTML parser to markdown
|
| 52 |
+
#emoji: \U0001F4C4ππ
|
| 53 |
+
#colorFrom: yellow
|
| 54 |
+
#colorTo: purple
|
| 55 |
+
#sdk: gradio
|
| 56 |
+
#python_version: 3.12
|
| 57 |
+
#sdk_version: 5.44.1
|
| 58 |
+
#app_file: main.py
|
| 59 |
+
#command: python main.py
|
| 60 |
+
#models:
|
| 61 |
+
# - meta-llama/Llama-4-Maverick-17B-128E-Instruct
|
| 62 |
+
# - openai/gpt-oss-120b
|
| 63 |
+
#pinned: false
|
| 64 |
+
#license: mit
|
| 65 |
+
#name: parser2md
|
| 66 |
+
#short_description: PDF & HTML parser to markdown
|
| 67 |
+
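#version: 0.1.0  # duplicate key: already set earlier in this front matter
|
| 68 |
+
#readme: README.md  # duplicate key: already set earlier in this front matter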
|
| 69 |
requires-python: ">=3.12"
|
| 70 |
dependencies: []
|
| 71 |
#owner: research-semmyk
|
|
|
|
| 74 |
# - https://huggingface.co/datalab-to/surya_tablerec
|
| 75 |
# - huggingface.co/datalab-to/line_detector0
|
| 76 |
# - https://huggingface.co/tarun-menta/ocr_error_detection/blob/main/config.json
|
| 77 |
+
#owner: research-semmyk
|
| 78 |
+
#preload_from_hub:
|
| 79 |
+
# - https://huggingface.co/datalab-to/surya_layout
|
| 80 |
+
# - https://huggingface.co/datalab-to/surya_tablerec
|
| 81 |
+
# - huggingface.co/datalab-to/line_detector0
|
| 82 |
+
# - https://huggingface.co/tarun-menta/ocr_error_detection/blob/main/config.json
|
| 83 |
---
|
| 84 |
|
| 85 |
# parserPDF
|
|
|
|
| 240 |
- PDF parsing via [Marker](https://github.com/VikParuchuri/marker).
|
| 241 |
- LLM integrations using Hugging Face Transformers and OpenAI APIs.
|
| 242 |
- Hugging Face: [HF Spaces Configuration Reference](https://huggingface.co/docs/hub/en/spaces-config-reference)
|
|
|
|
|
|
|
| 243 |
- IBM Research: [HF Spaces Guide](https://huggingface.co/spaces/ibm-granite/granite-vision-demo/blob/main/DEVELOPMENT.md)
|