Mercurial > repos > bgruening > markitdown
annotate markitdown.xml @ 1:f6fa7e70120f draft
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit 1df47411ce8651c1d4f68cd032b2afe7d5a721de
| author | bgruening |
|---|---|
| date | Mon, 13 Oct 2025 13:22:13 +0000 |
| parents | 5ad32046903b |
| children | 4926706c13db |
| rev | line source |
|---|---|
|
1
f6fa7e70120f
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit 1df47411ce8651c1d4f68cd032b2afe7d5a721de
bgruening
parents:
0
diff
changeset
|
1 <tool id="markitdown" name="Markitdown" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@"> |
|
0
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
2 <description>Convert documents to Markdown</description> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
3 <macros> |
|
1
f6fa7e70120f
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit 1df47411ce8651c1d4f68cd032b2afe7d5a721de
bgruening
parents:
0
diff
changeset
|
4 <token name="@TOOL_VERSION@">0.1.3</token> |
|
f6fa7e70120f
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit 1df47411ce8651c1d4f68cd032b2afe7d5a721de
bgruening
parents:
0
diff
changeset
|
5 <token name="@VERSION_SUFFIX@">0</token> |
|
f6fa7e70120f
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit 1df47411ce8651c1d4f68cd032b2afe7d5a721de
bgruening
parents:
0
diff
changeset
|
6 <token name="@PROFILE@">23.0</token> |
|
0
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
7 </macros> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
8 <requirements> |
|
1
f6fa7e70120f
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit 1df47411ce8651c1d4f68cd032b2afe7d5a721de
bgruening
parents:
0
diff
changeset
|
9 <requirement type="package" version="3.12">python</requirement> |
|
f6fa7e70120f
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit 1df47411ce8651c1d4f68cd032b2afe7d5a721de
bgruening
parents:
0
diff
changeset
|
10 <requirement type="package" version="@TOOL_VERSION@">markitdown</requirement> |
|
0
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
11 </requirements> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
12 |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
13 <command detect_errors="exit_code"><![CDATA[ |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
14 #set ext_map = { |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
15 'pdf': 'pdf', 'docx': 'docx', 'pptx': 'pptx', 'xlsx': 'xlsx', |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
16 'html': 'html', 'txt': 'txt', 'ipynb': 'ipynb', |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
17 'markdown': 'md', 'zip': 'zip', 'tabular': 'csv', 'csv': 'csv' |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
18 } |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
19 |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
20 #set file_ext = ext_map.get($input.ext, '') |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
21 #set final_ext = $ext_hint if $ext_hint else $file_ext |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
22 |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
23 markitdown |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
24 '$input' |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
25 -x '$final_ext' |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
26 #if $mime_type: |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
27 -m '$mime_type' |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
28 #end if |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
29 #if $charset: |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
30 -c '$charset' |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
31 #end if |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
32 $keep_data_uris |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
33 -o '$output' |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
34 ]]></command> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
35 |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
36 <inputs> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
37 <param name="input" type="data" format="pdf,docx,pptx,xlsx,html,txt,ipynb,markdown,zip,tabular,csv"
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
38 label="Input file"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
39 <param name="ext_hint" type="text" optional="true" label="Extension override"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
40 <param name="mime_type" type="text" optional="true" label="MIME type hint"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
41 <param name="charset" type="text" optional="true" label="Character set (e.g. UTF-8)"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
42 <param name="keep_data_uris" type="boolean" truevalue="--keep-data-uris" falsevalue="" label="Keep embedded data URIs"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
43 </inputs> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
44 |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
45 <outputs> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
46 <data name="output" format="markdown" label="Converted Markdown output"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
47 </outputs> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
48 |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
49 <tests> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
50 <test> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
51 <param name="input" value="EAR.pdf" ftype="pdf"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
52 <output name="output"> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
53 <assert_contents> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
54 <has_text text="Tags: ERGA-BGE"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
55 <has_text text="Lineage: mammalia_odb10"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
56 </assert_contents> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
57 </output> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
58 </test> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
59 |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
60 <test> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
61 <param name="input" value="example.docx" ftype="docx"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
62 <output name="output"> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
63 <assert_contents> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
64 <has_text text="# Lorem ipsum dolor sit amet, consectetur adipiscing elit."/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
65 </assert_contents> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
66 </output> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
67 </test> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
68 |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
69 <!--test> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
70 <param name="input" value="example.odt"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
71 <param name="ext_hint" value="odt"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
72 <output name="output"> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
73 <assert_contents> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
74 <has_text text="This is a Word document"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
75 </assert_contents> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
76 </output> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
77 </test--> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
78 |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
79 <test> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
80 <param name="input" value="report_4.html" ftype="html"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
81 <param name="keep_data_uris" value="true"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
82 <output name="output"> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
83 <assert_contents> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
84 <has_text text="is the contig length such that using longer or equal length contigs produces"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
85 </assert_contents> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
86 </output> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
87 </test> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
88 |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
89 <test> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
90 <param name="input" value="example.txt" ftype="txt"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
91 <param name="ext_hint" value="txt"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
92 <output name="output"> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
93 <assert_contents> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
94 <has_text text="This is a plain text file"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
95 </assert_contents> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
96 </output> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
97 </test> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
98 |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
99 <test> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
100 <param name="input" value="example.ipynb" ftype="ipynb"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
101 <output name="output"> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
102 <assert_contents> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
103 <has_text text="print(&quot;Hello, world!&quot;)"/> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
104 </assert_contents> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
105 </output> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
106 </test> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
107 </tests> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
108 |
|
1
f6fa7e70120f
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit 1df47411ce8651c1d4f68cd032b2afe7d5a721de
bgruening
parents:
0
diff
changeset
|
109 <help format="markdown"><![CDATA[ |
|
f6fa7e70120f
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit 1df47411ce8651c1d4f68cd032b2afe7d5a721de
bgruening
parents:
0
diff
changeset
|
110 |
|
0
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
111 **Markitdown** converts rich document formats (PDF, DOCX, HTML, etc.) to Markdown. |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
112 |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
113 --- |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
114 |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
115 ### Supported Formats: |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
116 |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
117 - PDF, DOCX, PPTX, XLSX |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
118 - HTML, TXT, Markdown |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
119 - Jupyter Notebooks (IPYNB) |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
120 - ZIP containing supported formats |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
121 - Tabular (CSV) |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
122 |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
123 --- |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
124 |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
125 ### Options: |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
126 |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
127 - **Extension override** (`-x`): hint for file type if not obvious |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
128 - **MIME type** (`-m`): manual MIME hint |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
129 - **Charset** (`-c`): text encoding hint |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
130 - **Keep data URIs**: retain base64-encoded images |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
131 |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
132 Project: https://github.com/microsoft/markitdown |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
133 ]]></help> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
134 |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
135 <citations> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
136 <citation type="bibtex"> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
137 @misc{markitdown2024, |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
138 author = {Microsoft}, |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
139 title = {markitdown: Convert documents to markdown}, |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
140 year = {2024}, |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
141 howpublished = {\url{https://github.com/microsoft/markitdown}} |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
142 } |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
143 </citation> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
144 </citations> |
|
5ad32046903b
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff
changeset
|
145 </tool> |
