annotate markitdown.xml @ 1:f6fa7e70120f draft

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit 1df47411ce8651c1d4f68cd032b2afe7d5a721de
author bgruening
date Mon, 13 Oct 2025 13:22:13 +0000
parents 5ad32046903b
children 4926706c13db
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
f6fa7e70120f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit 1df47411ce8651c1d4f68cd032b2afe7d5a721de
bgruening
parents: 0
diff changeset
1 <tool id="markitdown" name="Markitdown" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@">
0
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
2 <description>Convert documents to Markdown</description>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
3 <macros>
1
f6fa7e70120f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit 1df47411ce8651c1d4f68cd032b2afe7d5a721de
bgruening
parents: 0
diff changeset
4 <token name="@TOOL_VERSION@">0.1.3</token>
f6fa7e70120f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit 1df47411ce8651c1d4f68cd032b2afe7d5a721de
bgruening
parents: 0
diff changeset
5 <token name="@VERSION_SUFFIX@">0</token>
f6fa7e70120f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit 1df47411ce8651c1d4f68cd032b2afe7d5a721de
bgruening
parents: 0
diff changeset
6 <token name="@PROFILE@">23.0</token>
0
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
7 </macros>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
8 <requirements>
1
f6fa7e70120f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit 1df47411ce8651c1d4f68cd032b2afe7d5a721de
bgruening
parents: 0
diff changeset
9 <requirement type="package" version="3.12">python</requirement>
f6fa7e70120f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit 1df47411ce8651c1d4f68cd032b2afe7d5a721de
bgruening
parents: 0
diff changeset
10 <requirement type="package" version="@TOOL_VERSION@">markitdown</requirement>
0
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
11 </requirements>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
12
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
13 <command detect_errors="exit_code"><![CDATA[
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
14 #set ext_map = {
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
15 'pdf': 'pdf', 'docx': 'docx', 'pptx': 'pptx', 'xlsx': 'xlsx',
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
16 'html': 'html', 'txt': 'txt', 'ipynb': 'ipynb',
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
17 'markdown': 'md', 'zip': 'zip', 'tabular': 'csv', 'csv': 'csv'
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
18 }
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
19 ## ext_map translates the input's Galaxy datatype extension into the value passed to markitdown via -x; datatypes missing from the map yield ''.
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
20 #set file_ext = ext_map.get($input.ext, '')
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
21 #set final_ext = $ext_hint if $ext_hint else $file_ext
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
22 ## A user-supplied ext_hint wins over the mapped extension. Each optional flag below is emitted only when it has a value, and every interpolated value is single-quoted for the shell.
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
23 markitdown
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
24 '$input'
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
25 #if $final_ext# -x '$final_ext' #end if#
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
26 #if $mime_type:
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
27 -m '$mime_type'
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
28 #end if
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
29 #if $charset:
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
30 -c '$charset'
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
31 #end if
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
32 $keep_data_uris
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
33 -o '$output'
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
34 ]]></command>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
35
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
36 <inputs>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
37 <param name="input" type="data" format="pdf,docx,pptx,xlsx,html,txt,ipynb,markdown,zip,tabular"
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
38 label="Input file"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
39 <param name="ext_hint" type="text" optional="true" label="Extension override"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
40 <param name="mime_type" type="text" optional="true" label="MIME type hint"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
41 <param name="charset" type="text" optional="true" label="Character set (e.g. UTF-8)"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
42 <param name="keep_data_uris" type="boolean" truevalue="--keep-data-uris" falsevalue="" label="Keep embedded data URIs"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
43 </inputs>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
44
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
45 <outputs>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
46 <data name="output" format="markdown" label="Converted Markdown output"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
47 </outputs>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
48
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
49 <tests>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
50 <test>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
51 <param name="input" value="EAR.pdf" ftype="pdf"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
52 <output name="output">
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
53 <assert_contents>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
54 <has_text text="Tags: ERGA-BGE"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
55 <has_text text="Lineage: mammalia_odb10"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
56 </assert_contents>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
57 </output>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
58 </test>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
59
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
60 <test>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
61 <param name="input" value="example.docx" ftype="docx"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
62 <output name="output">
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
63 <assert_contents>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
64 <has_text text="# Lorem ipsum dolor sit amet, consectetur adipiscing elit."/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
65 </assert_contents>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
66 </output>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
67 </test>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
68
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
69 <!--test>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
70 <param name="input" value="example.odt"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
71 <param name="ext_hint" value="odt"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
72 <output name="output">
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
73 <assert_contents>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
74 <has_text text="This is a Word document"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
75 </assert_contents>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
76 </output>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
77 </test-->
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
78
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
79 <test>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
80 <param name="input" value="report_4.html" ftype="html"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
81 <param name="keep_data_uris" value="true"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
82 <output name="output">
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
83 <assert_contents>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
84 <has_text text="is the contig length such that using longer or equal length contigs produces"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
85 </assert_contents>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
86 </output>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
87 </test>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
88
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
89 <test>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
90 <param name="input" value="example.txt" ftype="txt"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
91 <param name="ext_hint" value="txt"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
92 <output name="output">
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
93 <assert_contents>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
94 <has_text text="This is a plain text file"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
95 </assert_contents>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
96 </output>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
97 </test>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
98
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
99 <test>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
100 <param name="input" value="example.ipynb" ftype="ipynb"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
101 <output name="output">
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
102 <assert_contents>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
103 <has_text text="print(&quot;Hello, world!&quot;)"/>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
104 </assert_contents>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
105 </output>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
106 </test>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
107 </tests>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
108
1
f6fa7e70120f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit 1df47411ce8651c1d4f68cd032b2afe7d5a721de
bgruening
parents: 0
diff changeset
109 <help format="markdown"><![CDATA[
f6fa7e70120f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit 1df47411ce8651c1d4f68cd032b2afe7d5a721de
bgruening
parents: 0
diff changeset
110
0
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
111 **Markitdown** converts rich document formats (PDF, DOCX, HTML, etc.) to Markdown.
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
112
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
113 ---
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
114
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
115 ### Supported Formats:
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
116
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
117 - PDF, DOCX, PPTX, XLSX
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
118 - HTML, TXT, Markdown
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
119 - Jupyter Notebooks (IPYNB)
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
120 - ZIP containing supported formats
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
121 - Tabular (CSV)
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
122
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
123 ---
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
124
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
125 ### Options:
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
126
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
127 - **Extension override** (`-x`): hint for file type if not obvious
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
128 - **MIME type** (`-m`): manual MIME hint
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
129 - **Charset** (`-c`): text encoding hint
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
130 - **Keep data URIs**: retain base64-encoded images
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
131
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
132 Project: https://github.com/microsoft/markitdown
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
133 ]]></help>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
134
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
135 <citations>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
136 <citation type="bibtex">
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
137 @misc{markitdown2024,
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
138 author = {Microsoft},
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
139 title = {markitdown: Convert documents to markdown},
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
140 year = {2024},
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
141 howpublished = {\url{https://github.com/microsoft/markitdown}}
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
142 }
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
143 </citation>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
144 </citations>
5ad32046903b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/markitdown commit aaa9d49fda30d2aaf99030ff8a099d890a7c1d01
bgruening
parents:
diff changeset
145 </tool>