anndata_ops: anndata_operations.xml comparison

comparison anndata_operations.xml @ 22:fe75d2414dc0 draft

"planemo upload for repository https://github.com/ebi-gene-expression-group/container-galaxy-sc-tertiary/tree/develop/tools/tertiary-analysis/scanpy commit 8853a954bd9c343b3458479582f1f21c3981fef0-dirty"

author	ebi-gxa
date	Mon, 23 Aug 2021 11:32:48 +0000
parents	53a251c6d991
children	31e5e6d606ef

comparison

equal deleted inserted replaced

-:93ecc487a7d1
+:fe75d2414dc0
 <?xml version="1.0" encoding="utf-8"?>
-<tool id="anndata_ops" name="AnnData Operations" version="@TOOL_VERSION@+galaxy0" profile="@PROFILE@">
+<tool id="anndata_ops" name="AnnData Operations" version="@TOOL_VERSION@+galaxy1" profile="@PROFILE@">
 <description>modifies metadata and flags genes</description>
 <macros>
 <import>scanpy_macros2.xml</import>
 </macros>
 <expand macro="requirements"/>
 #if not $s.keep_original:
 del adata.obs['${s.from_obs}']
 #end if
 #end for
+#for $i, $s in enumerate($var_modifications)
+adata.var['${s.to_var}'] = adata.var['${s.from_var}']
+#if not $s.keep_original:
+del adata.var['${s.from_var}']
+#end if
+#end for
 gene_names = getattr(adata.var, gene_name)
 #for $i, $flag in enumerate($gene_flags)
 k_cat = gene_names.str.startswith('${flag.startswith}')
 if k_cat.sum() > 0:
 #if $copy_x.default and len($copy_x.xlayers) > 0:
 #for $i, $x_s in enumerate($copy_x.xlayers):
 ad_s = sc.read('x_source_${i}.h5')
 if adata.n_obs == ad_s.n_obs and all(adata.obs_names == ad_s.obs_names):
 #set xs=$copy_x.xlayers[$i]
 if "${xs.dest}" == '':
 logging.error("%sth destination layer for %sth X source not specified" % ("${i}", "${i}"))
 sys.exit(1)
 adata.layers["${xs.dest}"] = ad_s.X
 else:
 logging.error("X source ${i} AnnData file is not compatible to be merged to main AnnData file, different cell names.")
 #for $j, $l_key in enumerate($copy_l.layers):
 layers_to_copy = (k for k in ad_s.layers.keys() if "${l_key.contains}" in k)
 for l_to_copy in layers_to_copy:
 suffix=''
 if l_to_copy in adata.layers:
 suffix = "_${i}"
 adata.layers[l_to_copy+suffix] = ad_s.layers[l_to_copy]
 #end for
 else:
 logging.error("Layer source ${i} AnnData file is not compatible to be merged to main AnnData file, different cell names.")
 sys.exit(1)
 #for $j, $o_key in enumerate($copy_o.obs_keys):
 keys_to_copy = (k for k in ad_s.obs.keys() if "${o_key.contains}" in k)
 for k_to_copy in keys_to_copy:
 suffix=''
 if k_to_copy in adata.obs:
 suffix = "_${i}"
 adata.obs[[k_to_copy+suffix]] = ad_s.obs[[k_to_copy]]
 if k_to_copy in ad_s.uns.keys():
 adata.uns[k_to_copy+suffix] = ad_s.uns[k_to_copy]
 #end for
 else:
 </sanitizer>
 </param>
 <param name="to_obs" type="text" label="New name" help="New name in observations that you want to change"/>
 <param name="keep_original" type="boolean" label="Keep original" help="If activated, it will also keep the original column" checked="false"/>
 </repeat>
+<repeat name="var_modifications" title="Change field names in AnnData var" min="0">
+<param name="from_var" type="text" label="Original name" help="Name in var that you want to change">
+<sanitizer>
+<valid initial="string.printable"/>
+</sanitizer>
+</param>
+<param name="to_var" type="text" label="New name" help="New name in var that you want to change"/>
+<param name="keep_original" type="boolean" label="Keep original" help="If activated, it will also keep the original column" checked="false"/>
+</repeat>
 <param name="gene_symbols_field" value='index' type="text" label="Gene symbols field in AnnData" help="Field inside var.params where the gene symbols are, normally 'index' or 'gene_symbols'"/>
 <repeat name="gene_flags" title="Flag genes that start with these names">
 <param name="startswith" type="text" label="Starts with" help="Text that you expect the genes to be flagged to start with, such as 'MT-' for mito genes"/>
 <param name="flag" type="text" label="Var name" help="Name of the column in var.names where this boolean flag is stored, for example 'mito' for mitochondrial genes."/>
 </repeat>
 <test>
 <param name="input_obj_file" value="find_cluster.h5"/>
 <param name="input_format" value="anndata"/>
 <param name="color_by" value="louvain"/>
 <output name="output_h5ad" file="anndata_ops.h5" ftype="h5ad" compare="sim_size"/>
+</test>
+<test>
+<param name="input_obj_file" value="anndata_ops.h5"/>
+<param name="from_var" value = "gene_symbols" />
+<param name="to_var" value = "hello_all" />
+<output name="output_h5ad" ftype="h5ad">
+<assert_contents>
+<has_h5_keys keys="var/hello_all" />
+</assert_contents>
+</output>
 </test>
 <test>
 <param name="input_obj_file" value="find_cluster.h5"/>
 <param name="input_format" value="anndata"/>
 <conditional name="copy_r">
 Operations on AnnData objects
 =============================
 Performs the following operations:
-* Change observation fields, mostly for downstreaming processes convenience. Multiple fields can be changed as one.
+* Change observation/var fields, mostly for downstreaming processes convenience. Multiple fields can be changed as one.
 * Flag genes that start with a certain text: useful for flagging mitochondrial, spikes or other groups of genes.
 * For the flags created, calculates qc metrics (pct_<flag>_counts).
 * Calculates `n_genes`, `n_counts` for cells and `n_cells`, `n_counts` for genes.
 * For top <N> genes specified, calculate qc metrics (pct_counts_in_top_<N>_genes).
 * Copy from a set of compatible AnnData objects (same cells and genes):

Mercurial > repos > ebi-gxa > anndata_ops

comparison anndata_operations.xml @ 22:fe75d2414dc0 draft