Mercurial > repos > iuc > scanpy_normalize
comparison normalize.xml @ 13:7b9fafe32c86 draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/scanpy/ commit 3974c0ff86bb1d6633281f29dfb4c605a74e1e6e
author | iuc |
---|---|
date | Thu, 14 Mar 2024 15:37:29 +0000 |
parents | 94c19fb1281c |
children | d844935c906c |
comparison
equal
deleted
inserted
replaced
12:94c19fb1281c | 13:7b9fafe32c86 |
---|---|
1 <tool id="scanpy_normalize" name="Normalize" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@profile@"> | 1 <tool id="scanpy_normalize" name="Normalize" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@profile@"> |
2 <description>with scanpy</description> | 2 <description>and impute with scanpy</description> |
3 <macros> | 3 <macros> |
4 <import>macros.xml</import> | 4 <import>macros.xml</import> |
5 </macros> | 5 </macros> |
6 <expand macro="bio_tools"/> | 6 <expand macro="bio_tools"/> |
7 <expand macro="requirements"/> | 7 <expand macro="requirements"/> |
63 adata=adata, | 63 adata=adata, |
64 log=$method.log, | 64 log=$method.log, |
65 plot=False, | 65 plot=False, |
66 copy=False) | 66 copy=False) |
67 | 67 |
68 #else if $method.method == "external.pp.magic" | |
69 sc.external.pp.magic( | |
70 adata=adata, | |
71 name_list='$method.name_list', | |
72 knn=$method.knn, | |
73 #if str($method.decay) != '' | |
74 decay=$method.decay, | |
75 #end if | |
76 #if str($method.knn_max) != '' | |
77 knn_max=$method.knn_max, | |
78 #end if | |
79 #if $method.t == -1 | |
80 t='auto', | |
81 #else | |
82 t=$method.t, | |
83 #end if | |
84 #if str($method.n_pca) != '' | |
85 n_pca=$method.n_pca, | |
86 #end if | |
87 solver='$method.solver', | |
88 knn_dist='$method.knn_dist', | |
89 random_state=$method.random_state, | |
90 copy=False) | |
68 #end if | 91 #end if |
69 | 92 |
70 @CMD_anndata_write_outputs@ | 93 @CMD_anndata_write_outputs@ |
71 | 94 |
72 ]]></configfile> | 95 ]]></configfile> |
77 <param argument="method" type="select" label="Method used for normalization"> | 100 <param argument="method" type="select" label="Method used for normalization"> |
78 <option value="pp.normalize_total">Normalize counts per cell, using 'pp.normalize_total'</option> | 101 <option value="pp.normalize_total">Normalize counts per cell, using 'pp.normalize_total'</option> |
79 <option value="pp.recipe_zheng17">Normalization and filtering as of Zheng et al. (2017), using 'pp.recipe_zheng17'</option> | 102 <option value="pp.recipe_zheng17">Normalization and filtering as of Zheng et al. (2017), using 'pp.recipe_zheng17'</option> |
80 <option value="pp.recipe_weinreb17">Normalization and filtering as of Weinreb et al (2017), using 'pp.recipe_weinreb17'</option> | 103 <option value="pp.recipe_weinreb17">Normalization and filtering as of Weinreb et al (2017), using 'pp.recipe_weinreb17'</option> |
81 <option value="pp.recipe_seurat">Normalization and filtering as of Seurat et al (2015), using 'pp.recipe_seurat'</option> | 104 <option value="pp.recipe_seurat">Normalization and filtering as of Seurat et al (2015), using 'pp.recipe_seurat'</option> |
105 <option value="external.pp.magic">Denoising using Markov Affinity-based Graph Imputation of Cells (MAGIC) API 'external.pp.magic'</option> | |
82 </param> | 106 </param> |
83 <when value="pp.normalize_total"> | 107 <when value="pp.normalize_total"> |
84 <param argument="target_sum" type="float" value="" optional="true" label="Target sum" help="If not provided, after normalization, each observation (cell) has a total count equal to the median of the total counts (cells) before normalization."/> | 108 <param argument="target_sum" type="float" value="" optional="true" label="Target sum" help="If not provided, after normalization, each observation (cell) has a total count equal to the median of the total counts (cells) before normalization."/> |
85 <conditional name="exclude_highly_expressed"> | 109 <conditional name="exclude_highly_expressed"> |
86 <param argument="exclude_highly_expressed" type="select" label="Exclude (very) highly expressed genes for the computation of the normalization factor (size factor) for each cell" help=" A gene is considered highly expressed, if it has more than max_fraction of the total counts in at least one cell. The not-excluded genes will sum up to target_sum"> | 110 <param argument="exclude_highly_expressed" type="select" label="Exclude (very) highly expressed genes for the computation of the normalization factor (size factor) for each cell" help=" A gene is considered highly expressed, if it has more than max_fraction of the total counts in at least one cell. The not-excluded genes will sum up to target_sum"> |
117 <expand macro="pca_random_state"/> | 141 <expand macro="pca_random_state"/> |
118 </when> | 142 </when> |
119 <when value="pp.recipe_seurat"> | 143 <when value="pp.recipe_seurat"> |
120 <expand macro="param_log"/> | 144 <expand macro="param_log"/> |
121 </when> | 145 </when> |
146 <when value="external.pp.magic"> | |
147 <param name="name_list" type="select" label="Denoised genes to return" help="Selecting all genes may require a large amount of memory"> | |
148 <option value="all_genes">All genes</option> | |
149 <option value="pca_only">PCA only</option> | |
150 </param> | |
151 <param argument="knn" type="integer" min="1" value="5" label="Number of nearest neighbors on which to build kernel" help=""/> | |
152 <param argument="decay" type="integer" optional="true" value="1" label="Set decay rate of kernel tails" | |
153 help="If not set, alpha decaying kernel is not used" /> | |
154 <param argument="knn_max" type="integer" min="1" optional="true" value="" label="Maximum number of nearest neighbors with nonzero connection" | |
155 help="If not set, will be set to 3 * knn" /> | |
156 <param argument="t" type="integer" min="-1" value="3" label="Power to which the diffusion operator is powered. This sets the level of diffusion" | |
157 help="If ‘-1’, this parameter is selected according to the Procrustes disparity of the diffused data." /> | |
158 <param argument="n_pca" type="integer" value="100" optional="true" label="Number of principal components to use for calculating neighborhoods" | |
159 help="For extremely large datasets, using n_pca less than 20 allows neighborhoods to be calculated in roughly log(n_samples) time. If not set, no PCA is performed." /> | |
160 <param name="solver" type="select" label="Which solver to use" help="Selecting all genes may require a large amount of memory"> | |
161 <option value="exact">"exact", the implementation described in van Dijk et al. (2018) </option> | |
162 <option value="approximate">"approximate", is faster that performs imputation in the PCA space and then projects back to the gene space</option> | |
163 </param> | |
164 <param name="knn_dist" type="select" label="Distance metric to use for the data" help="See scipy.spatial.distance.pdist documentation for more options https://docs.scipy.org/doc/scipy/reference/generated/scipy.spatial.distance.pdist.html"> | |
165 <expand macro="distance_metric_options"/> | |
166 </param> | |
167 <expand macro="param_random_state"/> | |
168 </when> | |
122 </conditional> | 169 </conditional> |
123 <expand macro="inputs_common_advanced"/> | 170 <expand macro="inputs_common_advanced"/> |
124 </inputs> | 171 </inputs> |
125 <outputs> | 172 <outputs> |
126 <expand macro="anndata_outputs"/> | 173 <expand macro="anndata_outputs"/> |
215 <has_text_matching expression="log=True"/> | 262 <has_text_matching expression="log=True"/> |
216 </assert_contents> | 263 </assert_contents> |
217 </output> | 264 </output> |
218 <output name="anndata_out" file="pp.recipe_seurat.recipe_zheng17.h5ad" ftype="h5ad" compare="sim_size" delta="1000000" delta_frac="0.25"/> | 265 <output name="anndata_out" file="pp.recipe_seurat.recipe_zheng17.h5ad" ftype="h5ad" compare="sim_size" delta="1000000" delta_frac="0.25"/> |
219 </test> | 266 </test> |
267 <test expect_num_outputs="2"> | |
268 <!-- test 5 --> | |
269 <param name="adata" value="krumsiek11.h5ad" /> | |
270 <conditional name="method"> | |
271 <param name="method" value="external.pp.magic"/> | |
272 <param name="name_list" value="all_genes"/> | |
273 <param name="t" value="-1"/> | |
274 <param name="n_pca" value="5"/> | |
275 </conditional> | |
276 <section name="advanced_common"> | |
277 <param name="show_log" value="true" /> | |
278 </section> | |
279 <output name="hidden_output"> | |
280 <assert_contents> | |
281 <has_text_matching expression="external.pp.magic"/> | |
282 <has_text_matching expression="name_list='all_genes'"/> | |
283 <has_text_matching expression="t='auto'"/> | |
284 <has_text_matching expression="n_pca=5"/> | |
285 </assert_contents> | |
286 </output> | |
287 <output name="anndata_out" file="external.pp.magic.all_genes.krumsiek11.h5ad" ftype="h5ad" compare="sim_size"/> | |
288 </test> | |
289 <test expect_num_outputs="2"> | |
290 <!-- test 6 --> | |
291 <param name="adata" value="krumsiek11.h5ad" /> | |
292 <conditional name="method"> | |
293 <param name="method" value="external.pp.magic"/> | |
294 <param name="name_list" value="pca_only"/> | |
295 <param name="t" value="3"/> | |
296 <param name="n_pca" value="5"/> | |
297 </conditional> | |
298 <section name="advanced_common"> | |
299 <param name="show_log" value="true" /> | |
300 </section> | |
301 <output name="hidden_output"> | |
302 <assert_contents> | |
303 <has_text_matching expression="external.pp.magic"/> | |
304 <has_text_matching expression="name_list='pca_only'"/> | |
305 <has_text_matching expression="t=3"/> | |
306 <has_text_matching expression="n_pca=5"/> | |
307 </assert_contents> | |
308 </output> | |
309 <output name="anndata_out" file="external.pp.magic.pca_only.krumsiek11.h5ad" ftype="h5ad" compare="sim_size"/> | |
310 <assert_stdout> | |
311 <has_text text="X_magic"/> | |
312 </assert_stdout> | |
313 </test> | |
220 </tests> | 314 </tests> |
221 <help><![CDATA[ | 315 <help><![CDATA[ |
222 Normalize total counts per cell (`pp.normalize_per_cell`) | 316 Normalize total counts per cell (`pp.normalize_per_cell`) |
223 ========================================================= | 317 ========================================================= |
224 | 318 |
267 Expects non-logarithmized data. If using logarithmized data, pass `log=False`. | 361 Expects non-logarithmized data. If using logarithmized data, pass `log=False`. |
268 | 362 |
269 More details on the `scanpy documentation | 363 More details on the `scanpy documentation |
270 <https://icb-scanpy.readthedocs-hosted.com/en/stable/api/scanpy.pp.recipe_seurat.html>`__ | 364 <https://icb-scanpy.readthedocs-hosted.com/en/stable/api/scanpy.pp.recipe_seurat.html>`__ |
271 | 365 |
366 | |
367 Markov Affinity-based Graph Imputation of Cells (MAGIC) as of Van Dijk D et al. (2018) (`external.pp.magic`) | |
368 ============================================================================================================ | |
369 | |
370 MAGIC is an algorithm for denoising and transcript recover of single cells applied to single-cell sequencing data. MAGIC builds a graph from the data and uses diffusion to smooth out noise and recover the data manifold. | |
371 | |
372 The algorithm implemented here has changed primarily in two ways compared to the algorithm described in Van Dijk D et al. (2018). | |
373 | |
374 - Firstly, we use the adaptive kernel described in Moon et al, (2019) for improved stability. | |
375 - Secondly, data diffusion is applied in the PCA space, rather than the data space, for speed and memory improvements. | |
376 | |
377 More details on the `scanpy documentation | |
378 <https://icb-scanpy.readthedocs-hosted.com/en/stable/api/scanpy.external.pp.magic.html>`__ | |
379 | |
272 ]]></help> | 380 ]]></help> |
273 <expand macro="citations"/> | 381 <expand macro="citations"/> |
274 </tool> | 382 </tool> |