cobraxy: COBRAxy/marea.py comparison

comparison COBRAxy/marea.py @ 143:507efdc9d226 draft

Uploaded

author	luca_milaz
date	Tue, 05 Nov 2024 21:42:17 +0000
parents	41f35c2f0c7b
children	a9a490ae198d

comparison

Legend: equal | deleted | inserted | replaced

-:accda943dfb9
+:507efdc9d226
 from PIL import Image
 import os
 import argparse
 import pyvips
 from typing import Tuple, Union, Optional, List, Dict
+import copy
 ERRORS = []
 ########################## argparse ##########################################
 ARGS :argparse.Namespace
 def process_args() -> argparse.Namespace:
 except (TypeError, ZeroDivisionError): continue
 return tmp, max_z_score
-def computeEnrichment(metabMap :ET.ElementTree, class_pat :Dict[str, List[List[float]]], ids :List[str], *, fromRAS = True) -> None:
+def computeEnrichment(metabMap: ET.ElementTree, class_pat: Dict[str, List[List[float]]], ids: List[str], *, fromRAS=True) -> List[Tuple[str, str, dict, float]]:
 """
 Compares clustered data based on a given comparison mode and applies enrichment-based styling on the
 provided metabolic map.
 Args:
 class_pat : the clustered data.
 ids : ids for data association.
 fromRAS : whether the data to enrich consists of RAS scores.
 Returns:
-None
+List[Tuple[str, str, dict, float]]: List of tuples with pairs of dataset names, comparison dictionary, and max z-score.
 Raises:
 sys.exit : if there are less than 2 classes for comparison
 Side effects:
-metabMap : mut
+metabMap : mutates based on calculated enrichment
-ids : mut
+"""
-"""
+class_pat = {k.strip(): v for k, v in class_pat.items()}
-class_pat = { k.strip() : v for k, v in class_pat.items() }
+if (not class_pat) or (len(class_pat.keys()) < 2):
-#TODO: simplfy this stuff vvv and stop using sys.exit (raise the correct utils error)
+sys.exit('Execution aborted: classes provided for comparisons are less than two\n')
-if (not class_pat) or (len(class_pat.keys()) < 2): sys.exit('Execution aborted: classes provided for comparisons are less than two\n')
+enrichment_results = []
 if ARGS.comparison == "manyvsmany":
 for i, j in it.combinations(class_pat.keys(), 2):
-#TODO: these 2 functions are always called in pair and in this order and need common data,
-# some clever refactoring would be appreciated.
 comparisonDict, max_z_score = compareDatasetPair(class_pat.get(i), class_pat.get(j), ids)
-temp_thingsInCommon(comparisonDict, metabMap, max_z_score, i, j, fromRAS)
+enrichment_results.append((i, j, comparisonDict, max_z_score))
 elif ARGS.comparison == "onevsrest":
 for single_cluster in class_pat.keys():
-t :List[List[List[float]]] = []
+rest = [item for k, v in class_pat.items() if k != single_cluster for item in v]
-for k in class_pat.keys():
-if k != single_cluster:
-t.append(class_pat.get(k))
-rest :List[List[float]] = []
-for i in t:
-rest = rest + i
 comparisonDict, max_z_score = compareDatasetPair(class_pat.get(single_cluster), rest, ids)
-temp_thingsInCommon(comparisonDict, metabMap, max_z_score, single_cluster, fromRAS)
+enrichment_results.append((single_cluster, "rest", comparisonDict, max_z_score))
 elif ARGS.comparison == "onevsmany":
 controlItems = class_pat.get(ARGS.control)
 for otherDataset in class_pat.keys():
-if otherDataset == ARGS.control: continue
+if otherDataset == ARGS.control:
+continue
 comparisonDict, max_z_score = compareDatasetPair(controlItems, class_pat.get(otherDataset), ids)
-temp_thingsInCommon(comparisonDict, metabMap, max_z_score, ARGS.control, otherDataset, fromRAS)
+enrichment_results.append((ARGS.control, otherDataset, comparisonDict, max_z_score))
-def createOutputMaps(dataset1Name :str, dataset2Name :str, core_map :ET.ElementTree) -> None:
+return enrichment_results
-svgFilePath = buildOutputPath(dataset1Name, dataset2Name, details = "SVG Map", ext = utils.FileFormat.SVG)
+def createOutputMaps(dataset1Name: str, dataset2Name: str, core_map: ET.ElementTree) -> None:
+svgFilePath = buildOutputPath(dataset1Name, dataset2Name, details="SVG Map", ext=utils.FileFormat.SVG)
 utils.writeSvg(svgFilePath, core_map)
 if ARGS.generate_pdf:
-pngPath = buildOutputPath(dataset1Name, dataset2Name, details = "PNG Map", ext = utils.FileFormat.PNG)
+pngPath = buildOutputPath(dataset1Name, dataset2Name, details="PNG Map", ext=utils.FileFormat.PNG)
-pdfPath = buildOutputPath(dataset1Name, dataset2Name, details = "PDF Map", ext = utils.FileFormat.PDF)
+pdfPath = buildOutputPath(dataset1Name, dataset2Name, details="PDF Map", ext=utils.FileFormat.PDF)
 convert_to_pdf(svgFilePath, pngPath, pdfPath)
-if not ARGS.generate_svg: os.remove(svgFilePath.show())
+if not ARGS.generate_svg:
+os.remove(svgFilePath)
 ClassPat = Dict[str, List[List[float]]]
 def getClassesAndIdsFromDatasets(datasetsPaths :List[str], datasetPath :str, classPath :str, names :List[str]) -> Tuple[List[str], ClassPat]:
 # TODO: I suggest creating dicts with ids as keys instead of keeping class_pat and ids separate,
 # for the sake of everyone's sanity.
 None
 Raises:
 sys.exit : if a user-provided custom map is in the wrong format (ET.XMLSyntaxError, ET.XMLSchemaParseError)
 """
 global ARGS
 ARGS = process_args()
-if os.path.isdir('result') == False: os.makedirs('result')
+if not os.path.isdir('result'):
+os.makedirs('result')
-core_map :ET.ElementTree = ARGS.choice_map.getMap(
+core_map: ET.ElementTree = ARGS.choice_map.getMap(
 ARGS.tool_dir,
 utils.FilePath.fromStrPath(ARGS.custom_map) if ARGS.custom_map else None)
-# TODO: ^^^ ugly but fine for now, the argument is None if the model isn't custom because no file was given.
-# getMap will None-check the customPath and panic when the model IS custom but there's no file (good). A cleaner
-# solution can be derived from my comment in FilePath.fromStrPath
 if ARGS.using_RAS:
 ids, class_pat = getClassesAndIdsFromDatasets(ARGS.input_datas, ARGS.input_data, ARGS.input_class, ARGS.names)
-computeEnrichment(core_map, class_pat, ids)
+enrichment_results = computeEnrichment(core_map, class_pat, ids)
+for i, j, comparisonDict, max_z_score in enrichment_results:
+map_copy = copy.deepcopy(core_map)
+temp_thingsInCommon(comparisonDict, map_copy, max_z_score, i, j, fromRAS=True)
+createOutputMaps(i, j, map_copy)
 if ARGS.using_RPS:
 ids, class_pat = getClassesAndIdsFromDatasets(ARGS.input_datas_rps, ARGS.input_data_rps, ARGS.input_class_rps, ARGS.names_rps)
-computeEnrichment(core_map, class_pat, ids, fromRAS = False)
+enrichment_results = computeEnrichment(core_map, class_pat, ids, fromRAS=False)
+for i, j, comparisonDict, max_z_score in enrichment_results:
-# create output files: TODO: this is the same comparison happening in "maps", find a better way to organize this
+map_copy = copy.deepcopy(core_map)
-if ARGS.comparison == "manyvsmany":
+temp_thingsInCommon(comparisonDict, map_copy, max_z_score, i, j, fromRAS=False)
-for i, j in it.combinations(class_pat.keys(), 2): createOutputMaps(i, j, core_map)
+createOutputMaps(i, j, map_copy)
-return
+print('Execution succeeded')
-if ARGS.comparison == "onevsrest":
-for single_cluster in class_pat.keys(): createOutputMaps(single_cluster, "rest", core_map)
-return
-for otherDataset in class_pat.keys():
-if otherDataset != ARGS.control: createOutputMaps(i, j, core_map)
-if not ERRORS: return
-utils.logWarning(
-f"The following reaction IDs were mentioned in the dataset but weren't found in the map: {ERRORS}",
-ARGS.out_log)
-print('Execution succeded')
 ###############################################################################
 if __name__ == "__main__":
 main()

Mercurial > repos > bimib > cobraxy

comparison COBRAxy/marea.py @ 143:507efdc9d226 draft