cobraxy: COBRAxy/utils/model_utils.py comparison

comparison COBRAxy/utils/model_utils.py @ 503:8dd07e59f631 draft

Uploaded

author	francesco_lapi
date	Tue, 30 Sep 2025 18:01:30 +0000
parents	9bfd1ec3ae6f
children	96f512dff490

comparison

equal deleted inserted replaced

-:054c872e3880
+:8dd07e59f631
 max_pathways = 0
 reaction_pathways = {}
 for reaction in model.reactions:
 # Get unique pathways from all metabolites in the reaction
-if type(reaction.annotation['pathways']) == list:
+if 'pathways' in reaction.annotation:
-reaction_pathways[reaction.id] = reaction.annotation['pathways']
+if type(reaction.annotation['pathways']) == list:
-max_pathways = max(max_pathways, len(reaction.annotation['pathways']))
+reaction_pathways[reaction.id] = reaction.annotation['pathways']
+max_pathways = max(max_pathways, len(reaction.annotation['pathways']))
+else:
+reaction_pathways[reaction.id] = [reaction.annotation['pathways']]
 else:
-reaction_pathways[reaction.id] = [reaction.annotation['pathways']]
+# No pathway annotation - use empty list
+reaction_pathways[reaction.id] = []
 # Create column names for pathways
 pathway_columns = [f"Pathway_{i+1}" for i in range(max_pathways)]
 # Second pass: create the data
 logger.warning("Mapping dataframe is empty for the requested source genes; skipping uniqueness validation.")
 return
 # normalize temporary columns for grouping (without altering the original df)
 tmp = mapping_df[[source_col, target_col]].copy()
-tmp['_src_norm'] = tmp[source_col].astype(str).map(_normalize_gene_id)
+tmp['_src_norm'] = tmp[source_col].astype(str).apply(_normalize_gene_id)
 tmp['_tgt_norm'] = tmp[target_col].astype(str).str.strip()
 # optionally filter to the set of model source genes
 if model_source_genes is not None:
 tmp = tmp[tmp['_src_norm'].isin(model_source_genes)]
 model_source_genes = { _normalize_gene_id(g.id) for g in model.genes }
 logger.info(f"Filtering mapping to {len(model_source_genes)} source genes present in model (normalized).")
 tmp_map = mapping_df[[col_for_src, col_for_tgt]].dropna().copy()
-tmp_map[col_for_src + "_norm"] = tmp_map[col_for_src].astype(str).map(_normalize_gene_id)
+tmp_map[col_for_src + "_norm"] = tmp_map[col_for_src].astype(str).apply(_normalize_gene_id)
 filtered_map = tmp_map[tmp_map[col_for_src + "_norm"].isin(model_source_genes)].copy()
 if filtered_map.empty:
 logger.warning("No mapping rows correspond to source genes present in the model after filtering. Proceeding with empty mapping (no translation will occur).")
 Build mapping dict: source_id -> list of target_ids
 Normalizes IDs (removes prefixes like 'HGNC:' etc).
 """
 df = mapping_df[[source_col, target_col]].dropna().copy()
 # normalize to string
-df[source_col] = df[source_col].astype(str).map(_normalize_gene_id)
+df[source_col] = df[source_col].astype(str).apply(_normalize_gene_id)
 df[target_col] = df[target_col].astype(str).str.strip()
 df = df.drop_duplicates()
 logger.info(f"Creating mapping from {len(df)} rows")

Mercurial > repos > bimib > cobraxy

comparison COBRAxy/utils/model_utils.py @ 503:8dd07e59f631 draft