cobraxy: COBRAxy/marea_cluster.py comparison

comparison COBRAxy/marea_cluster.py @ 309:38c9a958ea78 draft

Uploaded

author	francesco_lapi
date	Thu, 22 May 2025 16:03:37 +0000
parents	4a677fc67aeb
children	4599fb23f25b

comparison

Legend: equal | deleted | inserted | replaced

-:797d0e002934
+:38c9a958ea78
 default = 7,
 help = 'choose maximum cluster number to be generated')
 parser.add_argument('-el', '--elbow',
 type = str,
-default = 'false',
+default = 'False',
-choices = ['true', 'false'],
+choices = ['True', 'False'],
 help = 'choose if you want to generate an elbow plot for kmeans')
 parser.add_argument('-si', '--silhouette',
 type = str,
-default = 'false',
+default = 'False',
-choices = ['true', 'false'],
+choices = ['True', 'False'],
 help = 'choose if you want silhouette plots')
 parser.add_argument('-td', '--tool_dir',
 type = str,
 required = True,
 help = 'your tool directory')
 parser.add_argument('-ms', '--min_samples',
-type = float,
+type = int,
 help = 'min samples for dbscan (optional)')
 parser.add_argument('-ep', '--eps',
 type = float,
 help = 'eps for dbscan (optional)')
 s (str): The warning message to be logged and printed.
 Returns:
 None
 """
-args = process_args(sys.argv)
 with open(args.out_log, 'a') as log:
 log.write(s + "\n\n")
 print(s)
 ########################## read dataset ######################################
 Args:
 k_min (int): The minimum number of clusters to consider.
 k_max (int): The maximum number of clusters to consider.
 dataset (pandas.DataFrame): The dataset to perform clustering on.
-elbow (str): Whether to generate an elbow plot for kmeans ('true' or 'false').
+elbow (str): Whether to generate an elbow plot for kmeans ('True' or 'False').
-silhouette (str): Whether to generate silhouette plots ('true' or 'false').
+silhouette (str): Whether to generate silhouette plots ('True' or 'False').
 best_cluster (str): The file path to save the output of the best cluster.
 Returns:
 None
 """
 if not os.path.exists(args.output_path):
 os.makedirs(args.output_path)
-if elbow == 'true':
+if elbow == 'True':
 elbow = True
 else:
 elbow = False
-if silhouette == 'true':
+if silhouette == 'True':
 silhouette = True
 else:
 silhouette = False
 range_n_clusters = [i for i in range(k_min, k_max+1)]
 Args:
 dataset (pandas.DataFrame): The dataset to be clustered.
 k_min (int): The minimum number of clusters to consider.
 k_max (int): The maximum number of clusters to consider.
 best_cluster (str): The file path to save the output of the best cluster.
-silhouette (str): Whether to generate silhouette plots ('true' or 'false').
+silhouette (str): Whether to generate silhouette plots ('True' or 'False').
 Returns:
 None
 """
 if not os.path.exists(args.output_path):
 for i in range(len(labels)):
 prefix = ''
 if (i + k_min == best):
 prefix = '_BEST'
-if silhouette == 'true':
+if silhouette == 'True':
 silhouette_draw(dataset, labels[i], i + k_min, f'{args.output_path}/silhouette_with_' + str(i + k_min) + prefix + '_clusters.png')
 for i in range(len(labels)):
 if (i + k_min == best):
 labels = labels[i]

Mercurial > repos > bimib > cobraxy

comparison COBRAxy/marea_cluster.py @ 309:38c9a958ea78 draft