diff --git a/tools/tertiary-analysis/decoupler/decoupler_aucell_score.py b/tools/tertiary-analysis/decoupler/decoupler_aucell_score.py index 248ce360..6d178509 100644 --- a/tools/tertiary-analysis/decoupler/decoupler_aucell_score.py +++ b/tools/tertiary-analysis/decoupler/decoupler_aucell_score.py @@ -109,15 +109,19 @@ def run_for_genelists( if __name__ == "__main__": # Create command-line arguments parser parser = argparse.ArgumentParser(description="Score genes using Aucell") - parser.add_argument("--input_file", type=str, help="Path to input AnnData file") - parser.add_argument("--output_file", type=str, help="Path to output file") + parser.add_argument( + "--input_file", type=str, help="Path to input AnnData file", required=True + ) + parser.add_argument( + "--output_file", type=str, help="Path to output file", required=True + ) parser.add_argument("--gmt_file", type=str, help="Path to GMT file", required=False) # add argument for gene sets to score parser.add_argument( "--gene_sets_to_score", type=str, required=False, - help="Comma separated list of gene sets to score (the need to be in the gmt file)", + help="Optional comma separated list of gene sets to score (the need to be in the gmt file)", ) # add argument for gene list (comma separated) to score parser.add_argument( @@ -137,6 +141,7 @@ def run_for_genelists( "--gene_symbols_field", type=str, help="Name of the gene symbols field in the AnnData object", + required=True, ) parser.add_argument("--use_raw", action="store_true", help="Use raw data") parser.add_argument( @@ -149,15 +154,15 @@ def run_for_genelists( # Load input AnnData object adata = anndata.read_h5ad(args.input_file) - if args.gene_sets_to_score is not None and args.gmt_file is not None: + if args.gmt_file is not None: # Load MSigDB file in GMT format msigdb = read_gmt(args.gmt_file) - gene_sets_to_score = args.gene_sets_to_score.split(",") + gene_sets_to_score = args.gene_sets_to_score.split(",") if args.gene_sets_to_score else [] # Score genes by their ensembl ids using the score_genes_aucell function for _, row in msigdb.iterrows(): gene_set_name = row["gene_set_name"] - if gene_set_name in gene_sets_to_score: + if not gene_sets_to_score or gene_set_name in gene_sets_to_score: genes = row["genes"].split(",") # Convert gene symbols to ensembl ids by using the columns gene_symbols and index in adata.var specific to the gene set ens_gene_ids = adata.var[ diff --git a/tools/tertiary-analysis/decoupler/decoupler_aucell_score.xml b/tools/tertiary-analysis/decoupler/decoupler_aucell_score.xml index b549e776..6b7b1d3c 100644 --- a/tools/tertiary-analysis/decoupler/decoupler_aucell_score.xml +++ b/tools/tertiary-analysis/decoupler/decoupler_aucell_score.xml @@ -1,5 +1,5 @@ - + scores cells using the AUCell method for gene sets. @@ -10,11 +10,13 @@ python '$__tool_directory__/decoupler_aucell_score.py' --input_file '$input_file' #if $gene_lists_source.source == "gmt" - --gmt_file '$gmt_file' - --gene_sets_to_score '$gene_sets_to_score' + --gmt_file '$gene_lists_source.gmt_file' + #if $gene_lists_source.gene_sets_to_score + --gene_sets_to_score '$gene_lists_source.gene_sets_to_score' + #end if #else: - --gene_lists_to_score '$gene_lists_to_score' - --score_names '$score_names' + --gene_lists_to_score '$gene_lists_source.gene_lists_to_score' + --score_names '$gene_lists_source.score_names' #end if --gene_symbols_field '$gene_symbols_field' $use_raw @@ -34,7 +36,7 @@ - + @@ -56,12 +58,27 @@ - - + + + + + + + + + + + + + + + + + @@ -72,12 +89,12 @@ - - + + @@ -88,12 +105,12 @@ - - + +