@@ -30,7 +30,7 @@ def generate(
3030 dir_okay = False ,
3131 readable = True ,
3232 resolve_path = True ,
33- help = "CSV file containing protein sequences" ,
33+ help = "Path to and file name of the CSV file containing protein sequences. " ,
3434 ),
3535 output_dir : Path = typer .Argument (
3636 ...,
@@ -39,78 +39,80 @@ def generate(
3939 dir_okay = True ,
4040 writable = True ,
4141 resolve_path = True ,
42- help = "Output directory for generated MSA files" ,
42+ help = "Output directory for generated MSA files. " ,
4343 ),
4444 sequence_column : str | None = typer .Option (
4545 None ,
4646 "--sequence-column" ,
4747 "-c" ,
48- help = "Name of column containing sequences (required if CSV has multiple columns)" ,
48+ help = "Name of column containing sequences (required if CSV has multiple columns). " ,
4949 ),
5050 # MSAGenerationConfig parameters
5151 sharding_pattern : str = typer .Option (
5252 "/0:2/" ,
5353 "--sharding-pattern" ,
5454 "-s" ,
55- help = "Directory sharding pattern (e.g., '/0:2/')" ,
55+ help = "Directory sharding pattern (e.g., '/0:2/'). " ,
5656 ),
5757 output_extension : str = typer .Option (
5858 MSAFileExtension .A3M_GZ .value ,
5959 "--output-extension" ,
6060 "-o" ,
61- help = "Output file extension (.a3m, .a3m.gz, .a3m.zst, .afa, .afa.gz, .afa.zst)" ,
61+ help = "Output file extension (.a3m, .a3m.gz, .a3m.zst, .afa, .afa.gz, .afa.zst). " ,
6262 ),
6363 gpu : bool | None = typer .Option (
6464 None ,
6565 "--gpu/--no-gpu" ,
66- help = "Use GPU acceleration (auto-detects if not specified)" ,
66+ help = "Use GPU acceleration (auto-detects if not specified). " ,
6767 ),
6868 num_iterations : int = typer .Option (
6969 3 ,
7070 "--num-iterations" ,
7171 "-n" ,
72- help = "Number of MMseqs2 search iterations" ,
72+ help = "Number of MMseqs2 search iterations. " ,
7373 ),
7474 max_final_sequences : int = typer .Option (
7575 10_000 ,
7676 "--max-final-sequences" ,
77- help = "Maximum number of sequences in final MSAs" ,
77+ help = "Maximum number of sequences in final MSAs. " ,
7878 ),
7979 use_env : bool = typer .Option (
8080 True ,
8181 "--use-env/--no-env" ,
82- help = "Include environmental (metagenomic) database" ,
82+ help = "Include environmental (metagenomic) database. " ,
8383 ),
8484 num_workers : int = typer .Option (
8585 32 ,
8686 "--num-workers" ,
8787 "-j" ,
88- help = "Number of CPU threads" ,
88+ help = "Number of CPU threads. " ,
8989 ),
9090 sensitivity : float | None = typer .Option (
9191 8.0 ,
9292 "--sensitivity" ,
93- help = "MMseqs2 sensitivity (lower = faster, sparser MSAs)" ,
93+ help = "MMseqs2 sensitivity (lower = faster, sparser MSAs). " ,
9494 ),
9595 verbose : bool = typer .Option (
9696 False ,
9797 "--verbose" ,
9898 "-v" ,
99- help = "Enable verbose logging" ,
99+ help = "Enable verbose logging. " ,
100100 ),
101101 check_existing : bool = typer .Option (
102102 False ,
103103 "--check-existing/--no-check-existing" ,
104- help = "Check for existing MSAs before generation" ,
104+ help = "Check for existing MSAs before generation. " ,
105105 ),
106106 existing_msa_dirs : str | None = typer .Option (
107107 None ,
108108 "--existing-msa-dirs" ,
109- help = "Comma-separated MSA directories to check (uses LOCAL_MSA_DIRS env var if not specified)" ,
109+ help = "Comma-separated list of MSA directories to check (uses LOCAL_MSA_DIRS env var if not specified). " ,
110110 ),
111111) -> None :
112112 """Generate MSAs from sequences in a CSV file using MMseqs2.
113113
114+ Before using this command users must first install MMseqs2.
115+
114116 Examples:
115117 # Single-column CSV
116118 atomworks msa generate sequences.csv output_msas/
0 commit comments