@@ -66,7 +66,8 @@ def register_arguments(parser):
66
66
"201X-10-01"). Similarly, an ambiguous month makes the
67
67
corresponding day ambiguous (e.g., "2010-XX-01").""" )
68
68
metadata_filter_group .add_argument ('--exclude' , type = str , nargs = "+" , metavar = "FILE" , default = argparse .SUPPRESS ,
69
- help = "File(s) with list of strains to exclude." )
69
+ help = """File(s) with list of strain IDs to exclude. The ID column is
70
+ determined by --metadata-id-columns.""" )
70
71
metadata_filter_group .add_argument ('--exclude-where' , nargs = '+' , metavar = "CONDITION" , default = argparse .SUPPRESS ,
71
72
help = """Exclude strains matching these conditions. Ex: \" host=rat\" or
72
73
\" host!=rat\" . Multiple values are processed as OR (matching any of
@@ -75,8 +76,9 @@ def register_arguments(parser):
75
76
help = """Exclude all strains by default. Use this with the include
76
77
arguments to select a specific subset of strains.""" )
77
78
metadata_filter_group .add_argument ('--include' , type = str , nargs = "+" , metavar = "FILE" , default = argparse .SUPPRESS ,
78
- help = """File(s) with list of strains to include regardless of
79
- priorities, subsampling, or absence of an entry in --sequences.""" )
79
+ help = """File(s) with list of strain IDs to include regardless of
80
+ priorities, subsampling, or absence of an entry in --sequences. The
81
+ ID column is determined by --metadata-id-columns.""" )
80
82
metadata_filter_group .add_argument ('--include-where' , nargs = '+' , metavar = "CONDITION" , default = argparse .SUPPRESS ,
81
83
help = """Include strains with these values. ex: host=rat. Multiple values
82
84
are processed as OR (having any of those specified will be
@@ -128,13 +130,14 @@ def register_arguments(parser):
128
130
129
131
subsample_group .add_argument ('--priority' , type = str , metavar = "FILE" , default = argparse .SUPPRESS ,
130
132
help = """Tab-delimited file with list of priority scores for strains
131
- (e.g., "<strain>\\ t<priority>") and no header. When scores are
133
+ (e.g., "<strain ID >\\ t<priority>") and no header. When scores are
132
134
provided, Augur converts scores to floating point values, sorts
133
135
strains within each subsampling group from highest to lowest
134
136
priority, and selects the top N strains per group where N is the
135
137
calculated or requested number of strains per group. Higher numbers
136
138
indicate higher priority. Since priorities represent relative
137
- values between strains, these values can be arbitrary.""" )
139
+ values between strains, these values can be arbitrary. The ID
140
+ column is determined by --metadata-id-columns.""" )
138
141
subsample_group .add_argument ('--subsample-seed' , type = int , metavar = "N" , default = argparse .SUPPRESS ,
139
142
help = """Random number generator seed to allow reproducible subsampling
140
143
(with same input data).""" )
@@ -149,7 +152,8 @@ def register_arguments(parser):
149
152
output_group .add_argument ('--output-metadata' , metavar = "FILE" , default = argparse .SUPPRESS ,
150
153
help = "Metadata for strains that passed filters." )
151
154
output_group .add_argument ('--output-strains' , metavar = "FILE" , default = argparse .SUPPRESS ,
152
- help = "List of strains that passed filters (no header)." )
155
+ help = """List of strain IDs that passed filters (no header). The ID
156
+ column is determined by --metadata-id-columns.""" )
153
157
output_group .add_argument ('--output-log' , metavar = "FILE" , default = argparse .SUPPRESS ,
154
158
help = """Tab-delimited file with one row for each filtered strain and the
155
159
reason it was filtered. Keyword arguments used for a given filter
0 commit comments