@@ -225,8 +225,9 @@ def __init__(self, index_path : str, *args,
225
225
stemmer : Union [None , str , TerrierStemmer ] = TerrierStemmer .porter ,
226
226
stopwords : Union [None , TerrierStopwords , List [str ]] = TerrierStopwords .terrier ,
227
227
tokeniser : Union [str ,TerrierTokeniser ] = TerrierTokeniser .english ,
228
- type = IndexingType .CLASSIC ,
229
- ** kwargs ):
228
+ type = IndexingType .CLASSIC ,
229
+ properties : Dict [str ,str ] = {}
230
+ ):
230
231
"""
231
232
Constructor called by all indexer subclasses. All arguments listed below are available in
232
233
IterDictIndexer, DFIndexer, TRECCollectionIndexer and FilesIndexer.
@@ -240,6 +241,7 @@ def __init__(self, index_path : str, *args,
240
241
stopwords (TerrierStopwords): the stopwords list to apply. Default is ``TerrierStopwords.terrier``.
241
242
tokeniser (TerrierTokeniser): the tokeniser to apply. Default is ``TerrierTokeniser.english``.
242
243
type (IndexingType): the specific indexing procedure to use. Default is ``IndexingType.CLASSIC``.
244
+ properties (dict): Terrier properties that you wish to override.
243
245
"""
244
246
if type is IndexingType .MEMORY :
245
247
self .path = None
@@ -256,6 +258,8 @@ def __init__(self, index_path : str, *args,
256
258
self .tokeniser = TerrierTokeniser ._to_obj (tokeniser )
257
259
self .properties = pt .java .J .Properties ()
258
260
self .setProperties (** self .default_properties )
261
+ for k ,v in properties .items ():
262
+ self .properties [k ] = v
259
263
self .overwrite = overwrite
260
264
self .verbose = verbose
261
265
self .meta_reverse = meta_reverse
0 commit comments