Skip to content

Commit

Permalink
Added example config files
Browse files Browse the repository at this point in the history
  • Loading branch information
RunDevelopment committed Jun 9, 2021
1 parent 19b8f8b commit 9e12323
Show file tree
Hide file tree
Showing 2 changed files with 24 additions and 0 deletions.
12 changes: 12 additions & 0 deletions examples/de.properties
Original file line number Diff line number Diff line change
@@ -0,0 +1,12 @@
# Example configuration for German (lang = de).
# Every /path/to/... value below is a placeholder; replace it with a real location.
#
# This uses the following datasets:
#
# 1) Web 1T 5-gram, 10 European Languages, Version 1, Linguistic Data Consortium (LDC) catalog number LDC2009T25 and ISBN 1-58563-525-1
# 2) Google Ngram Viewer dataset version 1 from 2009-07-15

# In .properties syntax the trailing backslash continues the value on the next
# line, so both paths below belong to the single `input` key. Do not insert a
# comment or blank line between the two lines.
# NOTE(review): the ';' looks like the separator between the two dataset
# directories listed above - confirm against the tool that reads this file.
input = /path/to/corpus-google-web-1t-5-gram-10-european-languages-version1/data/GERMAN \
; /path/to/corpus-google-books-n-grams-version1/googlebooks-ger-all-20090715
# NOTE(review): presumably the directory the results are written to - confirm.
output = /path/to/out
# NOTE(review): presumably a scratch directory for intermediate files - confirm.
temp = /path/to/temp
# Language code for this configuration.
lang = de
# NOTE(review): presumably controls whether n-grams are lower-cased; it is
# disabled here, unlike in the English example - confirm the exact semantics.
lowercase = false
# NOTE(review): presumably the largest n-gram order to process - confirm.
max-n-gram = 5
12 changes: 12 additions & 0 deletions examples/en.properties
Original file line number Diff line number Diff line change
@@ -0,0 +1,12 @@
# Example configuration for English (lang = en).
# Every /path/to/... value below is a placeholder; replace it with a real location.
#
# This uses the following datasets:
#
# 1) Web 1T 5-gram Version 1, Linguistic Data Consortium (LDC) catalog number LDC2006T13 and ISBN 1-58563-397-6
# 2) Google Ngram Viewer dataset version 1 from 2009-07-15

# In .properties syntax the trailing backslash continues the value on the next
# line, so both paths below belong to the single `input` key. Do not insert a
# comment or blank line between the two lines.
# NOTE(review): the ';' looks like the separator between the two dataset
# directories listed above - confirm against the tool that reads this file.
input = /path/to/corpus-google-web-1t-5-gram-version1 \
; /path/to/corpus-google-books-n-grams-version1/googlebooks-eng-all-20090715
# NOTE(review): presumably the directory the results are written to - confirm.
output = /path/to/out
# NOTE(review): presumably a scratch directory for intermediate files - confirm.
temp = /path/to/temp
# Language code for this configuration.
lang = en
# NOTE(review): presumably controls whether n-grams are lower-cased; it is
# enabled here, unlike in the German example - confirm the exact semantics.
lowercase = true
# NOTE(review): presumably the largest n-gram order to process - confirm.
max-n-gram = 5

0 comments on commit 9e12323

Please sign in to comment.