From 4b8c18058164815c0407a64482140a3cfc925f38 Mon Sep 17 00:00:00 2001 From: Denis Parfenov <33306370+tempoden@users.noreply.github.com> Date: Sat, 12 Oct 2024 17:23:51 +0700 Subject: [PATCH 1/2] Add assert for n=1 in count_ngrams --- week03_lm/seminar.ipynb | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/week03_lm/seminar.ipynb b/week03_lm/seminar.ipynb index 90297594..de0a91b5 100644 --- a/week03_lm/seminar.ipynb +++ b/week03_lm/seminar.ipynb @@ -191,7 +191,10 @@ "assert len(dummy_counts[('_UNK_', '_UNK_')]) == 78\n", "assert dummy_counts['_UNK_', 'a']['note'] == 3\n", "assert dummy_counts['p', '=']['np'] == 2\n", - "assert dummy_counts['author', '.']['_EOS_'] == 1" + "assert dummy_counts['author', '.']['_EOS_'] == 1", + "\n", + "single_counts = count_ngrams(dummy_lines, n=1)", + "assert single_counts[()][EOS] == len(dummy_lines)" ] }, { From d9e8b62c3950cb8e86f2a572d22541c56031509e Mon Sep 17 00:00:00 2001 From: Denis Parfenov <33306370+tempoden@users.noreply.github.com> Date: Sat, 12 Oct 2024 17:26:04 +0700 Subject: [PATCH 2/2] Add missing newlines to n=1 assert in count_ngrams --- week03_lm/seminar.ipynb | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/week03_lm/seminar.ipynb b/week03_lm/seminar.ipynb index de0a91b5..7c2df9a3 100644 --- a/week03_lm/seminar.ipynb +++ b/week03_lm/seminar.ipynb @@ -191,9 +191,9 @@ "assert len(dummy_counts[('_UNK_', '_UNK_')]) == 78\n", "assert dummy_counts['_UNK_', 'a']['note'] == 3\n", "assert dummy_counts['p', '=']['np'] == 2\n", - "assert dummy_counts['author', '.']['_EOS_'] == 1", + "assert dummy_counts['author', '.']['_EOS_'] == 1\n", "\n", - "single_counts = count_ngrams(dummy_lines, n=1)", + "single_counts = count_ngrams(dummy_lines, n=1)\n", "assert single_counts[()][EOS] == len(dummy_lines)" ] },