From 47d9ba41accf6410bb9cf26b49a1c76129a49975 Mon Sep 17 00:00:00 2001
From: Kelly Rauchenberger
Date: Wed, 27 Feb 2019 21:52:13 -0500
Subject: The beginning of a corpus should be treated as a new sentence

---
 kgramstats.cpp | 27 +++++++++++++++++++++++++++
 1 file changed, 27 insertions(+)

(limited to 'kgramstats.cpp')

diff --git a/kgramstats.cpp b/kgramstats.cpp
index 37830e4..7ece80f 100644
--- a/kgramstats.cpp
+++ b/kgramstats.cpp
@@ -396,6 +396,33 @@ void rawr::compile(int maxK)
   int corpid = 0;
   for (auto corpus : tokens)
   {
+    for (int k=0; k