From 1ed82c3071218d759cae6966fa6e9dbf47d38003 Mon Sep 17 00:00:00 2001 From: Kelly Rauchenberger Date: Sat, 20 Feb 2016 00:56:37 -0500 Subject: Added percentage display to preprocessing stage --- kgramstats.cpp | 56 ++++++++++++++++++++++++++++++++++++++++++++++++++++---- 1 file changed, 52 insertions(+), 4 deletions(-) (limited to 'kgramstats.cpp') diff --git a/kgramstats.cpp b/kgramstats.cpp index 8a21d60..07f41f6 100644 --- a/kgramstats.cpp +++ b/kgramstats.cpp @@ -91,9 +91,23 @@ kgramstats::kgramstats(std::string corpus, int maxK) emoji_file.close(); } - std::cout << "Tokenizing corpus..." << std::endl; + std::cout << "Tokenizing corpus... 0%" << std::flush; + int len = corpus.length(); + int per = 0; + int perprime = 0; + std::cout.fill(' '); while (end != std::string::npos) { + perprime = end * 100 / len; + if (perprime != per) + { + per = perprime; + + std::cout << "\b\b\b\b" << std::right; + std::cout.width(3); + std::cout << per << "%" << std::flush; + } + end = corpus.find(" ", start); bool emoji = false; @@ -294,6 +308,8 @@ kgramstats::kgramstats(std::string corpus, int maxK) start = ((end > (std::string::npos - 1) ) ? std::string::npos : end + 1); } + std::cout << "\b\b\b\b100%" << std::endl; + delete_aspell_speller(spell_checker); delete_aspell_config(spell_config); @@ -322,12 +338,25 @@ kgramstats::kgramstats(std::string corpus, int maxK) emoticons.terms.compile(); // kgram distribution - std::cout << "Creating markov chain..." << std::endl; + std::cout << "Creating markov chain... 0%" << std::flush; std::map > tstats; + len = (maxK-1) * tokens.size(); + per = 0; + perprime = 0; for (int k=1; k