diff options
| author | Star Rauchenberger <fefferburbia@gmail.com> | 2022-12-09 16:53:33 -0500 |
|---|---|---|
| committer | Star Rauchenberger <fefferburbia@gmail.com> | 2022-12-09 16:53:33 -0500 |
| commit | 06e4672540094a851542b47abaf022f934b63b09 (patch) | |
| tree | 5333fb4446fce0043600f7d06427dd243a15c543 /generator/generator.cpp | |
| parent | f2731325f551c4cfea861e2e31d214936b9bd619 (diff) | |
| download | verbly-06e4672540094a851542b47abaf022f934b63b09.tar.gz verbly-06e4672540094a851542b47abaf022f934b63b09.tar.bz2 verbly-06e4672540094a851542b47abaf022f934b63b09.zip | |
Generator now splits ImageNet list into per-notion files
Diffstat (limited to 'generator/generator.cpp')
| -rw-r--r-- | generator/generator.cpp | 23 |
1 files changed, 15 insertions, 8 deletions
| diff --git a/generator/generator.cpp b/generator/generator.cpp index fdea10f..969b629 100644 --- a/generator/generator.cpp +++ b/generator/generator.cpp | |||
| @@ -23,13 +23,15 @@ namespace verbly { | |||
| 23 | std::string wordNetPath, | 23 | std::string wordNetPath, |
| 24 | std::string cmudictPath, | 24 | std::string cmudictPath, |
| 25 | std::string imageNetPath, | 25 | std::string imageNetPath, |
| 26 | std::string outputPath) : | 26 | std::string outputPath, |
| 27 | std::string imageNetOutput) : | ||
| 27 | verbNetPath_(verbNetPath), | 28 | verbNetPath_(verbNetPath), |
| 28 | agidPath_(agidPath), | 29 | agidPath_(agidPath), |
| 29 | wordNetPath_(wordNetPath), | 30 | wordNetPath_(wordNetPath), |
| 30 | cmudictPath_(cmudictPath), | 31 | cmudictPath_(cmudictPath), |
| 31 | imageNetPath_(imageNetPath), | 32 | imageNetPath_(imageNetPath), |
| 32 | db_(outputPath, hatkirby::dbmode::create) | 33 | db_(outputPath, hatkirby::dbmode::create), |
| 34 | imageNetOutput_(imageNetOutput) | ||
| 33 | { | 35 | { |
| 34 | // Ensure VerbNet directory exists | 36 | // Ensure VerbNet directory exists |
| 35 | DIR* dir; | 37 | DIR* dir; |
| @@ -75,6 +77,9 @@ namespace verbly { | |||
| 75 | { | 77 | { |
| 76 | throw std::invalid_argument("ImageNet urls.txt file not found"); | 78 | throw std::invalid_argument("ImageNet urls.txt file not found"); |
| 77 | } | 79 | } |
| 80 | |||
| 81 | // Create the ImageNet output directory | ||
| 82 | std::filesystem::create_directory(imageNetOutput_); | ||
| 78 | } | 83 | } |
| 79 | 84 | ||
| 80 | void generator::run() | 85 | void generator::run() |
| @@ -86,7 +91,7 @@ namespace verbly { | |||
| 86 | readAdjectivePositioning(); | 91 | readAdjectivePositioning(); |
| 87 | 92 | ||
| 88 | // Counts the number of URLs ImageNet has per notion | 93 | // Counts the number of URLs ImageNet has per notion |
| 89 | //readImageNetUrls(); | 94 | readImageNetUrls(); |
| 90 | 95 | ||
| 91 | // Creates a word by WordNet sense key lookup table | 96 | // Creates a word by WordNet sense key lookup table |
| 92 | readWordNetSenseKeys(); | 97 | readWordNetSenseKeys(); |
| @@ -118,17 +123,15 @@ namespace verbly { | |||
| 118 | // Writes the database version | 123 | // Writes the database version |
| 119 | writeVersion(); | 124 | writeVersion(); |
| 120 | 125 | ||
| 126 | // Dumps data to the database | ||
| 127 | dumpObjects(); | ||
| 128 | |||
| 121 | // Calculates and writes form merography | 129 | // Calculates and writes form merography |
| 122 | writeMerography(); | 130 | writeMerography(); |
| 123 | 131 | ||
| 124 | // Calculates and writes pronunciation merophony | 132 | // Calculates and writes pronunciation merophony |
| 125 | writeMerophony(); | 133 | writeMerophony(); |
| 126 | 134 | ||
| 127 | // Dumps data to the database | ||
| 128 | dumpObjects(); | ||
| 129 | |||
| 130 | |||
| 131 | |||
| 132 | // Populates the antonymy relationship from WordNet | 135 | // Populates the antonymy relationship from WordNet |
| 133 | readWordNetAntonymy(); | 136 | readWordNetAntonymy(); |
| 134 | 137 | ||
| @@ -286,6 +289,10 @@ namespace verbly { | |||
| 286 | { | 289 | { |
| 287 | // We know that this notion has a wnid and is a noun. | 290 | // We know that this notion has a wnid and is a noun. |
| 288 | notionByWnid_.at(wnid)->incrementNumOfImages(); | 291 | notionByWnid_.at(wnid)->incrementNumOfImages(); |
| 292 | |||
| 293 | std::filesystem::path imagefile = imageNetOutput_ / std::to_string(notionByWnid_[wnid]->getId()); | ||
| 294 | std::ofstream imageoutput(imagefile, std::ios::app); | ||
| 295 | imageoutput << line.substr(line.find("\t") + 1) << std::endl; | ||
| 289 | } | 296 | } |
| 290 | } | 297 | } |
| 291 | } | 298 | } |
