Also make PhraseReplacementMap more tolerant

This also clarifies the test expectations and how parsing errors are
handled.
This commit is contained in:
Lukhnos Liu 2022-01-18 22:46:26 -08:00
parent 9bc3536630
commit 202b1fa058
4 changed files with 70 additions and 11 deletions

View File

@ -11,6 +11,8 @@ add_library(McBopomofoLMLib
ParselessPhraseDB.h
ParselessLM.cpp
ParselessLM.h
PhraseReplacementMap.h
PhraseReplacementMap.cpp
UserPhrasesLM.h
UserPhrasesLM.cpp)
@ -32,6 +34,7 @@ add_executable(McBopomofoLMLibTest
KeyValueBlobReaderTest.cpp
ParselessLMTest.cpp
ParselessPhraseDBTest.cpp
PhraseReplacementMapTest.cpp
UserPhrasesLMTest.cpp)
target_link_libraries(McBopomofoLMLibTest gtest_main McBopomofoLMLib)
include(GoogleTest)

View File

@ -58,11 +58,6 @@ bool PhraseReplacementMap::open(const char *path)
while ((state = reader.Next(&keyValue)) == KeyValueBlobReader::State::HAS_PAIR) {
keyValueMap[keyValue.key] = keyValue.value;
}
if (state == KeyValueBlobReader::State::ERROR) {
close();
return false;
}
return true;
}

View File

@ -0,0 +1,59 @@
// Copyright (c) 2022 and onwards The McBopomofo Authors.
//
// Permission is hereby granted, free of charge, to any person
// obtaining a copy of this software and associated documentation
// files (the "Software"), to deal in the Software without
// restriction, including without limitation the rights to use,
// copy, modify, merge, publish, distribute, sublicense, and/or sell
// copies of the Software, and to permit persons to whom the
// Software is furnished to do so, subject to the following
// conditions:
//
// The above copyright notice and this permission notice shall be
// included in all copies or substantial portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
// EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
// OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
// NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
// HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
// WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
// FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
// OTHER DEALINGS IN THE SOFTWARE.
#include <cstdio>
#include <filesystem>
#include <string>
#include "PhraseReplacementMap.h"
#include "gtest/gtest.h"
namespace McBopomofo {
TEST(PhraseReplacementMapTest, LenientReading)
{
std::string tmp_name
= std::string(std::filesystem::temp_directory_path()) + "test.txt";
FILE* f = fopen(tmp_name.c_str(), "w");
ASSERT_NE(f, nullptr);
fprintf(f, "key value\n");
fprintf(f, "key2\n"); // error line
fprintf(f, "key3 value2\n");
int r = fclose(f);
ASSERT_EQ(r, 0);
PhraseReplacementMap map;
map.open(tmp_name.c_str());
ASSERT_EQ(map.valueForKey("key"), "value");
ASSERT_EQ(map.valueForKey("key2"), "");
// key2 causes parsing error, and the line that has key3 won't be parsed.
ASSERT_EQ(map.valueForKey("key3"), "");
r = remove(tmp_name.c_str());
ASSERT_EQ(r, 0);
}
} // namespace McBopomofo

View File

@ -38,17 +38,19 @@ TEST(UserPhreasesLMTest, LenientReading)
FILE* f = fopen(tmp_name.c_str(), "w");
ASSERT_NE(f, nullptr);
fprintf(f, "bar foo\n");
fprintf(f, "bar \n"); // error line
fprintf(f, "argh baz\n");
fprintf(f, "value1 reading1\n");
fprintf(f, "value2 \n"); // error line
fprintf(f, "value3 reading2\n");
int r = fclose(f);
ASSERT_EQ(r, 0);
UserPhrasesLM lm;
lm.open(tmp_name.c_str());
ASSERT_TRUE(lm.hasUnigramsForKey("foo"));
ASSERT_FALSE(lm.hasUnigramsForKey("bar"));
ASSERT_FALSE(lm.hasUnigramsForKey("baz"));
ASSERT_TRUE(lm.hasUnigramsForKey("reading1"));
ASSERT_FALSE(lm.hasUnigramsForKey("value2"));
// Anything after the error won't be parsed, so reading2 won't be found.
ASSERT_FALSE(lm.hasUnigramsForKey("reading2"));
r = remove(tmp_name.c_str());
ASSERT_EQ(r, 0);