2015-01-09 20:52:31 +01:00
|
|
|
|
#include "apps/openmw/mwdialogue/keywordsearch.hpp"
|
2023-12-26 14:38:39 +01:00
|
|
|
|
|
2015-01-09 20:52:31 +01:00
|
|
|
|
#include <gtest/gtest.h>
|
|
|
|
|
|
|
|
|
|
struct KeywordSearchTest : public ::testing::Test
|
|
|
|
|
{
|
|
|
|
|
protected:
|
2020-10-22 23:57:53 +02:00
|
|
|
|
void SetUp() override {}
|
2022-09-22 21:26:05 +03:00
|
|
|
|
|
2020-10-22 23:57:53 +02:00
|
|
|
|
void TearDown() override {}
|
2015-01-09 20:52:31 +01:00
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
TEST_F(KeywordSearchTest, keyword_test_conflict_resolution)
{
    // test to make sure the longest keyword in a chain of conflicting keywords gets chosen
    MWDialogue::KeywordSearch<int> search;
    search.seed("foo bar", 0);
    search.seed("bar lock", 0);
    search.seed("lock switch", 0);

    std::string text = "foo bar lock switch";

    std::vector<MWDialogue::KeywordSearch<int>::Match> matches;
    search.highlightKeywords(text.begin(), text.end(), matches);

    // Should contain: "foo bar", "lock switch"
    // Fatal assertion: front()/rbegin() below must not be evaluated on an empty vector.
    ASSERT_EQ(matches.size(), 2);
    EXPECT_EQ(std::string(matches.front().mBeg, matches.front().mEnd), "foo bar");
    EXPECT_EQ(std::string(matches.rbegin()->mBeg, matches.rbegin()->mEnd), "lock switch");
}
|
|
|
|
|
|
|
|
|
|
TEST_F(KeywordSearchTest, keyword_test_conflict_resolution2)
{
    // two overlapping keywords share the word "dwemer"; exactly one match is expected,
    // and it must be "dwemer language" rather than "the dwemer"
    MWDialogue::KeywordSearch<int> search;
    search.seed("the dwemer", 0);
    search.seed("dwemer language", 0);

    std::string text = "the dwemer language";

    std::vector<MWDialogue::KeywordSearch<int>::Match> matches;
    search.highlightKeywords(text.begin(), text.end(), matches);

    // Fatal assertion: front() below must not be evaluated on an empty vector.
    ASSERT_EQ(matches.size(), 1);
    EXPECT_EQ(std::string(matches.front().mBeg, matches.front().mEnd), "dwemer language");
}
|
2015-01-10 00:26:13 +01:00
|
|
|
|
|
|
|
|
|
TEST_F(KeywordSearchTest, keyword_test_conflict_resolution3)
{
    // testing that the longest keyword is chosen, rather than maximizing the
    // amount of highlighted characters by highlighting the first and last keyword
    MWDialogue::KeywordSearch<int> search;
    search.seed("foo bar", 0);
    search.seed("bar lock", 0);
    search.seed("lock so", 0);

    std::string text = "foo bar lock so";

    std::vector<MWDialogue::KeywordSearch<int>::Match> matches;
    search.highlightKeywords(text.begin(), text.end(), matches);

    // Fatal assertion: front() below must not be evaluated on an empty vector.
    ASSERT_EQ(matches.size(), 1);
    EXPECT_EQ(std::string(matches.front().mBeg, matches.front().mEnd), "bar lock");
}
|
2021-09-19 15:05:48 +02:00
|
|
|
|
|
|
|
|
|
TEST_F(KeywordSearchTest, keyword_test_utf8_word_begin)
{
    // We make sure that the search works well even if the character is not ASCII
    MWDialogue::KeywordSearch<int> search;
    search.seed("états", 0);
    search.seed("ïrradiés", 0);
    search.seed("ça nous déçois", 0);
    // "ois" only occurs in the text as the tail of "déçois"; the expectations below
    // require that it does not produce a match of its own.
    search.seed("ois", 0);

    std::string text
        = "les nations unis ont réunis le monde entier, états units inclus pour parler du problème des gens ïrradiés "
          "et ça nous déçois";

    std::vector<MWDialogue::KeywordSearch<int>::Match> matches;
    search.highlightKeywords(text.begin(), text.end(), matches);

    // Fatal assertion: the indexed accesses below are out of bounds if fewer matches come back.
    ASSERT_EQ(matches.size(), 3);
    EXPECT_EQ(std::string(matches[0].mBeg, matches[0].mEnd), "états");
    EXPECT_EQ(std::string(matches[1].mBeg, matches[1].mEnd), "ïrradiés");
    EXPECT_EQ(std::string(matches[2].mBeg, matches[2].mEnd), "ça nous déçois");
}
|
2021-10-07 13:26:40 +00:00
|
|
|
|
|
|
|
|
|
TEST_F(KeywordSearchTest, keyword_test_non_alpha_non_whitespace_word_begin)
{
    // We make sure that the search works well even if the separator is not a whitespace
    // (here the keyword directly follows a double quote)
    MWDialogue::KeywordSearch<int> search;
    search.seed("Report to caius cosades", 0);

    std::string text = "I was told to \"Report to caius cosades\"";

    std::vector<MWDialogue::KeywordSearch<int>::Match> matches;
    search.highlightKeywords(text.begin(), text.end(), matches);

    // Fatal assertion: matches[0] below must not be evaluated on an empty vector.
    ASSERT_EQ(matches.size(), 1);
    EXPECT_EQ(std::string(matches[0].mBeg, matches[0].mEnd), "Report to caius cosades");
}
|
|
|
|
|
|
|
|
|
|
TEST_F(KeywordSearchTest, keyword_test_russian_non_ascii_before)
{
    // We make sure that the search works well even if the separator is not a whitespace with russian chars
    // (here the keyword directly follows the non-ASCII quotation mark «)
    MWDialogue::KeywordSearch<int> search;
    search.seed("Доложить Каю Косадесу", 0);

    std::string text
        = "Что? Да. Я Кай Косадес. То есть как это, вам велели «Доложить Каю Косадесу»? О чем вы говорите?";

    std::vector<MWDialogue::KeywordSearch<int>::Match> matches;
    search.highlightKeywords(text.begin(), text.end(), matches);

    // Fatal assertion: matches[0] below must not be evaluated on an empty vector.
    ASSERT_EQ(matches.size(), 1);
    EXPECT_EQ(std::string(matches[0].mBeg, matches[0].mEnd), "Доложить Каю Косадесу");
}
|
|
|
|
|
|
|
|
|
|
TEST_F(KeywordSearchTest, keyword_test_russian_ascii_before)
{
    // We make sure that the search works well even if the separator is not a whitespace with russian chars
    // (here the keyword directly follows the ASCII apostrophe ')
    MWDialogue::KeywordSearch<int> search;
    search.seed("Доложить Каю Косадесу", 0);

    std::string text
        = "Что? Да. Я Кай Косадес. То есть как это, вам велели 'Доложить Каю Косадесу'? О чем вы говорите?";

    std::vector<MWDialogue::KeywordSearch<int>::Match> matches;
    search.highlightKeywords(text.begin(), text.end(), matches);

    // Fatal assertion: matches[0] below must not be evaluated on an empty vector.
    ASSERT_EQ(matches.size(), 1);
    EXPECT_EQ(std::string(matches[0].mBeg, matches[0].mEnd), "Доложить Каю Косадесу");
}
|