You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
114 lines
3.9 KiB
114 lines
3.9 KiB
7 months ago
|
/*
|
||
|
* Copyright (C) 2018 The Android Open Source Project
|
||
|
*
|
||
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
||
|
* you may not use this file except in compliance with the License.
|
||
|
* You may obtain a copy of the License at
|
||
|
*
|
||
|
* http://www.apache.org/licenses/LICENSE-2.0
|
||
|
*
|
||
|
* Unless required by applicable law or agreed to in writing, software
|
||
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
||
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||
|
* See the License for the specific language governing permissions and
|
||
|
* limitations under the License.
|
||
|
*/
|
||
|
|
||
|
#include "utils/regex-match.h"
|
||
|
|
||
|
#include <memory>
|
||
|
|
||
|
#include "utils/jvm-test-utils.h"
|
||
|
#include "utils/utf8/unicodetext.h"
|
||
|
#include "utils/utf8/unilib.h"
|
||
|
#include "gmock/gmock.h"
|
||
|
#include "gtest/gtest.h"
|
||
|
|
||
|
namespace libtextclassifier3 {
|
||
|
namespace {
|
||
|
|
||
|
// Fixture shared by the regex-match tests. It owns the UniLib instance that
// the tests use to create regex patterns.
class RegexMatchTest : public testing::Test {
 protected:
  // Populated from CreateUniLibForTesting() when the fixture is constructed.
  std::unique_ptr<UniLib> unilib_{
      libtextclassifier3::CreateUniLibForTesting()};
};
|
||
|
|
||
|
#ifndef TC3_DISABLE_LUA
|
||
|
TEST_F(RegexMatchTest, HandlesSimpleVerification) {
|
||
|
EXPECT_TRUE(VerifyMatch(/*context=*/"", /*matcher=*/nullptr, "return true;"));
|
||
|
}
|
||
|
#endif // TC3_DISABLE_LUA
|
||
|
|
||
|
#ifndef TC3_DISABLE_LUA
|
||
|
TEST_F(RegexMatchTest, HandlesCustomVerification) {
|
||
|
UnicodeText pattern = UTF8ToUnicodeText("(\\d{16})",
|
||
|
/*do_copy=*/true);
|
||
|
UnicodeText message = UTF8ToUnicodeText("cc: 4012888888881881",
|
||
|
/*do_copy=*/true);
|
||
|
const std::string verifier = R"(
|
||
|
function luhn(candidate)
|
||
|
local sum = 0
|
||
|
local num_digits = string.len(candidate)
|
||
|
local parity = num_digits % 2
|
||
|
for pos = 1,num_digits do
|
||
|
d = tonumber(string.sub(candidate, pos, pos))
|
||
|
if pos % 2 ~= parity then
|
||
|
d = d * 2
|
||
|
end
|
||
|
if d > 9 then
|
||
|
d = d - 9
|
||
|
end
|
||
|
sum = sum + d
|
||
|
end
|
||
|
return (sum % 10) == 0
|
||
|
end
|
||
|
return luhn(match[1].text);
|
||
|
)";
|
||
|
const std::unique_ptr<UniLib::RegexPattern> regex_pattern =
|
||
|
unilib_->CreateRegexPattern(pattern);
|
||
|
ASSERT_TRUE(regex_pattern != nullptr);
|
||
|
const std::unique_ptr<UniLib::RegexMatcher> matcher =
|
||
|
regex_pattern->Matcher(message);
|
||
|
ASSERT_TRUE(matcher != nullptr);
|
||
|
int status = UniLib::RegexMatcher::kNoError;
|
||
|
ASSERT_TRUE(matcher->Find(&status) &&
|
||
|
status == UniLib::RegexMatcher::kNoError);
|
||
|
|
||
|
EXPECT_TRUE(VerifyMatch(message.ToUTF8String(), matcher.get(), verifier));
|
||
|
}
|
||
|
#endif // TC3_DISABLE_LUA
|
||
|
|
||
|
// Steps through two successive matches of a pattern whose two capturing
// groups sit in different alternatives, and checks which groups carry text
// for each match.
TEST_F(RegexMatchTest, RetrievesMatchGroupTest) {
  UnicodeText lyric_pattern = UTF8ToUnicodeText(
      "never gonna (?:give (you) up|let (you) down)", /*do_copy=*/true);
  const std::unique_ptr<UniLib::RegexPattern> compiled_pattern =
      unilib_->CreateRegexPattern(lyric_pattern);
  ASSERT_TRUE(compiled_pattern != nullptr);

  UnicodeText lyrics =
      UTF8ToUnicodeText("never gonna give you up - never gonna let you down");
  const std::unique_ptr<UniLib::RegexMatcher> matcher =
      compiled_pattern->Matcher(lyrics);
  ASSERT_TRUE(matcher != nullptr);

  // Shorthand for looking up one capturing group of the current match.
  const auto group_text = [&matcher](int group_id) {
    return GetCapturingGroupText(matcher.get(), group_id);
  };

  int status = UniLib::RegexMatcher::kNoError;

  // First match: group 1 has text, group 2 does not.
  const bool found_first = matcher->Find(&status);
  ASSERT_TRUE(found_first);
  ASSERT_TRUE(status == UniLib::RegexMatcher::kNoError);
  EXPECT_THAT(group_text(0).value(), testing::Eq("never gonna give you up"));
  EXPECT_THAT(group_text(1).value(), testing::Eq("you"));
  EXPECT_FALSE(group_text(2).has_value());

  // Second match: group 2 has text, group 1 does not.
  const bool found_second = matcher->Find(&status);
  ASSERT_TRUE(found_second);
  ASSERT_TRUE(status == UniLib::RegexMatcher::kNoError);
  EXPECT_THAT(group_text(0).value(), testing::Eq("never gonna let you down"));
  EXPECT_FALSE(group_text(1).has_value());
  EXPECT_THAT(group_text(2).value(), testing::Eq("you"));
}
|
||
|
|
||
|
} // namespace
|
||
|
} // namespace libtextclassifier3
|