/* * Copyright (C) 2018 The Android Open Source Project * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ #include "annotator/annotator_jni.h" #include "gmock/gmock.h" #include "gtest/gtest.h" namespace libtextclassifier3 { namespace { TEST(Annotator, ConvertIndicesBMPUTF8) { // Test boundary cases. EXPECT_EQ(ConvertIndicesBMPToUTF8("hello", {0, 5}), CodepointSpan(0, 5)); EXPECT_EQ(ConvertIndicesUTF8ToBMP("hello", {0, 5}), std::make_pair(0, 5)); EXPECT_EQ(ConvertIndicesBMPToUTF8("hello world", {0, 5}), CodepointSpan(0, 5)); EXPECT_EQ(ConvertIndicesUTF8ToBMP("hello world", {0, 5}), std::make_pair(0, 5)); EXPECT_EQ(ConvertIndicesBMPToUTF8("๐Ÿ˜ello world", {0, 6}), CodepointSpan(0, 5)); EXPECT_EQ(ConvertIndicesUTF8ToBMP("๐Ÿ˜ello world", {0, 5}), std::make_pair(0, 6)); EXPECT_EQ(ConvertIndicesBMPToUTF8("hello world", {6, 11}), CodepointSpan(6, 11)); EXPECT_EQ(ConvertIndicesUTF8ToBMP("hello world", {6, 11}), std::make_pair(6, 11)); EXPECT_EQ(ConvertIndicesBMPToUTF8("hello worl๐Ÿ˜", {6, 12}), CodepointSpan(6, 11)); EXPECT_EQ(ConvertIndicesUTF8ToBMP("hello worl๐Ÿ˜", {6, 11}), std::make_pair(6, 12)); // Simple example where the longer character is before the selection. // character ๐Ÿ˜ is 0x1f601 EXPECT_EQ(ConvertIndicesBMPToUTF8("๐Ÿ˜ Hello World.", {3, 8}), CodepointSpan(2, 7)); EXPECT_EQ(ConvertIndicesUTF8ToBMP("๐Ÿ˜ Hello World.", {2, 7}), std::make_pair(3, 8)); // Longer character is before and in selection. EXPECT_EQ(ConvertIndicesBMPToUTF8("๐Ÿ˜ Hell๐Ÿ˜ World.", {3, 9}), CodepointSpan(2, 7)); EXPECT_EQ(ConvertIndicesUTF8ToBMP("๐Ÿ˜ Hell๐Ÿ˜ World.", {2, 7}), std::make_pair(3, 9)); // Longer character is before and after selection. EXPECT_EQ(ConvertIndicesBMPToUTF8("๐Ÿ˜ Hello๐Ÿ˜World.", {3, 8}), CodepointSpan(2, 7)); EXPECT_EQ(ConvertIndicesUTF8ToBMP("๐Ÿ˜ Hello๐Ÿ˜World.", {2, 7}), std::make_pair(3, 8)); // Longer character is before in after selection. EXPECT_EQ(ConvertIndicesBMPToUTF8("๐Ÿ˜ Hell๐Ÿ˜๐Ÿ˜World.", {3, 9}), CodepointSpan(2, 7)); EXPECT_EQ(ConvertIndicesUTF8ToBMP("๐Ÿ˜ Hell๐Ÿ˜๐Ÿ˜World.", {2, 7}), std::make_pair(3, 9)); } } // namespace } // namespace libtextclassifier3