aboutsummaryrefslogtreecommitdiff
path: root/icing/query/advanced_query_parser/util/string-util_test.cc
blob: a7ccf3e8fdbaf254db665777f832998bfd8fd65a (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
// Copyright (C) 2023 Google LLC
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//      http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "icing/query/advanced_query_parser/util/string-util.h"

#include "gmock/gmock.h"
#include "gtest/gtest.h"
#include "icing/testing/common-matchers.h"

namespace icing {
namespace lib {

namespace {

using ::testing::Eq;
using ::testing::IsEmpty;

// An empty input is expected to unescape successfully to an empty string.
TEST(StringUtilTest, UnescapeStringEmptyString) {
  auto unescaped_or = string_util::UnescapeStringValue("");
  EXPECT_THAT(unescaped_or, IsOkAndHolds(IsEmpty()));
}

// Inputs that contain neither a backslash nor a double quote are expected to
// come back unchanged, including ones with embedded spaces, tabs and dots.
TEST(StringUtilTest, UnescapeStringStringWithNoEscapes) {
  using string_util::UnescapeStringValue;

  EXPECT_THAT(UnescapeStringValue("foo"), IsOkAndHolds("foo"));
  EXPECT_THAT(UnescapeStringValue("f o o"), IsOkAndHolds("f o o"));
  EXPECT_THAT(UnescapeStringValue("f\to\to"), IsOkAndHolds("f\to\to"));
  EXPECT_THAT(UnescapeStringValue("f.o.o"), IsOkAndHolds("f.o.o"));
}

// Each case below expects a backslash to be removed from the output while the
// character that follows it is kept as-is.
TEST(StringUtilTest, UnescapeStringStringWithEscapes) {
  using string_util::UnescapeStringValue;

  // Escaping an ordinary character yields just that character.
  EXPECT_THAT(UnescapeStringValue("f\\oo"), IsOkAndHolds("foo"));

  // An escaped backslash yields a single literal backslash.
  EXPECT_THAT(UnescapeStringValue("f\\\\oo"), IsOkAndHolds("f\\oo"));

  // An escaped double quote yields a literal double quote.
  EXPECT_THAT(UnescapeStringValue("f\\\"oo"), IsOkAndHolds("f\"oo"));

  // A trailing backslash with nothing after it is dropped.
  EXPECT_THAT(UnescapeStringValue("foo\\"), IsOkAndHolds("foo"));

  // Several escapes spread across space-separated words.
  EXPECT_THAT(UnescapeStringValue("foo b\\a\\\"r baz"),
              IsOkAndHolds("foo ba\"r baz"));
  EXPECT_THAT(UnescapeStringValue("bar b\\aar bar\\s bart"),
              IsOkAndHolds("bar baar bars bart"));

  // Two consecutive escaped backslashes yield two literal backslashes.
  EXPECT_THAT(UnescapeStringValue("\\\\\\\\a"), IsOkAndHolds("\\\\a"));
}

// A double quote that is not directly preceded by a backslash is expected to
// be rejected with INVALID_ARGUMENT.
TEST(StringUtilTest, UnescapeStringQuoteWithoutEscape) {
  const auto expected_code = libtextclassifier3::StatusCode::INVALID_ARGUMENT;

  // The backslash here escapes the 'o', not the quote that comes after it.
  EXPECT_THAT(string_util::UnescapeStringValue("f\\o\"o"),
              StatusIs(expected_code));

  // No backslash at all in front of the quote.
  EXPECT_THAT(string_util::UnescapeStringValue("f\"oo"),
              StatusIs(expected_code));
}

// Searching for an empty unescaped token is expected to fail with
// INVALID_ARGUMENT.
TEST(StringUtilTest, FindEscapedTokenEmptyUnescapedToken) {
  auto escaped_token_or =
      string_util::FindEscapedToken("foo b\\a\\\"r baz", "");
  EXPECT_THAT(escaped_token_or,
              StatusIs(libtextclassifier3::StatusCode::INVALID_ARGUMENT));
}

// Tokens that do not occur in the unescaped form of the text are expected to
// produce INVALID_ARGUMENT. The last three tokens each differ from a word that
// is present ("baz") by a single character.
TEST(StringUtilTest, FindEscapedTokenTokenNotPresent) {
  constexpr char kEscapedText[] = "foo b\\a\\\"r baz";
  const auto expected_code = libtextclassifier3::StatusCode::INVALID_ARGUMENT;

  EXPECT_THAT(string_util::FindEscapedToken(kEscapedText, "elephant"),
              StatusIs(expected_code));
  EXPECT_THAT(string_util::FindEscapedToken(kEscapedText, "bat"),
              StatusIs(expected_code));
  EXPECT_THAT(string_util::FindEscapedToken(kEscapedText, "taz"),
              StatusIs(expected_code));
  EXPECT_THAT(string_util::FindEscapedToken(kEscapedText, "bazz"),
              StatusIs(expected_code));
}

// A token is expected to be found even when it only appears inside a longer
// word rather than at the start of one.
TEST(StringUtilTest, FindEscapedTokenMatchInMiddleToken) {
  auto escaped_token_or = string_util::FindEscapedToken("babar", "bar");
  EXPECT_THAT(escaped_token_or, IsOkAndHolds("bar"));
}

// The returned value is expected to be the escaped spelling of the token as it
// appears in the escaped text, with its backslashes included.
TEST(StringUtilTest, FindEscapedTokenMatches) {
  using string_util::FindEscapedToken;

  // The token contains a literal quote; its escaped form carries two escapes.
  EXPECT_THAT(FindEscapedToken("foo b\\a\\\"r baz", "ba\"r"),
              IsOkAndHolds("b\\a\\\"r"));

  // The token contains two literal backslashes, each escaped in the text.
  EXPECT_THAT(FindEscapedToken("\\\\\\\\a", "\\\\a"),
              IsOkAndHolds("\\\\\\\\a"));
}

// Walks through an escaped text by searching for the same token again and
// again in whatever follows the previous match. Three successful matches are
// expected, after which the search must fail.
//
// The test relies on each match being a view into the text that was searched,
// so that pointer arithmetic yields the number of characters consumed.
TEST(StringUtilTest, FindEscapedTokenTraversesThroughEscapedText) {
  std::string_view remaining = "bar b\\aar bar\\s bart";

  // First search covers the whole text.
  ICING_ASSERT_OK_AND_ASSIGN(std::string_view match,
                             string_util::FindEscapedToken(remaining, "bar"));
  EXPECT_THAT(match, Eq("bar"));

  // Drop everything up to and including the first match. What is left, as raw
  // characters, is expected to be: " b\aar bar\s bart" (note the leading space).
  const char* match_end = match.data() + match.size();
  remaining = remaining.substr(match_end - remaining.data());
  ICING_ASSERT_OK_AND_ASSIGN(match,
                             string_util::FindEscapedToken(remaining, "bar"));
  EXPECT_THAT(match, Eq("bar"));

  // Drop everything through the second match. What is left, as raw characters,
  // is expected to be: "\s bart".
  match_end = match.data() + match.size();
  remaining = remaining.substr(match_end - remaining.data());
  ICING_ASSERT_OK_AND_ASSIGN(match,
                             string_util::FindEscapedToken(remaining, "bar"));
  EXPECT_THAT(match, Eq("bar"));

  // Drop everything through the third match. Only the trailing "t" should be
  // left, so a further search has nothing to find.
  match_end = match.data() + match.size();
  remaining = remaining.substr(match_end - remaining.data());
  EXPECT_THAT(string_util::FindEscapedToken(remaining, "bar"),
              StatusIs(libtextclassifier3::StatusCode::INVALID_ARGUMENT));
}

}  // namespace

}  // namespace lib
}  // namespace icing