1 //
2 // Copyright 2017 The Abseil Authors.
3 //
4 // Licensed under the Apache License, Version 2.0 (the "License");
5 // you may not use this file except in compliance with the License.
6 // You may obtain a copy of the License at
7 //
8 //      https://www.apache.org/licenses/LICENSE-2.0
9 //
10 // Unless required by applicable law or agreed to in writing, software
11 // distributed under the License is distributed on an "AS IS" BASIS,
12 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 // See the License for the specific language governing permissions and
14 // limitations under the License.
15 //
16 // -----------------------------------------------------------------------------
17 // File: str_replace.h
18 // -----------------------------------------------------------------------------
19 //
20 // This file defines `absl::StrReplaceAll()`, a general-purpose string
21 // replacement function designed for large, arbitrary text substitutions,
22 // especially on strings which you are receiving from some other system for
23 // further processing (e.g. processing regular expressions, escaping HTML
24 // entities, etc.). `StrReplaceAll` is designed to be efficient even when only
25 // one substitution is being performed, or when substitution is rare.
26 //
27 // If the string being modified is known at compile-time, and the substitutions
28 // vary, `absl::Substitute()` may be a better choice.
29 //
30 // Example:
31 //
32 // std::string html_escaped = absl::StrReplaceAll(user_input, {
//                                                {"&", "&amp;"},
34 //                                                {"<", "&lt;"},
35 //                                                {">", "&gt;"},
36 //                                                {"\"", "&quot;"},
37 //                                                {"'", "&#39;"}});
38 #ifndef ABSL_STRINGS_STR_REPLACE_H_
39 #define ABSL_STRINGS_STR_REPLACE_H_
40 
41 #include <string>
42 #include <utility>
43 #include <vector>
44 
45 #include "absl/base/attributes.h"
46 #include "absl/strings/string_view.h"
47 
48 namespace absl {
49 ABSL_NAMESPACE_BEGIN
50 
// StrReplaceAll()
//
// Replaces character sequences within a given string with replacements provided
// within an initializer list of key/value pairs, and returns the result as a
// new `std::string`. Each pair is {text to look for, text to put in its place}.
// The input `s` is only viewed, never modified.
//
// Candidate replacements are considered in order as they occur within the
// string, with earlier matches taking precedence, and longer matches taking
// precedence for candidates starting at the same position in the string. Once
// a substitution is made, the replaced text is not considered for any further
// substitutions.
//
// Example:
//
//   std::string s = absl::StrReplaceAll(
//       "$who bought $count #Noun. Thanks $who!",
//       {{"$count", absl::StrCat(5)},
//        {"$who", "Bob"},
//        {"#Noun", "Apples"}});
//   EXPECT_EQ("Bob bought 5 Apples. Thanks Bob!", s);
ABSL_MUST_USE_RESULT std::string StrReplaceAll(
    absl::string_view s,
    std::initializer_list<std::pair<absl::string_view, absl::string_view>>
        replacements);
72 
// Overload of `StrReplaceAll()` to accept a container of key/value replacement
// pairs (typically either an associative map or a `std::vector` of `std::pair`
// elements). A vector of pairs is generally more efficient.
//
// The container must provide `size()` and be iterable, and each element must
// expose its key and value through `get<0>` and `get<1>`, both convertible to
// `absl::string_view`. Pairs whose key is empty are ignored.
//
// Examples:
//
//   std::map<absl::string_view, absl::string_view> replacements;
//   replacements["$who"] = "Bob";
//   replacements["$count"] = "5";
//   replacements["#Noun"] = "Apples";
//   std::string s = absl::StrReplaceAll(
//       "$who bought $count #Noun. Thanks $who!",
//       replacements);
//   EXPECT_EQ("Bob bought 5 Apples. Thanks Bob!", s);
//
//   // A std::vector of std::pair elements can be more efficient.
//   std::vector<std::pair<const absl::string_view, std::string>> replacements;
//   replacements.push_back({"&", "&amp;"});
//   replacements.push_back({"<", "&lt;"});
//   replacements.push_back({">", "&gt;"});
//   std::string s = absl::StrReplaceAll("if (ptr < &foo)",
//                                  replacements);
//   EXPECT_EQ("if (ptr &lt; &amp;foo)", s);
template <typename StrToStrMapping>
std::string StrReplaceAll(absl::string_view s,
                          const StrToStrMapping& replacements);
99 
// Overload of `StrReplaceAll()` to replace character sequences within a given
// output string *in place* with replacements provided within an initializer
// list of key/value pairs, returning the number of substitutions that occurred.
//
// Example:
//
//   std::string s = std::string("$who bought $count #Noun. Thanks $who!");
//   int count;
//   count = absl::StrReplaceAll({{"$count", absl::StrCat(5)},
//                               {"$who", "Bob"},
//                               {"#Noun", "Apples"}}, &s);
//   EXPECT_EQ(count, 4);
//   EXPECT_EQ("Bob bought 5 Apples. Thanks Bob!", s);
int StrReplaceAll(
    std::initializer_list<std::pair<absl::string_view, absl::string_view>>
        replacements,
    std::string* target);
117 
// Overload of `StrReplaceAll()` to replace patterns within a given output
// string *in place* with replacements provided within a container of key/value
// pairs, returning the number of substitutions that occurred. When none of the
// keys occurs in `*target`, the string is left untouched and 0 is returned.
// `target` is dereferenced unconditionally and therefore must not be null.
//
// Example:
//
//   std::string s = std::string("if (ptr < &foo)");
//   std::vector<std::pair<absl::string_view, absl::string_view>> replacements =
//       {{"&", "&amp;"}, {"<", "&lt;"}, {">", "&gt;"}};
//   int count = absl::StrReplaceAll(replacements, &s);
//   EXPECT_EQ(count, 2);
//   EXPECT_EQ("if (ptr &lt; &amp;foo)", s);
template <typename StrToStrMapping>
int StrReplaceAll(const StrToStrMapping& replacements, std::string* target);
132 
133 // Implementation details only, past this point.
134 namespace strings_internal {
135 
136 struct ViableSubstitution {
137   absl::string_view old;
138   absl::string_view replacement;
139   size_t offset;
140 
ViableSubstitutionViableSubstitution141   ViableSubstitution(absl::string_view old_str,
142                      absl::string_view replacement_str, size_t offset_val)
143       : old(old_str), replacement(replacement_str), offset(offset_val) {}
144 
145   // One substitution occurs "before" another (takes priority) if either
146   // it has the lowest offset, or it has the same offset but a larger size.
OccursBeforeViableSubstitution147   bool OccursBefore(const ViableSubstitution& y) const {
148     if (offset != y.offset) return offset < y.offset;
149     return old.size() > y.old.size();
150   }
151 };
152 
153 // Build a vector of ViableSubstitutions based on the given list of
154 // replacements. subs can be implemented as a priority_queue. However, it turns
155 // out that most callers have small enough a list of substitutions that the
156 // overhead of such a queue isn't worth it.
157 template <typename StrToStrMapping>
FindSubstitutions(absl::string_view s,const StrToStrMapping & replacements)158 std::vector<ViableSubstitution> FindSubstitutions(
159     absl::string_view s, const StrToStrMapping& replacements) {
160   std::vector<ViableSubstitution> subs;
161   subs.reserve(replacements.size());
162 
163   for (const auto& rep : replacements) {
164     using std::get;
165     absl::string_view old(get<0>(rep));
166 
167     size_t pos = s.find(old);
168     if (pos == s.npos) continue;
169 
170     // Ignore attempts to replace "". This condition is almost never true,
171     // but above condition is frequently true. That's why we test for this
172     // now and not before.
173     if (old.empty()) continue;
174 
175     subs.emplace_back(old, get<1>(rep), pos);
176 
177     // Insertion sort to ensure the last ViableSubstitution comes before
178     // all the others.
179     size_t index = subs.size();
180     while (--index && subs[index - 1].OccursBefore(subs[index])) {
181       std::swap(subs[index], subs[index - 1]);
182     }
183   }
184   return subs;
185 }
186 
// Applies the substitutions in `*subs_ptr` to `s`. Only declared here so the
// templates below can call it; it is not defined in this header.
// NOTE(review): judging from the callers below, the output text is written to
// `*result_ptr` and the return value is the number of substitutions performed
// -- confirm against the definition.
int ApplySubstitutions(absl::string_view s,
                       std::vector<ViableSubstitution>* subs_ptr,
                       std::string* result_ptr);
190 
191 }  // namespace strings_internal
192 
193 template <typename StrToStrMapping>
StrReplaceAll(absl::string_view s,const StrToStrMapping & replacements)194 std::string StrReplaceAll(absl::string_view s,
195                           const StrToStrMapping& replacements) {
196   auto subs = strings_internal::FindSubstitutions(s, replacements);
197   std::string result;
198   result.reserve(s.size());
199   strings_internal::ApplySubstitutions(s, &subs, &result);
200   return result;
201 }
202 
203 template <typename StrToStrMapping>
StrReplaceAll(const StrToStrMapping & replacements,std::string * target)204 int StrReplaceAll(const StrToStrMapping& replacements, std::string* target) {
205   auto subs = strings_internal::FindSubstitutions(*target, replacements);
206   if (subs.empty()) return 0;
207 
208   std::string result;
209   result.reserve(target->size());
210   int substitutions =
211       strings_internal::ApplySubstitutions(*target, &subs, &result);
212   target->swap(result);
213   return substitutions;
214 }
215 
216 ABSL_NAMESPACE_END
217 }  // namespace absl
218 
219 #endif  // ABSL_STRINGS_STR_REPLACE_H_
220