envoyproxy · mattklein123 · Jul 30, 2019 · Jul 17, 2019 · Jul 17, 2019 · Jul 18, 2019
diff --git a/source/common/http/conn_manager_utility.cc b/source/common/http/conn_manager_utility.cc
@@ -397,7 +397,7 @@ bool ConnectionManagerUtility::maybeNormalizePath(HeaderMap& request_headers,
     is_valid_path = PathUtil::canonicalPath(*request_headers.Path());
   }
   // Merge slashes after path normalization to catch potential edge cases with percent encoding.
-  if (config.shouldMergeSlashes()) {
+  if (is_valid_path && config.shouldMergeSlashes()) {
     PathUtil::mergeSlashes(*request_headers.Path());
   }
   return is_valid_path;

diff --git a/source/common/http/path_utility.cc b/source/common/http/path_utility.cc
@@ -52,41 +52,25 @@ bool PathUtil::canonicalPath(HeaderEntry& path_header) {
   return true;
 }
 
-/* static */
 void PathUtil::mergeSlashes(HeaderEntry& path_header) {
   const auto original_path = path_header.value().getStringView();
-  if (original_path.empty()) {
-    return;
-  }
-
-  bool has_adjacent_slashes = false;
-  for (size_t i = 1; i < original_path.size(); ++i) {
-    if (original_path[i] == '/' && original_path[i - 1] == '/') {
-      has_adjacent_slashes = true;
-      break;
-    }
-    // Only operate on path component in URL.
-    if (original_path[i] == '?') {
-      break;
-    }
-  }
-  if (!has_adjacent_slashes) {
+  // Only operate on the path component of the URL; the query (from '?' onward) is kept verbatim.
+  const size_t query_start = original_path.find('?');
+  const auto path = original_path.substr(0, query_start);
+  const auto query = absl::ClippedSubstr(original_path, query_start);
+  if (path.find("//") == absl::string_view::npos) {
     return;
   }
 
   std::string simplified_path;
   simplified_path.reserve(original_path.size());
-  for (size_t i = 0; i < original_path.size(); ++i) {
-    if (i > 0 && original_path[i] == '/' && original_path[i - 1] == '/') {
+  for (size_t i = 0; i < path.size(); ++i) {
+    if (i > 0 && path[i] == '/' && path[i - 1] == '/') {
       continue;
     }
-    // Only operate on path component in URL.
-    if (original_path[i] == '?') {
-      simplified_path.insert(simplified_path.end(), original_path.begin() + i, original_path.end());
-      break;
-    }
-    simplified_path.push_back(original_path[i]);
+    simplified_path.push_back(path[i]);
   }
+  simplified_path.insert(simplified_path.end(), query.begin(), query.end());
   path_header.value(simplified_path);
 }
 

diff --git a/test/common/http/path_utility_test.cc b/test/common/http/path_utility_test.cc
@@ -87,21 +87,20 @@ TEST_F(PathUtilityTest, NormalizeCasePath) {
 
 // Paths that are valid get normalized.
 TEST_F(PathUtilityTest, MergeSlashes) {
-  const std::vector<std::pair<std::string, std::string>> non_normal_pairs{
-      {"", ""},                        // empty
-      {"/a", "/a"},                    // no-op
-      {"//a/b/c", "/a/b/c"},           // double / start
-      {"/a//b/c", "/a/b/c"},           // double / in the middle
-      {"/a//b?a=///c", "/a/b?a=///c"}, // slashes in the query are ignored
-      {"/a//b?", "/a/b?"},             // empty query
-  };
-
-  for (const auto& path_pair : non_normal_pairs) {
-    auto& path_header = pathHeaderEntry(path_pair.first);
+  auto mergeSlashes = [this](const std::string& path_value) {
+    auto& path_header = pathHeaderEntry(path_value);
     PathUtil::mergeSlashes(path_header);
-    EXPECT_EQ(path_header.value().getStringView(), path_pair.second)
-        << "original path: " << path_pair.first;
-  }
+    auto sanitized_path_value = path_header.value().getStringView();
+    return std::string(sanitized_path_value.begin(), sanitized_path_value.end());
+  };
+  EXPECT_EQ("", mergeSlashes(""));                        // empty
+  EXPECT_EQ("/a", mergeSlashes("/a"));                    // no-op
+  EXPECT_EQ("/a/b/c", mergeSlashes("//a/b/c"));           // double / start
+  EXPECT_EQ("/a/b/c", mergeSlashes("/a//b/c"));           // double / in the middle
+  EXPECT_EQ("/a/b/c", mergeSlashes("/a///b/c"));          // triple / in the middle
+  EXPECT_EQ("/a/b/c", mergeSlashes("/a////b/c"));         // quadruple / in the middle
+  EXPECT_EQ("/a/b?a=///c", mergeSlashes("/a//b?a=///c")); // slashes in the query are ignored
+  EXPECT_EQ("/a/b?", mergeSlashes("/a//b?"));             // empty query
 }
 
 } // namespace Http