GCC Code Coverage Report

Directory:	libs/url/
File:	libs/url/src/detail/normalize.cpp
Date:	2024-04-08 19:38:36
	Exec	Total	Coverage
Lines:	399	402	99.3%
Functions:	20	20	100.0%
Branches:	213	228	93.4%
  
      Line
      Branch
      Exec
      Source
    
      //
    
      // Copyright (c) 2016-2019 Vinnie Falco (vinnie dot falco at gmail dot com)
    
      // Copyright (c) 2022 Alan de Freitas (alandefreitas@gmail.com)
    
      //
    
      // Distributed under the Boost Software License, Version 1.0. (See accompanying
    
      // file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt)
    
      //
    
      // Official repository: https://github.com/boostorg/url
    
      //
    
      #include <boost/url/detail/config.hpp>
    
      #include <boost/url/decode_view.hpp>
    
      #include "decode.hpp"
    
      #include <boost/url/segments_encoded_view.hpp>
    
      #include <boost/url/grammar/ci_string.hpp>
    
      #include <boost/assert.hpp>
    
      #include <boost/core/ignore_unused.hpp>
    
      #include <cstring>
    
      #include "normalize.hpp"
    
      namespace boost {
    
      namespace urls {
    
      namespace detail {
    
      void
    
      7280
      pop_encoded_front(
    
          core::string_view& s,
    
          char& c,
    
          std::size_t& n) noexcept
    
      {
    
        2/2✓ Branch 1 taken 7190 times.
✓ Branch 2 taken 90 times.

      7280
          if(s.front() != '%')
    
          {
    
      7190
              c = s.front();
    
      7190
              s.remove_prefix(1);
    
          }
    
          else
    
          {
    
      90
              detail::decode_unsafe(
    
                  &c,
    
                  &c + 1,
    
                  s.substr(0, 3));
    
      90
              s.remove_prefix(3);
    
          }
    
      7280
          ++n;
    
      7280
      }
    
      int
    
      77
      compare_encoded(
    
          core::string_view lhs,
    
          core::string_view rhs) noexcept
    
      {
    
      77
          std::size_t n0 = 0;
    
      77
          std::size_t n1 = 0;
    
      77
          char c0 = 0;
    
      77
          char c1 = 0;
    
      205
          while(
    
        4/4✓ Branch 1 taken 253 times.
✓ Branch 2 taken 29 times.
✓ Branch 3 taken 240 times.
✓ Branch 4 taken 42 times.

      535
              !lhs.empty() &&
    
        2/2✓ Branch 1 taken 240 times.
✓ Branch 2 taken 13 times.

      253
              !rhs.empty())
    
          {
    
      240
              pop_encoded_front(lhs, c0, n0);
    
      240
              pop_encoded_front(rhs, c1, n1);
    
        2/2✓ Branch 0 taken 20 times.
✓ Branch 1 taken 220 times.

      240
              if (c0 < c1)
    
      20
                  return -1;
    
        2/2✓ Branch 0 taken 15 times.
✓ Branch 1 taken 205 times.

      220
              if (c1 < c0)
    
      15
                  return 1;
    
          }
    
      42
          n0 += detail::decode_bytes_unsafe(lhs);
    
      42
          n1 += detail::decode_bytes_unsafe(rhs);
    
        2/2✓ Branch 0 taken 21 times.
✓ Branch 1 taken 21 times.

      42
          if (n0 == n1)
    
      21
              return 0;
    
        2/2✓ Branch 0 taken 8 times.
✓ Branch 1 taken 13 times.

      21
          if (n0 < n1)
    
      8
              return -1;
    
      13
          return 1;
    
      }
    
      void
    
      1216
      digest_encoded(
    
          core::string_view s,
    
          fnv_1a& hasher) noexcept
    
      {
    
      1216
          char c = 0;
    
      1216
          std::size_t n = 0;
    
        2/2✓ Branch 1 taken 508 times.
✓ Branch 2 taken 1216 times.

      1724
          while(!s.empty())
    
          {
    
      508
              pop_encoded_front(s, c, n);
    
      508
              hasher.put(c);
    
          }
    
      1216
      }
    
      int
    
      159
      ci_compare_encoded(
    
          core::string_view lhs,
    
          core::string_view rhs) noexcept
    
      {
    
      159
          std::size_t n0 = 0;
    
      159
          std::size_t n1 = 0;
    
      159
          char c0 = 0;
    
      159
          char c1 = 0;
    
      2105
          while (
    
        4/4✓ Branch 1 taken 2121 times.
✓ Branch 2 taken 143 times.
✓ Branch 3 taken 2115 times.
✓ Branch 4 taken 149 times.

      4385
              !lhs.empty() &&
    
        2/2✓ Branch 1 taken 2115 times.
✓ Branch 2 taken 6 times.

      2121
              !rhs.empty())
    
          {
    
      2115
              pop_encoded_front(lhs, c0, n0);
    
      2115
              pop_encoded_front(rhs, c1, n1);
    
      2115
              c0 = grammar::to_lower(c0);
    
      2115
              c1 = grammar::to_lower(c1);
    
        2/2✓ Branch 0 taken 8 times.
✓ Branch 1 taken 2107 times.

      2115
              if (c0 < c1)
    
      8
                  return -1;
    
        2/2✓ Branch 0 taken 2 times.
✓ Branch 1 taken 2105 times.

      2107
              if (c1 < c0)
    
      2
                  return 1;
    
          }
    
      149
          n0 += detail::decode_bytes_unsafe(lhs);
    
      149
          n1 += detail::decode_bytes_unsafe(rhs);
    
        2/2✓ Branch 0 taken 142 times.
✓ Branch 1 taken 7 times.

      149
          if (n0 == n1)
    
      142
              return 0;
    
        2/2✓ Branch 0 taken 1 times.
✓ Branch 1 taken 6 times.

      7
          if (n0 < n1)
    
      1
              return -1;
    
      6
          return 1;
    
      }
    
      void
    
      304
      ci_digest_encoded(
    
          core::string_view s,
    
          fnv_1a& hasher) noexcept
    
      {
    
      304
          char c = 0;
    
      304
          std::size_t n = 0;
    
        2/2✓ Branch 1 taken 2062 times.
✓ Branch 2 taken 304 times.

      2366
          while(!s.empty())
    
          {
    
      2062
              pop_encoded_front(s, c, n);
    
      2062
              c = grammar::to_lower(c);
    
      2062
              hasher.put(c);
    
          }
    
      304
      }
    
      int
    
      46
      compare(
    
          core::string_view lhs,
    
          core::string_view rhs) noexcept
    
      {
    
      46
          auto rlen = (std::min)(lhs.size(), rhs.size());
    
        2/2✓ Branch 0 taken 79 times.
✓ Branch 1 taken 25 times.

      104
          for (std::size_t i = 0; i < rlen; ++i)
    
          {
    
      79
              char c0 = lhs[i];
    
      79
              char c1 = rhs[i];
    
        2/2✓ Branch 0 taken 13 times.
✓ Branch 1 taken 66 times.

      79
              if (c0 < c1)
    
      13
                  return -1;
    
        2/2✓ Branch 0 taken 8 times.
✓ Branch 1 taken 58 times.

      66
              if (c1 < c0)
    
      8
                  return 1;
    
          }
    
        2/2✓ Branch 2 taken 4 times.
✓ Branch 3 taken 21 times.

      25
          if ( lhs.size() == rhs.size() )
    
      4
              return 0;
    
        2/2✓ Branch 2 taken 8 times.
✓ Branch 3 taken 13 times.

      21
          if ( lhs.size() < rhs.size() )
    
      8
              return -1;
    
      13
          return 1;
    
      }
    
      int
    
      196
      ci_compare(
    
          core::string_view lhs,
    
          core::string_view rhs) noexcept
    
      {
    
      196
          auto rlen = (std::min)(lhs.size(), rhs.size());
    
        2/2✓ Branch 0 taken 800 times.
✓ Branch 1 taken 189 times.

      989
          for (std::size_t i = 0; i < rlen; ++i)
    
          {
    
      800
              char c0 = grammar::to_lower(lhs[i]);
    
      800
              char c1 = grammar::to_lower(rhs[i]);
    
        2/2✓ Branch 0 taken 6 times.
✓ Branch 1 taken 794 times.

      800
              if (c0 < c1)
    
      6
                  return -1;
    
        2/2✓ Branch 0 taken 1 times.
✓ Branch 1 taken 793 times.

      794
              if (c1 < c0)
    
      1
                  return 1;
    
          }
    
        2/2✓ Branch 2 taken 182 times.
✓ Branch 3 taken 7 times.

      189
          if ( lhs.size() == rhs.size() )
    
      182
              return 0;
    
        2/2✓ Branch 2 taken 6 times.
✓ Branch 3 taken 1 times.

      7
          if ( lhs.size() < rhs.size() )
    
      6
              return -1;
    
      1
          return 1;
    
      }
    
      void
    
      304
      ci_digest(
    
          core::string_view s,
    
          fnv_1a& hasher) noexcept
    
      {
    
        2/2✓ Branch 2 taken 730 times.
✓ Branch 3 taken 304 times.

      1034
          for (char c: s)
    
          {
    
      730
              c = grammar::to_lower(c);
    
      730
              hasher.put(c);
    
          }
    
      304
      }
    
      /* Check if a string ends with the specified suffix (decoded comparison)
    
         This function determines if a string ends with the specified suffix
    
         when the string and suffix are compared after percent-decoding.
    
         @param str The string to check (percent-encoded)
    
         @param suffix The suffix to check for (percent-decoded)
    
         @return The number of encoded chars consumed in the string
    
       */
    
      std::size_t
    
      2136
      path_ends_with(
    
          core::string_view str,
    
          core::string_view suffix) noexcept
    
      {
    
        1/2✗ Branch 1 not taken.
✓ Branch 2 taken 2136 times.

      2136
          BOOST_ASSERT(!str.empty());
    
        1/2✗ Branch 1 not taken.
✓ Branch 2 taken 2136 times.

      2136
          BOOST_ASSERT(!suffix.empty());
    
        1/2✗ Branch 1 not taken.
✓ Branch 2 taken 2136 times.

      2136
          BOOST_ASSERT(!suffix.contains("%2F"));
    
        1/2✗ Branch 1 not taken.
✓ Branch 2 taken 2136 times.

      2136
          BOOST_ASSERT(!suffix.contains("%2f"));
    
      5848
          auto consume_last = [](
    
              core::string_view::iterator& it,
    
              core::string_view::iterator& end,
    
              char& c)
    
          {
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 5848 times.

      5848
              BOOST_ASSERT(end > it);
    
        1/2✗ Branch 0 not taken.
✓ Branch 1 taken 5848 times.

      5848
              BOOST_ASSERT(it != end);
    
        4/4✓ Branch 0 taken 3960 times.
✓ Branch 1 taken 1888 times.
✓ Branch 2 taken 5800 times.
✓ Branch 3 taken 48 times.

      9808
              if ((end - it) < 3 ||
    
        2/2✓ Branch 1 taken 3912 times.
✓ Branch 2 taken 48 times.

      3960
                  *(std::prev(end, 3)) != '%')
    
              {
    
      5800
                  c = *--end;
    
      5800
                  return false;
    
              }
    
        1/2✓ Branch 2 taken 48 times.
✗ Branch 3 not taken.

      48
              detail::decode_unsafe(
    
                  &c,
    
                  &c + 1,
    
                  core::string_view(std::prev(
    
                      end, 3), 3));
    
      48
              end -= 3;
    
      48
              return true;
    
          };
    
      2136
          auto it0 = str.begin();
    
      2136
          auto end0 = str.end();
    
      2136
          auto it1 = suffix.begin();
    
      2136
          auto end1 = suffix.end();
    
      2136
          char c0 = 0;
    
      2136
          char c1 = 0;
    
      1112
          while(
    
        2/2✓ Branch 0 taken 3006 times.
✓ Branch 1 taken 242 times.

      3248
              it0 < end0 &&
    
        2/2✓ Branch 0 taken 2932 times.
✓ Branch 1 taken 74 times.

      3006
              it1 < end1)
    
          {
    
      2932
              bool const is_encoded = consume_last(it0, end0, c0);
    
              // The suffix never contains an encoded slash (%2F), and a decoded
    
              // slash is not equivalent to an encoded slash
    
        4/4✓ Branch 0 taken 48 times.
✓ Branch 1 taken 2884 times.
✓ Branch 2 taken 16 times.
✓ Branch 3 taken 32 times.

      2932
              if (is_encoded && c0 == '/')
    
      16
                  return 0;
    
      2916
              consume_last(it1, end1, c1);
    
        2/2✓ Branch 0 taken 1804 times.
✓ Branch 1 taken 1112 times.

      2916
              if (c0 != c1)
    
      1804
                  return 0;
    
          }
    
      316
          bool const consumed_suffix = it1 == end1;
    
        2/2✓ Branch 0 taken 110 times.
✓ Branch 1 taken 206 times.

      316
          if (consumed_suffix)
    
          {
    
      110
              std::size_t const consumed_encoded = str.end() - end0;
    
      110
              return consumed_encoded;
    
          }
    
      206
          return 0;
    
      }
    
      std::size_t
    
      832
      remove_dot_segments(
    
          char* dest0,
    
          char const* end,
    
          core::string_view input) noexcept
    
      {
    
          // 1. The input buffer `s` is initialized with
    
          // the now-appended path components and the
    
          // output buffer `dest0` is initialized to
    
          // the empty string.
    
      832
          char* dest = dest0;
    
      832
          bool const is_absolute = input.starts_with('/');
    
          // Step 2 is a loop through 5 production rules:
    
          // https://www.rfc-editor.org/rfc/rfc3986#section-5.2.4
    
          //
    
          // There are no transitions between all rules,
    
          // which enables some optimizations.
    
          //
    
          // Initial:
    
          // - Rule A: handle initial dots
    
          // If the input buffer begins with a
    
          // prefix of "../" or "./", then remove
    
          // that prefix from the input buffer.
    
          // Rule A can only happen at the beginning.
    
          // Errata 4547: Keep "../" in the beginning
    
          // https://www.rfc-editor.org/errata/eid4547
    
          //
    
          // Then:
    
          // - Rule D: ignore a final ".." or "."
    
          // if the input buffer consists only  of "."
    
          // or "..", then remove that from the input
    
          // buffer.
    
          // Rule D can only happen after Rule A because:
    
          // - B and C write "/" to the input
    
          // - E writes "/" to input or returns
    
          //
    
          // Then:
    
          // - Rule B: ignore ".": write "/" to the input
    
          // - Rule C: apply "..": remove seg and write "/"
    
          // - Rule E: copy complete segment
    
          auto append =
    
      1492
              [](char*& first, char const* last, core::string_view in)
    
          {
    
              // append `in` to `dest`
    
        1/2✗ Branch 1 not taken.
✓ Branch 2 taken 1492 times.

      1492
              BOOST_ASSERT(in.size() <= std::size_t(last - first));
    
      1492
              std::memmove(first, in.data(), in.size());
    
      1492
              first += in.size();
    
              ignore_unused(last);
    
      1492
          };
    
      9563
          auto dot_starts_with = [](
    
              core::string_view str, core::string_view dots, std::size_t& n)
    
          {
    
              // starts_with for encoded/decoded dots
    
              // or decoded otherwise. return how many
    
              // chars in str match the dots
    
      9563
              n = 0;
    
        2/2✓ Branch 2 taken 16368 times.
✓ Branch 3 taken 550 times.

      16918
              for (char c: dots)
    
              {
    
        2/2✓ Branch 1 taken 7355 times.
✓ Branch 2 taken 9013 times.

      16368
                  if (str.starts_with(c))
    
                  {
    
      7355
                      str.remove_prefix(1);
    
      7355
                      ++n;
    
      7355
                      continue;
    
                  }
    
                  // In the general case, we would need to
    
                  // check if the next char is an encoded
    
                  // dot.
    
                  // However, an encoded dot in `str`
    
                  // would have already been decoded in
    
                  // url_base::normalize_path().
    
                  // This needs to be undone if
    
                  // `remove_dot_segments` is used in a
    
                  // different context.
    
                  // if (str.size() > 2 &&
    
                  //     c == '.'
    
                  //     &&
    
                  //     str[0] == '%' &&
    
                  //     str[1] == '2' &&
    
                  //     (str[2] == 'e' ||
    
                  //      str[2] == 'E'))
    
                  // {
    
                  //     str.remove_prefix(3);
    
                  //     n += 3;
    
                  //     continue;
    
                  // }
    
      9013
                  n = 0;
    
      9013
                  return false;
    
              }
    
      550
              return true;
    
          };
    
      4777
          auto dot_equal = [&dot_starts_with](
    
      4777
              core::string_view str, core::string_view dots)
    
          {
    
      4777
              std::size_t n = 0;
    
      4777
              dot_starts_with(str, dots, n);
    
      4777
              return n == str.size();
    
      832
          };
    
          // Rule A
    
          std::size_t n;
    
        2/2✓ Branch 1 taken 767 times.
✓ Branch 2 taken 81 times.

      848
          while (!input.empty())
    
          {
    
        2/2✓ Branch 2 taken 4 times.
✓ Branch 3 taken 763 times.

      767
              if (dot_starts_with(input, "../", n))
    
              {
    
                  // Errata 4547
    
      4
                  append(dest, end, "../");
    
      4
                  input.remove_prefix(n);
    
      4
                  continue;
    
              }
    
        2/2✓ Branch 2 taken 751 times.
✓ Branch 3 taken 12 times.

      763
              else if (!dot_starts_with(input, "./", n))
    
              {
    
      751
                  break;
    
              }
    
      12
              input.remove_prefix(n);
    
          }
    
          // Rule D
    
        2/2✓ Branch 2 taken 82 times.
✓ Branch 3 taken 750 times.

      832
          if( dot_equal(input, "."))
    
          {
    
      82
              input = {};
    
          }
    
        2/2✓ Branch 2 taken 3 times.
✓ Branch 3 taken 747 times.

      750
          else if( dot_equal(input, "..") )
    
          {
    
              // Errata 4547
    
      3
              append(dest, end, "..");
    
      3
              input = {};
    
          }
    
          // 2. While the input buffer is not empty,
    
          // loop as follows:
    
        2/2✓ Branch 1 taken 1648 times.
✓ Branch 2 taken 793 times.

      2441
          while (!input.empty())
    
          {
    
              // Rule B
    
      1648
              bool const is_dot_seg = dot_starts_with(input, "/./", n);
    
        2/2✓ Branch 0 taken 32 times.
✓ Branch 1 taken 1616 times.

      1648
              if (is_dot_seg)
    
              {
    
      32
                  input.remove_prefix(n - 1);
    
      32
                  continue;
    
              }
    
      1616
              bool const is_final_dot_seg = dot_equal(input, "/.");
    
        2/2✓ Branch 0 taken 8 times.
✓ Branch 1 taken 1608 times.

      1616
              if (is_final_dot_seg)
    
              {
    
                  // We can't remove "." from a core::string_view
    
                  // So what we do here is equivalent to
    
                  // replacing s with '/' as required
    
                  // in Rule B and executing the next
    
                  // iteration, which would append this
    
                  // '/' to  the output, as required by
    
                  // Rule E
    
      8
                  append(dest, end, input.substr(0, 1));
    
      8
                  input = {};
    
      8
                  break;
    
              }
    
              // Rule C
    
      1608
              bool const is_dotdot_seg = dot_starts_with(input, "/../", n);
    
        2/2✓ Branch 0 taken 193 times.
✓ Branch 1 taken 1415 times.

      1608
              if (is_dotdot_seg)
    
              {
    
      193
                  core::string_view cur_out(dest0, dest - dest0);
    
      193
                  std::size_t p = cur_out.find_last_of('/');
    
      193
                  bool const has_multiple_segs = p != core::string_view::npos;
    
        2/2✓ Branch 0 taken 132 times.
✓ Branch 1 taken 61 times.

      193
                  if (has_multiple_segs)
    
                  {
    
                      // output has multiple segments
    
                      // "erase" [p, end] if not "/.."
    
      132
                      core::string_view last_seg(dest0 + p, dest - (dest0 + p));
    
      132
                      bool const prev_is_dotdot_seg = dot_equal(last_seg, "/..");
    
        2/2✓ Branch 0 taken 121 times.
✓ Branch 1 taken 11 times.

      132
                      if (!prev_is_dotdot_seg)
    
                      {
    
      121
                          dest = dest0 + p;
    
                      }
    
                      else
    
                      {
    
      11
                          append(dest, end, "/..");
    
                      }
    
                  }
    
        2/2✓ Branch 0 taken 11 times.
✓ Branch 1 taken 50 times.

      61
                  else if (dest0 != dest)
    
                  {
    
                      // Only one segment in the output: remove it
    
      11
                      core::string_view last_seg(dest0, dest - dest0);
    
      11
                      bool const prev_is_dotdot_seg = dot_equal(last_seg, "..");
    
        2/2✓ Branch 0 taken 9 times.
✓ Branch 1 taken 2 times.

      11
                      if (!prev_is_dotdot_seg)
    
                      {
    
      9
                          dest = dest0;
    
        1/2✓ Branch 0 taken 9 times.
✗ Branch 1 not taken.

      9
                          if (!is_absolute)
    
                          {
    
      9
                              input.remove_prefix(1);
    
                          }
    
                      }
    
                      else
    
                      {
    
      2
                          append(dest, end, "/..");
    
                      }
    
                  }
    
                  else
    
                  {
    
                      // Output is empty
    
        1/2✓ Branch 0 taken 50 times.
✗ Branch 1 not taken.

      50
                      if (is_absolute)
    
                      {
    
      50
                          append(dest, end, "/..");
    
                      }
    
                      else
    
                      {
    
                          // AFREITAS: Although we have no formal proof
    
                          // for that, the output can't be relative
    
                          // and empty at this point because relative
    
                          // paths will fall in the `dest0 != dest`
    
                          // case above of this rule C and then the
    
                          // general case of rule E for "..".
    
      ✗
                          append(dest, end, "..");
    
                      }
    
                  }
    
      193
                  input.remove_prefix(n - 1);
    
      193
                  continue;
    
              }
    
      1415
              bool const is_final_dotdot_seg = dot_equal(input, "/..");
    
        2/2✓ Branch 0 taken 31 times.
✓ Branch 1 taken 1384 times.

      1415
              if (is_final_dotdot_seg)
    
              {
    
      31
                  core::string_view cur_out(dest0, dest - dest0);
    
      31
                  std::size_t p = cur_out.find_last_of('/');
    
      31
                  bool const has_multiple_segs = p != core::string_view::npos;
    
        2/2✓ Branch 0 taken 18 times.
✓ Branch 1 taken 13 times.

      31
                  if (has_multiple_segs)
    
                  {
    
                      // output has multiple segments
    
                      // "erase" [p, end] if not "/.."
    
      18
                      core::string_view last_seg(dest0 + p, dest - (dest0 + p));
    
      18
                      bool const prev_is_dotdot_seg = dot_equal(last_seg, "/..");
    
        2/2✓ Branch 0 taken 14 times.
✓ Branch 1 taken 4 times.

      18
                      if (!prev_is_dotdot_seg)
    
                      {
    
      14
                          dest = dest0 + p;
    
      14
                          append(dest, end, "/");
    
                      }
    
                      else
    
                      {
    
      4
                          append(dest, end, "/..");
    
                      }
    
                  }
    
        2/2✓ Branch 0 taken 3 times.
✓ Branch 1 taken 10 times.

      13
                  else if (dest0 != dest)
    
                  {
    
                      // Only one segment in the output: remove it
    
      3
                      core::string_view last_seg(dest0, dest - dest0);
    
      3
                      bool const prev_is_dotdot_seg = dot_equal(last_seg, "..");
    
        2/2✓ Branch 0 taken 1 times.
✓ Branch 1 taken 2 times.

      3
                      if (!prev_is_dotdot_seg) {
    
      1
                          dest = dest0;
    
                      }
    
                      else
    
                      {
    
      2
                          append(dest, end, "/..");
    
                      }
    
                  }
    
                  else
    
                  {
    
                      // Output is empty: append dotdot
    
        1/2✓ Branch 0 taken 10 times.
✗ Branch 1 not taken.

      10
                      if (is_absolute)
    
                      {
    
      10
                          append(dest, end, "/..");
    
                      }
    
                      else
    
                      {
    
                          // AFREITAS: Although we have no formal proof
    
                          // for that, the output can't be relative
    
                          // and empty at this point because relative
    
                          // paths will fall in the `dest0 != dest`
    
                          // case above of this rule C and then the
    
                          // general case of rule E for "..".
    
      ✗
                          append(dest, end, "..");
    
                      }
    
                  }
    
      31
                  input = {};
    
      31
                  break;
    
              }
    
              // Rule E
    
      1384
              std::size_t p = input.find_first_of('/', 1);
    
        2/2✓ Branch 0 taken 676 times.
✓ Branch 1 taken 708 times.

      1384
              if (p != core::string_view::npos)
    
              {
    
      676
                  append(dest, end, input.substr(0, p));
    
      676
                  input.remove_prefix(p);
    
              }
    
              else
    
              {
    
      708
                  append(dest, end, input);
    
      708
                  input = {};
    
              }
    
          }
    
          // 3. Finally, the output buffer is set
    
          // as the result of remove_dot_segments,
    
          // and we return its size
    
      832
          return dest - dest0;
    
      }
    
      char
    
      1154
      path_pop_back( core::string_view& s )
    
      {
    
        4/4✓ Branch 1 taken 522 times.
✓ Branch 2 taken 632 times.
✓ Branch 3 taken 1102 times.
✓ Branch 4 taken 52 times.

      1676
          if (s.size() < 3 ||
    
        3/4✓ Branch 2 taken 522 times.
✗ Branch 3 not taken.
✓ Branch 4 taken 470 times.
✓ Branch 5 taken 52 times.

      522
              *std::prev(s.end(), 3) != '%')
    
          {
    
      1102
              char c = s.back();
    
      1102
              s.remove_suffix(1);
    
      1102
              return c;
    
          }
    
      52
          char c = 0;
    
        1/2✓ Branch 2 taken 52 times.
✗ Branch 3 not taken.

      104
          detail::decode_unsafe(
    
      104
              &c, &c + 1, s.substr(s.size() - 3));
    
        2/2✓ Branch 0 taken 44 times.
✓ Branch 1 taken 8 times.

      52
          if (c != '/')
    
          {
    
      44
              s.remove_suffix(3);
    
      44
              return c;
    
          }
    
      8
          c = s.back();
    
      8
          s.remove_suffix(1);
    
      8
          return c;
    
      };
    
      void
    
      538
      pop_last_segment(
    
          core::string_view& str,
    
          core::string_view& seg,
    
          std::size_t& level,
    
          bool remove_unmatched) noexcept
    
      {
    
      538
          seg = {};
    
      538
          std::size_t n = 0;
    
        2/2✓ Branch 1 taken 558 times.
✓ Branch 2 taken 142 times.

      700
          while (!str.empty())
    
          {
    
              // B.  if the input buffer begins with a
    
              // prefix of "/./" or "/.", where "." is
    
              // a complete path segment, then replace
    
              // that prefix with "/" in the input
    
              // buffer; otherwise,
    
      558
              n = detail::path_ends_with(str, "/./");
    
        2/2✓ Branch 0 taken 10 times.
✓ Branch 1 taken 548 times.

      558
              if (n)
    
              {
    
      10
                  seg = str.substr(str.size() - n);
    
      10
                  str.remove_suffix(n);
    
      10
                  continue;
    
              }
    
      548
              n = detail::path_ends_with(str, "/.");
    
        2/2✓ Branch 0 taken 12 times.
✓ Branch 1 taken 536 times.

      548
              if (n)
    
              {
    
      12
                  seg = str.substr(str.size() - n, 1);
    
      12
                  str.remove_suffix(n);
    
      12
                  continue;
    
              }
    
              // C. if the input buffer begins with a
    
              // prefix of "/../" or "/..", where ".."
    
              // is a complete path segment, then
    
              // replace that prefix with "/" in the
    
              // input buffer and remove the last
    
              // segment and its preceding "/"
    
              // (if any) from the output buffer
    
              // otherwise,
    
      536
              n = detail::path_ends_with(str, "/../");
    
        2/2✓ Branch 0 taken 42 times.
✓ Branch 1 taken 494 times.

      536
              if (n)
    
              {
    
      42
                  seg = str.substr(str.size() - n);
    
      42
                  str.remove_suffix(n);
    
      42
                  ++level;
    
      42
                  continue;
    
              }
    
      494
              n = detail::path_ends_with(str, "/..");
    
        2/2✓ Branch 0 taken 46 times.
✓ Branch 1 taken 448 times.

      494
              if (n)
    
              {
    
      46
                  seg = str.substr(str.size() - n);
    
      46
                  str.remove_suffix(n);
    
      46
                  ++level;
    
      46
                  continue;
    
              }
    
              // E.  move the first path segment in the
    
              // input buffer to the end of the output
    
              // buffer, including the initial "/"
    
              // character (if any) and any subsequent
    
              // characters up to, but not including,
    
              // the next "/" character or the end of
    
              // the input buffer.
    
      448
              std::size_t p = str.size() > 1
    
        2/2✓ Branch 0 taken 374 times.
✓ Branch 1 taken 74 times.

      448
                  ? str.find_last_of('/', str.size() - 2)
    
      448
                  : core::string_view::npos;
    
        2/2✓ Branch 0 taken 276 times.
✓ Branch 1 taken 172 times.

      448
              if (p != core::string_view::npos)
    
              {
    
      276
                  seg = str.substr(p + 1);
    
      276
                  str.remove_suffix(seg.size());
    
              }
    
              else
    
              {
    
      172
                  seg = str;
    
      172
                  str = {};
    
              }
    
        2/2✓ Branch 0 taken 396 times.
✓ Branch 1 taken 52 times.

      448
              if (level == 0)
    
      396
                  return;
    
        2/2✓ Branch 1 taken 42 times.
✓ Branch 2 taken 10 times.

      52
              if (!str.empty())
    
      42
                  --level;
    
          }
    
          // we still need to skip n_skip + 1
    
          // but the string is empty
    
        4/4✓ Branch 0 taken 42 times.
✓ Branch 1 taken 100 times.
✓ Branch 2 taken 34 times.
✓ Branch 3 taken 8 times.

      142
          if (remove_unmatched && level)
    
          {
    
      34
              seg = "/";
    
      34
              level = 0;
    
      34
              return;
    
          }
    
        2/2✓ Branch 0 taken 4 times.
✓ Branch 1 taken 104 times.

      108
          else if (level)
    
          {
    
        1/2✓ Branch 1 taken 4 times.
✗ Branch 2 not taken.

      4
              if (!seg.empty())
    
              {
    
      4
                  seg = "/../";
    
              }
    
              else
    
              {
    
                  // AFREITAS: this condition
    
                  // is correct, but it might be
    
                  // unreachable.
    
      ✗
                  seg = "/..";
    
              }
    
      4
              --level;
    
      4
              return;
    
          }
    
      104
          seg = {};
    
      }
    
      // Feed `hasher` with the characters of `str`,
    
      // one segment at a time, starting from the end
    
      // of the path. Segments are obtained from
    
      // pop_last_segment, which receives `level` and
    
      // `remove_unmatched` to deal with "." and ".."
    
      // segments. Nothing is returned: the result is
    
      // the state accumulated in `hasher`.
    
      void
    
      304
      normalized_path_digest(
    
          core::string_view str,
    
          bool remove_unmatched,
    
          fnv_1a& hasher) noexcept
    
      {
    
          // segment handed back by pop_last_segment
    
      304
          core::string_view seg;
    
          // counter shared across pop_last_segment
    
          // calls (it tracks ".." segments seen)
    
      304
          std::size_t level = 0;
    
          // do/while: pop_last_segment is called at
    
          // least once, even when `str` is empty
    
      234
          do
    
          {
    
      538
              pop_last_segment(
    
                  str, seg, level, remove_unmatched);
    
              // hash the segment back to front;
    
              // path_pop_back is defined elsewhere and
    
              // presumably removes and returns the last
    
              // (decoded) char of seg - TODO confirm
    
        2/2✓ Branch 1 taken 1154 times.
✓ Branch 2 taken 538 times.

      1692
              while (!seg.empty())
    
              {
    
      1154
                  char c = path_pop_back(seg);
    
      1154
                  hasher.put(c);
    
              }
    
          }
    
        2/2✓ Branch 1 taken 234 times.
✓ Branch 2 taken 304 times.

      538
          while (!str.empty());
    
      304
      }
    
      // Compare two segment ranges as if both
    
      // paths were normalized, without building
    
      // the normalized strings: "." segments are
    
      // ignored and ".." segments cancel the
    
      // closest preceding regular segment.
    
      // Characters are read through decode_view
    
      // and compared walking from the end of each
    
      // path towards its beginning. Returns -1,
    
      // 0, or +1.
    
      int
    
      173
      segments_compare(
    
          segments_encoded_view seg0,
    
          segments_encoded_view seg1) noexcept
    
      {
    
          // calculate path size as if it were normalized
    
          // (walks the segments back to front: every
    
          // ".." adds a pending skip, "." is ignored,
    
          // and any other segment either uses up a
    
          // pending skip or adds dseg.size() plus
    
          // one, presumably for its '/')
    
          auto normalized_size =
    
      346
              [](segments_encoded_view seg) -> std::size_t
    
          {
    
        2/2✓ Branch 1 taken 108 times.
✓ Branch 2 taken 238 times.

      346
              if (seg.empty())
    
                  // no segments: the bool converts to
    
                  // 1 for an absolute path, 0 otherwise
    
      108
                  return seg.is_absolute();
    
      238
              std::size_t n = 0;
    
      238
              std::size_t skip = 0;
    
      238
              auto begin = seg.begin();
    
      238
              auto it = seg.end();
    
        2/2✓ Branch 1 taken 662 times.
✓ Branch 2 taken 238 times.

      900
              while (it != begin)
    
              {
    
      662
                  --it;
    
      662
                  decode_view dseg = **it;
    
        2/2✓ Branch 1 taken 167 times.
✓ Branch 2 taken 495 times.

      662
                  if (dseg == "..")
    
      167
                      ++skip;
    
        2/2✓ Branch 1 taken 457 times.
✓ Branch 2 taken 38 times.

      495
                  else if (dseg != ".")
    
                  {
    
        2/2✓ Branch 0 taken 85 times.
✓ Branch 1 taken 372 times.

      457
                      if (skip)
    
      85
                          --skip;
    
                      else
    
      372
                          n += dseg.size() + 1;
    
                  }
    
              }
    
              // ".." segments left unmatched count
    
              // three chars each (consume_last emits
    
              // them from the "/.." pattern)
    
      238
              n += skip * 3;
    
              // one char less when the path is not
    
              // absolute.
    
              // NOTE(review): n is unsigned; if nothing
    
              // was added above (e.g. a relative path
    
              // made only of "." segments) this wraps
    
              // around - confirm this cannot be reached
    
      238
              n -= !seg.is_absolute();
    
      238
              return n;
    
          };
    
          // find the normalized size for the comparison
    
      173
          std::size_t n0 = normalized_size(seg0);
    
      173
          std::size_t n1 = normalized_size(seg1);
    
          // keep the original sizes: n0 and n1 are
    
          // decremented by consume_last below
    
      173
          std::size_t n00 = n0;
    
      173
          std::size_t n10 = n1;
    
          // consume the last char from a segment range
    
          //   n        chars left, decremented on
    
          //            every call
    
          //   dseg     segment currently being read
    
          //   begin    first segment of the range
    
          //   it       iterator to the current segment
    
          //   cit      position in dseg, moving towards
    
          //            dseg.begin()
    
          //   skip     pending ".." segments
    
          //   at_slash set when the char just returned
    
          //            was a '/' between segments
    
          auto consume_last =
    
      1640
              [](
    
                  std::size_t& n,
    
                  decode_view& dseg,
    
                  segments_encoded_view::iterator& begin,
    
                  segments_encoded_view::iterator& it,
    
                  decode_view::iterator& cit,
    
                  std::size_t& skip,
    
                  bool& at_slash) -> char
    
          {
    
        2/2✓ Branch 2 taken 1009 times.
✓ Branch 3 taken 631 times.

      1640
              if (cit != dseg.begin())
    
              {
    
                  // return last char from current segment
    
      1009
                  at_slash = false;
    
      1009
                  --cit;
    
      1009
                  --n;
    
      1009
                  return *cit;
    
              }
    
        2/2✓ Branch 0 taken 371 times.
✓ Branch 1 taken 260 times.

      631
              if (!at_slash)
    
              {
    
                  // current segment dseg is over and
    
                  // previous char was not a slash
    
                  // so we output one
    
      371
                  at_slash = true;
    
      371
                  --n;
    
      371
                  return '/';
    
              }
    
              // current segment dseg is over and
    
              // last char was already the slash
    
              // between segments, so take the
    
              // next final segment to consume
    
      260
              at_slash = false;
    
        1/2✓ Branch 2 taken 498 times.
✗ Branch 3 not taken.

      498
              while (cit == dseg.begin())
    
              {
    
                  // take next segment
    
        2/2✓ Branch 1 taken 376 times.
✓ Branch 2 taken 122 times.

      498
                  if (it != begin)
    
      376
                      --it;
    
                  else
    
      122
                      break;
    
        2/2✓ Branch 3 taken 140 times.
✓ Branch 4 taken 236 times.

      376
                  if (**it == "..")
    
                  {
    
                      // skip next if this is ".."
    
      140
                      ++skip;
    
                  }
    
        2/2✓ Branch 3 taken 208 times.
✓ Branch 4 taken 28 times.

      236
                  else if (**it != ".")
    
                  {
    
        2/2✓ Branch 0 taken 70 times.
✓ Branch 1 taken 138 times.

      208
                      if (skip)
    
                      {
    
                          // discount skips
    
      70
                          --skip;
    
                      }
    
                      else
    
                      {
    
                          // or update current seg
    
      138
                          dseg = **it;
    
      138
                          cit = dseg.end();
    
      138
                          break;
    
                      }
    
                  }
    
              }
    
              // consume from the new current
    
              // segment
    
      260
              --n;
    
        2/2✓ Branch 2 taken 123 times.
✓ Branch 3 taken 137 times.

      260
              if (cit != dseg.begin())
    
              {
    
                  // in the general case, we consume
    
                  // one more character from the end
    
      123
                  --cit;
    
      123
                  return *cit;
    
              }
    
              // nothing left to consume in the
    
              // current and new segment
    
        2/2✓ Branch 1 taken 128 times.
✓ Branch 2 taken 9 times.

      137
              if (it == begin)
    
              {
    
                  // if this is the first
    
                  // segment, the segments are
    
                  // over and there can only
    
                  // be repetitions of "../" to
    
                  // output
    
                  // (n was already decremented, so
    
                  // n % 3 selects the char for the
    
                  // position being produced)
    
      128
                  return "/.."[n % 3];
    
              }
    
              // at other segments, we need
    
              // a slash to transition to the
    
              // next segment
    
      9
              at_slash = true;
    
      9
              return '/';
    
          };
    
          // consume final segments from seg0 that
    
          // should not influence the comparison
    
      173
          auto begin0 = seg0.begin();
    
      173
          auto it0 = seg0.end();
    
      173
          decode_view dseg0;
    
          // NOTE(review): the last segment is loaded
    
          // as-is here, even when it is "." or "..";
    
          // consume_last only filters the segments
    
          // it advances to - confirm this is intended
    
        2/2✓ Branch 2 taken 119 times.
✓ Branch 3 taken 54 times.

      173
          if (it0 != seg0.begin())
    
          {
    
      119
              --it0;
    
      119
              dseg0 = **it0;
    
          }
    
      173
          decode_view::iterator cit0 = dseg0.end();
    
      173
          std::size_t skip0 = 0;
    
      173
          bool at_slash0 = true;
    
          // drop chars from the end of seg0 until
    
          // it has no more chars left than seg1
    
        2/2✓ Branch 0 taken 134 times.
✓ Branch 1 taken 173 times.

      307
          while (n0 > n1)
    
          {
    
      134
              consume_last(n0, dseg0, begin0, it0, cit0, skip0, at_slash0);
    
          }
    
          // consume final segments from seg1 that
    
          // should not influence the comparison
    
      173
          auto begin1 = seg1.begin();
    
      173
          auto it1 = seg1.end();
    
      173
          decode_view dseg1;
    
        2/2✓ Branch 2 taken 119 times.
✓ Branch 3 taken 54 times.

      173
          if (it1 != seg1.begin())
    
          {
    
      119
              --it1;
    
      119
              dseg1 = **it1;
    
          }
    
      173
          decode_view::iterator cit1 = dseg1.end();
    
      173
          std::size_t skip1 = 0;
    
      173
          bool at_slash1 = true;
    
          // same trimming for seg1; at most one of
    
          // the two trimming loops does any work
    
        2/2✓ Branch 0 taken 34 times.
✓ Branch 1 taken 173 times.

      207
          while (n1 > n0)
    
          {
    
      34
              consume_last(n1, dseg1, begin1, it1, cit1, skip1, at_slash1);
    
          }
    
          // compare the remaining chars back to
    
          // front; later iterations overwrite cmp,
    
          // so the difference closest to the
    
          // beginning of the paths decides
    
      173
          int cmp = 0;
    
        2/2✓ Branch 0 taken 736 times.
✓ Branch 1 taken 173 times.

      909
          while (n0)
    
          {
    
      736
              char c0 = consume_last(
    
                  n0, dseg0, begin0, it0, cit0, skip0, at_slash0);
    
      736
              char c1 = consume_last(
    
                  n1, dseg1, begin1, it1, cit1, skip1, at_slash1);
    
        2/2✓ Branch 0 taken 36 times.
✓ Branch 1 taken 700 times.

      736
              if (c0 < c1)
    
      36
                  cmp = -1;
    
        2/2✓ Branch 0 taken 41 times.
✓ Branch 1 taken 659 times.

      700
              else if (c1 < c0)
    
      41
                  cmp = +1;
    
          }
    
        2/2✓ Branch 0 taken 41 times.
✓ Branch 1 taken 132 times.

      173
          if (cmp != 0)
    
      41
              return cmp;
    
          // the compared chars are all equal: the
    
          // original sizes decide, smaller first
    
        2/2✓ Branch 0 taken 130 times.
✓ Branch 1 taken 2 times.

      132
          if ( n00 == n10 )
    
      130
              return 0;
    
        2/2✓ Branch 0 taken 1 times.
✓ Branch 1 taken 1 times.

      2
          if ( n00 < n10 )
    
      1
              return -1;
    
      1
          return 1;
    
      }
    
      } // detail
    
      } // urls
    
      } // boost