// Copyright 2013 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
4c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
5c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)#include "base/logging.h"
6c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)#include "url/url_canon.h"
7c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)#include "url/url_canon_internal.h"
8c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)#include "url/url_parse_internal.h"
9c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
100529e5d033099cbfc42635f6f6183833b09dff6eBen Murdochnamespace url {
11c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
12c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)namespace {
13c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
// Per-character handling flags. One of these values is stored for every byte
// in kPathCharLookup and consulted by DoPartialPath.
enum CharacterFlags {
  // Pass through unchanged, whether escaped or unescaped. This doesn't
  // actually set any bit, so you can't test for it with a bitwise AND; it's
  // just to make the table below more clear when neither ESCAPE nor UNESCAPE
  // is set.
  PASS = 0,

  // This character requires special handling in DoPartialPath. Doing this test
  // first allows us to filter out the common cases of regular characters that
  // can be directly copied.
  SPECIAL = 1,

  // This character must be escaped in the canonical output. Note that all
  // escaped chars also have the "special" bit set so that the code that looks
  // for this is triggered. Not valid with PASS or UNESCAPE.
  ESCAPE_BIT = 2,
  ESCAPE = ESCAPE_BIT | SPECIAL,

  // This character must be unescaped in canonical output. Not valid with
  // ESCAPE or PASS. We DON'T set the SPECIAL flag since if we encounter these
  // characters unescaped, they should just be copied.
  UNESCAPE = 4,

  // This character is disallowed in URLs. Note that the "special" bit is also
  // set to trigger handling.
  INVALID_BIT = 8,
  INVALID = INVALID_BIT | SPECIAL,
};
41c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
42c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// This table contains one of the above flag values. Note some flags are more
43c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// than one bits because they also turn on the "special" flag. Special is the
44c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// only flag that may be combined with others.
45c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)//
46c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// This table is designed to match exactly what IE does with the characters.
47c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)//
48c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// Dot is even more special, and the escaped version is handled specially by
49c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// IsDot. Therefore, we don't need the "escape" flag, and even the "unescape"
50c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// bit is never handled (we just need the "special") bit.
51c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)const unsigned char kPathCharLookup[0x100] = {
52c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)//   NULL     control chars...
53c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)     INVALID, ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,
54c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)//   control chars...
55c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)     ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,
56c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)//   ' '      !        "        #        $        %        &        '        (        )        *        +        ,        -        .        /
57c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)     ESCAPE,  PASS,    ESCAPE,  ESCAPE,  PASS,    ESCAPE,  PASS,    PASS,    PASS,    PASS,    PASS,    PASS,    PASS,    UNESCAPE,SPECIAL, PASS,
58c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)//   0        1        2        3        4        5        6        7        8        9        :        ;        <        =        >        ?
59c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)     UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,PASS,    PASS,    ESCAPE,  PASS,    ESCAPE,  ESCAPE,
60c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)//   @        A        B        C        D        E        F        G        H        I        J        K        L        M        N        O
61c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)     PASS,    UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,
62c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)//   P        Q        R        S        T        U        V        W        X        Y        Z        [        \        ]        ^        _
63c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)     UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,PASS,    ESCAPE,  PASS,    ESCAPE,  UNESCAPE,
64c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)//   `        a        b        c        d        e        f        g        h        i        j        k        l        m        n        o
65c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)     ESCAPE,  UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,
66c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)//   p        q        r        s        t        u        v        w        x        y        z        {        |        }        ~        <NBSP>
67c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)     UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,UNESCAPE,ESCAPE,  ESCAPE,  ESCAPE,  UNESCAPE,ESCAPE,
68c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)//   ...all the high-bit characters are escaped
69c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)     ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,
70c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)     ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,
71c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)     ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,
72c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)     ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,
73c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)     ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,
74c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)     ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,
75c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)     ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,
76c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)     ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE,  ESCAPE};
77c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
// Classification of a dot found in a path, as returned by ClassifyAfterDot.
enum DotDisposition {
  // The given dot is just part of a filename and is not special.
  NOT_A_DIRECTORY,

  // The given dot is the current directory.
  DIRECTORY_CUR,

  // The given dot is the first of a double dot that should take us up one.
  DIRECTORY_UP
};
88c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
89c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// When the path resolver finds a dot, this function is called with the
90c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// character following that dot to see what it is. The return value
91c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// indicates what type this dot is (see above). This code handles the case
92c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// where the dot is at the end of the input.
93c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)//
94c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// |*consumed_len| will contain the number of characters in the input that
95c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// express what we found.
96c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)//
97c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// If the input is "../foo", |after_dot| = 1, |end| = 6, and
98c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// at the end, |*consumed_len| = 2 for the "./" this function consumed. The
99c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// original dot length should be handled by the caller.
100c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)template<typename CHAR>
101c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)DotDisposition ClassifyAfterDot(const CHAR* spec, int after_dot,
102c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                                int end, int* consumed_len) {
103c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  if (after_dot == end) {
104c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    // Single dot at the end.
105c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    *consumed_len = 0;
106c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    return DIRECTORY_CUR;
107c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  }
1080529e5d033099cbfc42635f6f6183833b09dff6eBen Murdoch  if (IsURLSlash(spec[after_dot])) {
109c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    // Single dot followed by a slash.
110c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    *consumed_len = 1;  // Consume the slash
111c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    return DIRECTORY_CUR;
112c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  }
113c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
114c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  int second_dot_len = IsDot(spec, after_dot, end);
115c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  if (second_dot_len) {
116c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    int after_second_dot = after_dot + second_dot_len;
117c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    if (after_second_dot == end) {
118c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)      // Double dot at the end.
119c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)      *consumed_len = second_dot_len;
120c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)      return DIRECTORY_UP;
121c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    }
1220529e5d033099cbfc42635f6f6183833b09dff6eBen Murdoch    if (IsURLSlash(spec[after_second_dot])) {
123c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)      // Double dot followed by a slash.
124c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)      *consumed_len = second_dot_len + 1;
125c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)      return DIRECTORY_UP;
126c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    }
127c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  }
128c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
129c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  // The dots are followed by something else, not a directory.
130c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  *consumed_len = 0;
131c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  return NOT_A_DIRECTORY;
132c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)}
133c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
134c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// Rewinds the output to the previous slash. It is assumed that the output
135c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// ends with a slash and this doesn't count (we call this when we are
136c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// appending directory paths, so the previous path component has and ending
137c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// slash).
138c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)//
139c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// This will stop at the first slash (assumed to be at position
140c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// |path_begin_in_output| and not go any higher than that. Some web pages
141c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// do ".." too many times, so we need to handle that brokenness.
142c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)//
143c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// It searches for a literal slash rather than including a backslash as well
144c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// because it is run only on the canonical output.
145c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)//
146c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// The output is guaranteed to end in a slash when this function completes.
147c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)void BackUpToPreviousSlash(int path_begin_in_output,
148c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                           CanonOutput* output) {
149c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  DCHECK(output->length() > 0);
150c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
151c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  int i = output->length() - 1;
152c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  DCHECK(output->at(i) == '/');
153c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  if (i == path_begin_in_output)
154c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    return;  // We're at the first slash, nothing to do.
155c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
156c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  // Now back up (skipping the trailing slash) until we find another slash.
157c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  i--;
158c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  while (output->at(i) != '/' && i > path_begin_in_output)
159c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    i--;
160c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
161c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  // Now shrink the output to just include that last slash we found.
162c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  output->set_length(i + 1);
163c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)}
164c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
165c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// Appends the given path to the output. It assumes that if the input path
166c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// starts with a slash, it should be copied to the output. If no path has
167c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// already been appended to the output (the case when not resolving
168c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// relative URLs), the path should begin with a slash.
169c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)//
170c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// If there are already path components (this mode is used when appending
171c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// relative paths for resolving), it assumes that the output already has
172c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// a trailing slash and that if the input begins with a slash, it should be
173c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// copied to the output.
174c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)//
175c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// We do not collapse multiple slashes in a row to a single slash. It seems
176c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// no web browsers do this, and we don't want incompababilities, even though
177c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)// it would be correct for most systems.
178c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)template<typename CHAR, typename UCHAR>
179c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)bool DoPartialPath(const CHAR* spec,
1800529e5d033099cbfc42635f6f6183833b09dff6eBen Murdoch                   const Component& path,
181c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                   int path_begin_in_output,
182c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                   CanonOutput* output) {
183c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  int end = path.end();
184c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
185c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  bool success = true;
186c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  for (int i = path.begin; i < end; i++) {
187c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    UCHAR uch = static_cast<UCHAR>(spec[i]);
188c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    if (sizeof(CHAR) > sizeof(char) && uch >= 0x80) {
189c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)      // We only need to test wide input for having non-ASCII characters. For
190c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)      // narrow input, we'll always just use the lookup table. We don't try to
191c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)      // do anything tricky with decoding/validating UTF-8. This function will
192c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)      // read one or two UTF-16 characters and append the output as UTF-8. This
193c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)      // call will be removed in 8-bit mode.
194c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)      success &= AppendUTF8EscapedChar(spec, &i, end, output);
195c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    } else {
196c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)      // Normal ASCII character or 8-bit input, use the lookup table.
197c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)      unsigned char out_ch = static_cast<unsigned char>(uch);
198c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)      unsigned char flags = kPathCharLookup[out_ch];
199c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)      if (flags & SPECIAL) {
200c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)        // Needs special handling of some sort.
201c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)        int dotlen;
202c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)        if ((dotlen = IsDot(spec, i, end)) > 0) {
203c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          // See if this dot was preceeded by a slash in the output. We
204c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          // assume that when canonicalizing paths, they will always
205c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          // start with a slash and not a dot, so we don't have to
206c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          // bounds check the output.
207c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          //
208c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          // Note that we check this in the case of dots so we don't have to
209c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          // special case slashes. Since slashes are much more common than
210c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          // dots, this actually increases performance measurably (though
211c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          // slightly).
212c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          DCHECK(output->length() > path_begin_in_output);
213c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          if (output->length() > path_begin_in_output &&
214c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)              output->at(output->length() - 1) == '/') {
215c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            // Slash followed by a dot, check to see if this is means relative
216c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            int consumed_len;
217c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            switch (ClassifyAfterDot<CHAR>(spec, i + dotlen, end,
218c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                                           &consumed_len)) {
219c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)              case NOT_A_DIRECTORY:
220c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                // Copy the dot to the output, it means nothing special.
221c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                output->push_back('.');
222c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                i += dotlen - 1;
223c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                break;
224c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)              case DIRECTORY_CUR:  // Current directory, just skip the input.
225c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                i += dotlen + consumed_len - 1;
226c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                break;
227c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)              case DIRECTORY_UP:
228c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                BackUpToPreviousSlash(path_begin_in_output, output);
229c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                i += dotlen + consumed_len - 1;
230c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                break;
231c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            }
232c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          } else {
233c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            // This dot is not preceeded by a slash, it is just part of some
234c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            // file name.
235c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            output->push_back('.');
236c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            i += dotlen - 1;
237c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          }
238c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
239c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)        } else if (out_ch == '\\') {
240c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          // Convert backslashes to forward slashes
241c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          output->push_back('/');
242c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
243c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)        } else if (out_ch == '%') {
244c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          // Handle escape sequences.
245c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          unsigned char unescaped_value;
246c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          if (DecodeEscaped(spec, &i, end, &unescaped_value)) {
247c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            // Valid escape sequence, see if we keep, reject, or unescape it.
248c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            char unescaped_flags = kPathCharLookup[unescaped_value];
249c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
250c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            if (unescaped_flags & UNESCAPE) {
251c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)              // This escaped value shouldn't be escaped, copy it.
252c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)              output->push_back(unescaped_value);
253c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            } else if (unescaped_flags & INVALID_BIT) {
254c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)              // Invalid escaped character, copy it and remember the error.
255c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)              output->push_back('%');
256c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)              output->push_back(static_cast<char>(spec[i - 1]));
257c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)              output->push_back(static_cast<char>(spec[i]));
258c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)              success = false;
259c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            } else {
260c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)              // Valid escaped character but we should keep it escaped. We
261c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)              // don't want to change the case of any hex letters in case
262c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)              // the server is sensitive to that, so we just copy the two
263c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)              // characters without checking (DecodeEscape will have advanced
264c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)              // to the last character of the pair).
265c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)              output->push_back('%');
266c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)              output->push_back(static_cast<char>(spec[i - 1]));
267c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)              output->push_back(static_cast<char>(spec[i]));
268c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            }
269c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          } else {
270c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            // Invalid escape sequence. IE7 rejects any URLs with such
271c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            // sequences, while Firefox, IE6, and Safari all pass it through
272c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            // unchanged. We are more permissive unlike IE7. I don't think this
273c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            // can cause significant problems, if it does, we should change
274c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            // to be more like IE7.
275c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            output->push_back('%');
276c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          }
277c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
278c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)        } else if (flags & INVALID_BIT) {
279c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          // For NULLs, etc. fail.
280c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          AppendEscapedChar(out_ch, output);
281c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          success = false;
282c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
283c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)        } else if (flags & ESCAPE_BIT) {
284c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          // This character should be escaped.
285c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)          AppendEscapedChar(out_ch, output);
286c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)        }
287c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)      } else {
288c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)        // Nothing special about this character, just append it.
289c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)        output->push_back(out_ch);
290c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)      }
291c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    }
292c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  }
293c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  return success;
294c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)}
295c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
296c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)template<typename CHAR, typename UCHAR>
297c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)bool DoPath(const CHAR* spec,
2980529e5d033099cbfc42635f6f6183833b09dff6eBen Murdoch            const Component& path,
299c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)            CanonOutput* output,
3000529e5d033099cbfc42635f6f6183833b09dff6eBen Murdoch            Component* out_path) {
301c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  bool success = true;
302c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  out_path->begin = output->length();
303c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  if (path.len > 0) {
304c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    // Write out an initial slash if the input has none. If we just parse a URL
305c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    // and then canonicalize it, it will of course have a slash already. This
306c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    // check is for the replacement and relative URL resolving cases of file
307c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    // URLs.
3080529e5d033099cbfc42635f6f6183833b09dff6eBen Murdoch    if (!IsURLSlash(spec[path.begin]))
309c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)      output->push_back('/');
310c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
311c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    success = DoPartialPath<CHAR, UCHAR>(spec, path, out_path->begin, output);
312c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  } else {
313c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    // No input, canonical path is a slash.
314c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)    output->push_back('/');
315c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  }
316c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  out_path->len = output->length() - out_path->begin;
317c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  return success;
318c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)}
319c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
320c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)}  // namespace
321c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
322c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)bool CanonicalizePath(const char* spec,
3230529e5d033099cbfc42635f6f6183833b09dff6eBen Murdoch                      const Component& path,
324c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                      CanonOutput* output,
3250529e5d033099cbfc42635f6f6183833b09dff6eBen Murdoch                      Component* out_path) {
326c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  return DoPath<char, unsigned char>(spec, path, output, out_path);
327c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)}
328c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
3297d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)bool CanonicalizePath(const base::char16* spec,
3300529e5d033099cbfc42635f6f6183833b09dff6eBen Murdoch                      const Component& path,
331c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                      CanonOutput* output,
3320529e5d033099cbfc42635f6f6183833b09dff6eBen Murdoch                      Component* out_path) {
3337d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)  return DoPath<base::char16, base::char16>(spec, path, output, out_path);
334c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)}
335c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
336c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)bool CanonicalizePartialPath(const char* spec,
3370529e5d033099cbfc42635f6f6183833b09dff6eBen Murdoch                             const Component& path,
338c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                             int path_begin_in_output,
339c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                             CanonOutput* output) {
340c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)  return DoPartialPath<char, unsigned char>(spec, path, path_begin_in_output,
341c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                                            output);
342c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)}
343c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
3447d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)bool CanonicalizePartialPath(const base::char16* spec,
3450529e5d033099cbfc42635f6f6183833b09dff6eBen Murdoch                             const Component& path,
346c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                             int path_begin_in_output,
347c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)                             CanonOutput* output) {
3487d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)  return DoPartialPath<base::char16, base::char16>(spec, path,
3497d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)                                                   path_begin_in_output,
3507d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)                                                   output);
351c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)}
352c2e0dbddbe15c98d52c4786dac06cb8952a8ae6dTorne (Richard Coles)
3530529e5d033099cbfc42635f6f6183833b09dff6eBen Murdoch}  // namespace url
354