// Copyright (c) 2010 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#include "net/tools/dump_cache/url_utilities.h"
#include "base/logging.h"
#include "base/strings/string_number_conversions.h"
#include "base/strings/string_util.h"
namespace net {
// Returns the host portion of |url|, without scheme, port, path, query or
// fragment. A leading "scheme://" (or bare "//") is skipped when present, so
// both "http://www.foo.com:8080/boo" and "www.foo.com:8080/boo" yield
// "www.foo.com".
//
// Known limitations: userinfo ("user:pass@host") and bracketed IPv6 literals
// ("[::1]") are not recognised; the host is simply cut at the first ':'.
std::string UrlUtilities::GetUrlHost(const std::string& url) {
  // The "//" authority marker only counts when it is the first slash of the
  // URL and comes before any query or fragment. A "//" that appears later
  // (in the path of a scheme-less URL, or inside a query string) is data and
  // must not be mistaken for the start of the host.
  size_t host_begin = 0;
  const size_t first_delim = url.find_first_of("/?#");
  if (first_delim != std::string::npos &&
      url.compare(first_delim, 2, "//") == 0) {
    host_begin = first_delim + 2;
  }

  // The host ends at the port separator or at whichever of the path, query
  // or fragment starts first; with none of them it runs to the end of |url|.
  size_t host_end = url.find_first_of(":/?#", host_begin);
  if (host_end == std::string::npos)
    host_end = url.size();
  return std::string(url, host_begin, host_end - host_begin);
}
// Returns |url| with a leading "scheme://" (or bare "//") removed, i.e. the
// host followed by everything after it. For example,
// "http://www.foo.com/path" yields "www.foo.com/path". A URL that has no such
// prefix is returned unchanged.
std::string UrlUtilities::GetUrlHostPath(const std::string& url) {
  // Only a "//" that is the first slash of the URL and precedes any query or
  // fragment marks the start of the host; a later "//" belongs to the path or
  // query and must be left alone.
  const size_t first_delim = url.find_first_of("/?#");
  if (first_delim == std::string::npos ||
      url.compare(first_delim, 2, "//") != 0) {
    return url;
  }
  return std::string(url, first_delim + 2);
}
// Returns the path of |url|, starting at the first '/' after the host. Any
// query string following the path is kept, but the fragment ("#...") is
// dropped. For example, "http://www.foo.com/path?q=1#top" yields "/path?q=1".
// Returns "/" when |url| has no path.
std::string UrlUtilities::GetUrlPath(const std::string& url) {
  // Skip a leading "scheme://" (or bare "//"). The marker only counts when it
  // is the first slash of the URL and precedes any query or fragment.
  size_t authority_begin = 0;
  const size_t first_delim = url.find_first_of("/?#");
  if (first_delim != std::string::npos &&
      url.compare(first_delim, 2, "//") == 0) {
    authority_begin = first_delim + 2;
  }

  // The path begins at the first '/' after the host. If a query or fragment
  // starts before any such '/', the URL has no path: a '/' found further on
  // would belong to that query or fragment, not to the path.
  const size_t path_begin = url.find_first_of("/?#", authority_begin);
  if (path_begin == std::string::npos || url[path_begin] != '/')
    return "/";

  // Cut the fragment off, if there is one.
  const size_t fragment_begin = url.find('#', path_begin + 1);
  if (fragment_begin == std::string::npos)
    return std::string(url, path_begin);
  return std::string(url, path_begin, fragment_begin - path_begin);
}
namespace {
// States of the character-by-character parser in UrlUtilities::Unescape.
// They record how much of a "%XY" escape sequence has been consumed so far.
enum UnescapeState {
NORMAL, // Not inside an escape sequence; characters are copied through.
ESCAPE1, // A '%' has been read; the first hex digit is expected next.
ESCAPE2 // A '%' and one hex digit have been read; the second is expected.
};
} // namespace
// Decodes the percent-escapes in |escaped_url|. Every "%XY" in which X and Y
// are both hex digits is replaced by the single character whose value those
// two digits encode (as parsed by base::HexStringToInt). A '%' that is not
// followed by two hex digits, including one cut short by the end of the
// string, is copied to the output literally along with the text after it.
std::string UrlUtilities::Unescape(const std::string& escaped_url) {
  std::string result;
  std::string pending_digits;  // Hex digits read since the most recent '%'.
  UnescapeState state = NORMAL;

  for (size_t i = 0; i < escaped_url.size(); ++i) {
    const char current = escaped_url[i];

    // A non-hex character ends an unfinished escape: emit what was consumed
    // exactly as it was read, then treat |current| as ordinary input below.
    if (state != NORMAL && !IsHexDigit(current)) {
      result.push_back('%');
      result.append(pending_digits);
      state = NORMAL;
    }

    if (state == NORMAL) {
      if (current == '%') {
        pending_digits.clear();
        state = ESCAPE1;
      } else {
        result.push_back(current);
      }
    } else if (state == ESCAPE1) {
      // First hex digit of the escape.
      pending_digits.push_back(current);
      state = ESCAPE2;
    } else {
      // Second hex digit: the escape is complete, so convert it.
      pending_digits.push_back(current);
      int byte_value;
      bool ok = base::HexStringToInt(pending_digits, &byte_value);
      DCHECK(ok);
      result.push_back(static_cast<unsigned char>(byte_value));
      state = NORMAL;
    }
  }

  // The input ended in the middle of an escape; pass the partial text through.
  if (state != NORMAL) {
    result.push_back('%');
    result.append(pending_digits);
  }
  return result;
}
} // namespace net