UriExtract.cxx 3.91 KB
Newer Older
Max Kellermann's avatar
Max Kellermann committed
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50
/*
 * Copyright 2008-2019 Max Kellermann <max.kellermann@gmail.com>
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 *
 * - Redistributions of source code must retain the above copyright
 * notice, this list of conditions and the following disclaimer.
 *
 * - Redistributions in binary form must reproduce the above copyright
 * notice, this list of conditions and the following disclaimer in the
 * documentation and/or other materials provided with the
 * distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
 * FOR A PARTICULAR PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE
 * FOUNDATION OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
 * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
 * OF THE POSSIBILITY OF SUCH DAMAGE.
 */

#include "UriExtract.hxx"
#include "CharUtil.hxx"
#include "StringView.hxx"

#include <string.h>

static constexpr bool
IsValidSchemeStart(char ch)
{
	return IsLowerAlphaASCII(ch);
}

static constexpr bool
IsValidSchemeChar(char ch)
{
	return IsLowerAlphaASCII(ch) || IsDigitASCII(ch) ||
		ch == '+' || ch == '.' || ch == '-';
}

gcc_pure
static bool
51
IsValidScheme(std::string_view p) noexcept
Max Kellermann's avatar
Max Kellermann committed
52 53 54 55
{
	if (p.empty() || !IsValidSchemeStart(p.front()))
		return false;

56
	for (size_t i = 1; i < p.size(); ++i)
Max Kellermann's avatar
Max Kellermann committed
57 58 59 60 61 62 63 64 65 66 67
		if (!IsValidSchemeChar(p[i]))
			return false;

	return true;
}

/**
 * Return the URI part after the scheme specification (and after the
 * double slash).
 */
gcc_pure
68 69
static std::string_view
uri_after_scheme(std::string_view uri) noexcept
Max Kellermann's avatar
Max Kellermann committed
70
{
71 72 73 74 75 76 77 78 79 80 81 82 83 84
	if (uri.length() > 2 &&
	    uri[0] == '/' && uri[1] == '/' && uri[2] != '/')
		return uri.substr(2);

	auto colon = uri.find(':');
	if (colon == std::string_view::npos ||
	    !IsValidScheme(uri.substr(0, colon)))
		return {};

	uri = uri.substr(colon + 1);
	if (uri[0] != '/' || uri[1] != '/')
		return {};

	return uri.substr(2);
Max Kellermann's avatar
Max Kellermann committed
85 86 87
}

bool
88
uri_has_scheme(std::string_view uri) noexcept
Max Kellermann's avatar
Max Kellermann committed
89
{
90
	return !uri_get_scheme(uri).empty();
Max Kellermann's avatar
Max Kellermann committed
91 92
}

93 94
std::string_view
uri_get_scheme(std::string_view uri) noexcept
Max Kellermann's avatar
Max Kellermann committed
95
{
96 97 98
	auto end = uri.find("://");
	if (end == std::string_view::npos)
		return {};
Max Kellermann's avatar
Max Kellermann committed
99

100
	return uri.substr(0, end);
Max Kellermann's avatar
Max Kellermann committed
101 102
}

103 104 105 106 107 108
bool
uri_is_relative_path(const char *uri) noexcept
{
	return !uri_has_scheme(uri) && *uri != '/';
}

109 110
std::string_view
uri_get_path(std::string_view uri) noexcept
Max Kellermann's avatar
Max Kellermann committed
111
{
112 113 114 115 116 117 118
	auto ap = uri_after_scheme(uri);
	if (ap.data() != nullptr) {
		auto slash = ap.find('/');
		if (slash == std::string_view::npos)
			return {};
		return ap.substr(slash);
	}
Max Kellermann's avatar
Max Kellermann committed
119 120 121 122 123 124 125 126

	return uri;
}

/* suffixes should be ascii only characters */
const char *
uri_get_suffix(const char *uri) noexcept
{
Rosen Penev's avatar
Rosen Penev committed
127
	const char *suffix = std::strrchr(uri, '.');
Max Kellermann's avatar
Max Kellermann committed
128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146
	if (suffix == nullptr || suffix == uri ||
	    suffix[-1] == '/' || suffix[-1] == '\\')
		return nullptr;

	++suffix;

	if (strpbrk(suffix, "/\\") != nullptr)
		return nullptr;

	return suffix;
}

const char *
uri_get_suffix(const char *uri, UriSuffixBuffer &buffer) noexcept
{
	const char *suffix = uri_get_suffix(uri);
	if (suffix == nullptr)
		return nullptr;

Rosen Penev's avatar
Rosen Penev committed
147
	const char *q = std::strchr(suffix, '?');
Max Kellermann's avatar
Max Kellermann committed
148 149 150 151 152 153 154 155
	if (q != nullptr && size_t(q - suffix) < sizeof(buffer.data)) {
		memcpy(buffer.data, suffix, q - suffix);
		buffer.data[q - suffix] = 0;
		suffix = buffer.data;
	}

	return suffix;
}
156 157 158 159

const char *
uri_get_fragment(const char *uri) noexcept
{
Rosen Penev's avatar
Rosen Penev committed
160
	const char *fragment = std::strchr(uri, '#');
161 162 163 164 165
	if (fragment == nullptr)
		return nullptr;

	return fragment + 1;
}