/*
 * Copyright 2003-2017 The Music Player Daemon Project
 * http://www.musicpd.org
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
 */

#include "UriUtil.hxx"
#include "StringCompare.hxx"
#include "CharUtil.hxx"

#include <assert.h>
#include <string.h>

/**
 * Is the given character acceptable as the first character of a URI
 * scheme?  The decision is delegated entirely to
 * IsLowerAlphaASCII().
 */
static constexpr bool
IsValidSchemeStart(char ch)
{
	return IsLowerAlphaASCII(ch);
}

/**
 * Is the given character acceptable inside a URI scheme (at any
 * position after the first one)?  Accepted are the punctuation
 * characters '+', '.' and '-' plus everything for which
 * IsLowerAlphaASCII() or IsDigitASCII() returns true.
 */
static constexpr bool
IsValidSchemeChar(char ch)
{
	return ch == '+' || ch == '-' || ch == '.' ||
		IsDigitASCII(ch) || IsLowerAlphaASCII(ch);
}

/**
 * Checks whether the given string is a syntactically valid URI
 * scheme: it must not be empty, its first character must satisfy
 * IsValidSchemeStart() and every following character must satisfy
 * IsValidSchemeChar().
 */
gcc_pure
static bool
IsValidScheme(StringView p)
{
	if (p.IsEmpty())
		return false;

	if (!IsValidSchemeStart(p.front()))
		return false;

	/* the first character has been checked above; now walk over
	   the remaining ones */
	size_t position = 1;
	while (position < p.size) {
		if (!IsValidSchemeChar(p[position]))
			return false;

		++position;
	}

	return true;
}

/**
 * Return the URI part after the scheme specification (and after the
 * double slash).
 *
 * A string starting with exactly two slashes (not three) is accepted
 * without a scheme; in that case, the pointer after those two
 * slashes is returned.
 *
 * @return a pointer into #uri, or nullptr if there is no valid
 * scheme followed by "://"
 */
gcc_pure
static const char *
uri_after_scheme(const char *uri)
{
	if (uri[0] == '/' && uri[1] == '/' && uri[2] != '/')
		return uri + 2;

	const char *const colon = strchr(uri, ':');
	if (colon == nullptr)
		/* no colon at all, thus no scheme */
		return nullptr;

	if (!IsValidScheme({uri, colon}))
		/* the text before the colon is not a scheme */
		return nullptr;

	if (colon[1] != '/' || colon[2] != '/')
		/* the colon is not followed by a double slash */
		return nullptr;

	return colon + 3;
}

/**
 * Checks whether the given string contains the sequence "://"
 * anywhere.  The text in front of that sequence is not validated.
 *
 * @param uri a null-terminated string
 * @return true if "://" occurs in #uri
 */
bool uri_has_scheme(const char *uri)
{
	return strstr(uri, "://") != nullptr;
}

/**
 * Returns the part of the given string in front of the first "://".
 *
 * @param uri a null-terminated string
 * @return a copy of everything before the first "://", or an empty
 * string if #uri does not contain "://"
 */
std::string
uri_get_scheme(const char *uri)
{
	const char *const separator = strstr(uri, "://");
	if (separator == nullptr)
		/* no scheme separator found */
		return std::string();

	return std::string(uri, separator);
}

const char *
uri_get_path(const char *uri)
{
	const char *ap = uri_after_scheme(uri);
	if (ap != nullptr)
		return strchr(ap, '/');

	return uri;
}

/**
 * Returns the file name suffix of the given URI, i.e. the text after
 * its last dot.  Suffixes should consist of ASCII characters only.
 *
 * @param uri a null-terminated string
 * @return a pointer into #uri just after the last dot; nullptr if
 * there is no dot, if the last dot is the first character of the
 * string or directly follows a slash or backslash, or if a slash or
 * backslash follows the last dot
 */
const char *
uri_get_suffix(const char *uri)
{
	const char *suffix = strrchr(uri, '.');
	if (suffix == nullptr || suffix == uri ||
	    suffix[-1] == '/' || suffix[-1] == '\\')
		/* no dot, or the dot starts the string or a path
		   segment */
		return nullptr;

	/* skip the dot */
	++suffix;

	if (strpbrk(suffix, "/\\") != nullptr)
		/* the last dot is not in the last path segment */
		return nullptr;

	return suffix;
}

/**
 * Like uri_get_suffix(const char *), but strips a query string
 * (everything from the first '?' on) from the suffix by copying the
 * suffix into the given buffer.
 *
 * @param buffer receives the null-terminated suffix if a query
 * string had to be cut off
 * @return nullptr if there is no suffix; a pointer into the buffer
 * if a query string was cut off; otherwise a pointer into #uri (this
 * includes the case where the suffix in front of the '?' does not
 * fit into the buffer)
 */
const char *
uri_get_suffix(const char *uri, UriSuffixBuffer &buffer)
{
	const char *const raw = uri_get_suffix(uri);
	if (raw == nullptr)
		return nullptr;

	const char *const query = strchr(raw, '?');
	if (query == nullptr)
		/* no query string: nothing to strip */
		return raw;

	const size_t length = query - raw;
	if (length >= sizeof(buffer.data))
		/* no room for the suffix plus the null terminator;
		   leave the suffix as it is */
		return raw;

	memcpy(buffer.data, raw, length);
	buffer.data[length] = 0;
	return buffer.data;
}

/**
 * Verifies the first segment (the text up to the next slash) of a
 * local URI.
 *
 * @param p the start of the segment (null-terminated string)
 * @return nullptr if the segment is empty or consists of just one or
 * two dots ("." or ".."); otherwise a pointer to the slash which
 * terminates the segment, or a pointer to an empty string if this
 * was the last segment
 */
static const char *
verify_uri_segment(const char *p)
{
	unsigned dots = 0;
	while (*p == '.') {
		++p;
		++dots;
	}

	if (dots <= 2 && (*p == 0 || *p == '/'))
		return nullptr;

	/* search from p, not from p+1: if the segment consists of
	   three or more dots, p already points at the terminating
	   slash or at the null terminator; skipping one more
	   character would either miss that slash (leaving the
	   following segments unverified) or read past the end of
	   the string */
	const char *q = strchr(p, '/');
	return q != nullptr ? q : "";
}

/**
 * Checks whether every slash-separated segment of the given local
 * URI is accepted by verify_uri_segment().
 *
 * @param uri a null-terminated string
 * @return false as soon as verify_uri_segment() rejects a segment,
 * true if the end of the string was reached without a rejection
 */
bool
uri_safe_local(const char *uri)
{
	while (true) {
		uri = verify_uri_segment(uri);
		if (uri == nullptr)
			return false;

		if (*uri == 0)
			/* that was the last segment */
			return true;

		assert(*uri == '/');

		/* skip the slash and continue with the next
		   segment */
		++uri;
	}
}

/**
 * Tries the prefixes "http://", "https://" and "ftp://" (in this
 * order) on the given URI using StringAfterPrefix().
 *
 * @return the first non-null result of StringAfterPrefix()
 * (presumably the part of #uri after the matching prefix), or
 * nullptr if none of the prefixes matched
 */
gcc_pure
static const char *
SkipUriScheme(const char *uri)
{
	const char *const schemes[] = { "http://", "https://", "ftp://" };
	for (auto scheme : schemes) {
		auto result = StringAfterPrefix(uri, scheme);
		if (result != nullptr)
			return result;
	}

	return nullptr;
}

/**
 * Removes the authentication information (everything up to and
 * including the first '@' in front of the first slash after the
 * scheme) from the given URI.
 *
 * @param uri a null-terminated string
 * @return a copy of #uri without the authentication information; an
 * empty string if SkipUriScheme() does not recognize the scheme or
 * if there is no '@' in the part between the scheme and the first
 * slash
 */
std::string
uri_remove_auth(const char *uri)
{
	const char *auth = SkipUriScheme(uri);
	if (auth == nullptr)
		/* unrecognized URI */
		return std::string();

	/* the '@' is searched only up to the first slash (or up to
	   the end of the string if there is no slash) */
	const char *slash = strchr(auth, '/');
	if (slash == nullptr)
		slash = auth + strlen(auth);

	const char *at = static_cast<const char *>(memchr(auth, '@',
							    slash - auth));
	if (at == nullptr)
		/* no auth info present, do nothing */
		return std::string();

	/* duplicate the full URI and then delete the auth
	   information */
	std::string result(uri);
	result.erase(auth - uri, at + 1 - auth);
	return result;
}

/**
 * Checks whether #child is located below #parent, i.e. whether
 * #child starts with #parent and a slash follows immediately after
 * that prefix.
 *
 * @param parent a null-terminated string (must not be nullptr)
 * @param child a null-terminated string (must not be nullptr)
 * @return true if #child begins with #parent followed by a slash
 */
bool
uri_is_child(const char *parent, const char *child)
{
#if !CLANG_CHECK_VERSION(3,6)
	/* disabled on clang due to -Wtautological-pointer-compare */
	assert(parent != nullptr);
	assert(child != nullptr);
#endif

	const size_t parent_length = strlen(parent);

	/* strncmp() instead of memcmp(): it stops at the null
	   terminator of a child which is shorter than the parent,
	   while memcmp() is allowed to read all parent_length bytes
	   and thus past the end of the child string */
	return strncmp(parent, child, parent_length) == 0 &&
		child[parent_length] == '/';
}


/**
 * Checks whether the two strings are equal or whether
 * uri_is_child() considers #child a child of #parent.
 */
bool
uri_is_child_or_same(const char *parent, const char *child)
{
	if (strcmp(parent, child) == 0)
		/* same URI */
		return true;

	return uri_is_child(parent, child);
}

/**
 * Translates the given URI, which may be relative, to an absolute
 * URI using the given base.
 *
 * @param uri the URI to be resolved; a leading slash marks an
 * absolute path which replaces the whole path of #base
 * @param base the base URI
 * @return if #uri starts with a slash: #uri itself if #base contains
 * no "://", else everything of #base up to the first slash after
 * "://" followed by #uri; otherwise #base and #uri joined with
 * exactly one slash inserted if #base does not already end with
 * one.  An empty #base leaves a relative #uri unchanged.
 */
std::string
uri_apply_base(const std::string &uri, const std::string &base)
{
	/* front() must not be called on an empty string */
	if (!uri.empty() && uri.front() == '/') {
		/* absolute path: replace the whole URI path in base */

		auto i = base.find("://");
		if (i == base.npos)
			/* no scheme: override base completely */
			return uri;

		/* find the first slash after the host part */
		i = base.find('/', i + 3);
		if (i == base.npos)
			/* there's no URI path - simply append uri */
			i = base.length();

		return base.substr(0, i) + uri;
	}

	std::string out(base);

	/* back() must not be called on an empty string; with an
	   empty base, no slash is inserted so that a relative URI
	   does not turn into an absolute path */
	if (!out.empty() && out.back() != '/')
		out.push_back('/');

	out += uri;
	return out;
}