/*
 * Copyright 2003-2018 The Music Player Daemon Project
 * http://www.musicpd.org
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
 */

Max Kellermann's avatar
Max Kellermann committed
20
#include "UriUtil.hxx"
21
#include "ASCII.hxx"
22
#include "CharUtil.hxx"
23

24
#include <assert.h>
25 26
#include <string.h>

27 28 29 30 31 32 33 34 35 36 37 38 39 40 41
/**
 * Is this character allowed as the first character of a URI scheme?
 *
 * Delegates to IsLowerAlphaASCII(), i.e. (presumably) only the
 * letters 'a'..'z' are accepted; upper-case letters are not.
 */
static constexpr bool
IsValidSchemeStart(char ch)
{
	return IsLowerAlphaASCII(ch);
}

/**
 * Is this character allowed inside a URI scheme (at any position
 * after the first one)?
 *
 * Accepted are the punctuation characters '+', '-' and '.', plus
 * everything accepted by IsDigitASCII() or IsLowerAlphaASCII().
 */
static constexpr bool
IsValidSchemeChar(char ch)
{
	/* kept as a single return expression so the function remains
	   a valid C++11 constexpr function */
	return ch == '+' || ch == '-' || ch == '.' ||
		IsDigitASCII(ch) || IsLowerAlphaASCII(ch);
}

/**
 * Check whether the given string is a syntactically valid URI
 * scheme: it must not be empty, its first character must satisfy
 * IsValidSchemeStart() and all following characters must satisfy
 * IsValidSchemeChar().
 */
gcc_pure
static bool
IsValidScheme(StringView p) noexcept
{
	if (p.empty())
		return false;

	if (!IsValidSchemeStart(p.front()))
		return false;

	/* the first character has been checked above; verify the
	   remaining ones */
	size_t pos = 1;
	while (pos < p.size) {
		if (!IsValidSchemeChar(p[pos]))
			return false;

		++pos;
	}

	return true;
}

/**
 * Return the URI part after the scheme specification (and after the
 * double slash).
 *
 * A string starting with exactly two slashes (not three) is accepted
 * without a scheme; the pointer after those two slashes is returned.
 * Otherwise, everything before the first colon must be a valid
 * scheme and the colon must be followed by two slashes.
 *
 * @return a pointer into #uri after the "//", or nullptr if #uri
 * does not have that form
 */
gcc_pure
static const char *
uri_after_scheme(const char *uri) noexcept
{
	/* the short-circuit evaluation guarantees that no byte after
	   the null terminator is read */
	if (uri[0] == '/' && uri[1] == '/' && uri[2] != '/')
		return uri + 2;

	const char *colon = strchr(uri, ':');
	if (colon == nullptr)
		return nullptr;

	if (!IsValidScheme({uri, colon}))
		return nullptr;

	if (colon[1] != '/' || colon[2] != '/')
		return nullptr;

	return colon + 3;
}

73 74
/**
 * Does the given string contain the scheme separator "://"?
 *
 * Note that this only looks for the separator anywhere in the
 * string; the part before it is not validated.
 */
bool
uri_has_scheme(const char *uri) noexcept
{
	const char *separator = strstr(uri, "://");
	return separator != nullptr;
}

79
/**
 * Return everything before the first "://" in the given string.
 *
 * @return the scheme, or an empty string if there is no "://"
 */
std::string
uri_get_scheme(const char *uri) noexcept
{
	const char *separator = strstr(uri, "://");
	if (separator == nullptr)
		/* no scheme separator at all */
		return std::string();

	return std::string(uri, size_t(separator - uri));
}

89
const char *
90
uri_get_path(const char *uri) noexcept
91 92 93 94 95 96 97 98
{
	const char *ap = uri_after_scheme(uri);
	if (ap != nullptr)
		return strchr(ap, '/');

	return uri;
}

99 100
/**
 * Return the file name suffix of the given URI, i.e. the text after
 * the last dot.  Suffixes should be ASCII only characters.
 *
 * @return a pointer into #uri after the last dot, or nullptr if
 * there is no dot, if the dot is the first character of the string
 * or of a path segment (directly preceded by a slash or backslash),
 * or if a slash or backslash follows the dot
 */
const char *
uri_get_suffix(const char *uri) noexcept
{
	const char *dot = strrchr(uri, '.');
	if (dot == nullptr)
		return nullptr;

	/* a leading dot does not start a suffix */
	if (dot == uri)
		return nullptr;

	const char before = dot[-1];
	if (before == '/' || before == '\\')
		return nullptr;

	const char *ext = dot + 1;

	/* the last dot belongs to a directory name, not to the last
	   path segment */
	return strpbrk(ext, "/\\") == nullptr
		? ext
		: nullptr;
}
115

116
const char *
117
uri_get_suffix(const char *uri, UriSuffixBuffer &buffer) noexcept
118 119 120 121 122 123 124 125 126 127 128 129 130 131 132
{
	const char *suffix = uri_get_suffix(uri);
	if (suffix == nullptr)
		return nullptr;

	const char *q = strchr(suffix, '?');
	if (q != nullptr && size_t(q - suffix) < sizeof(buffer.data)) {
		memcpy(buffer.data, suffix, q - suffix);
		buffer.data[q - suffix] = 0;
		suffix = buffer.data;
	}

	return suffix;
}

133
/**
 * Verify the first path segment of the given string.
 *
 * A segment is rejected if it is empty, "." or "..".
 *
 * @param p the start of the segment
 * @return nullptr if the segment is rejected; otherwise a pointer to
 * the slash which terminates this segment, or a pointer to an empty
 * string if this was the last segment
 */
static const char *
verify_uri_segment(const char *p) noexcept
{
	/* count (and skip) leading dots */
	unsigned dots = 0;
	while (*p == '.') {
		++p;
		++dots;
	}

	/* nothing (or only one or two dots) before the end of the
	   segment: empty, "." or ".." */
	if (dots <= 2 && (*p == 0 || *p == '/'))
		return nullptr;

	/* search from p itself, not from p+1: if the segment consists
	   of three or more dots, p already points to the terminating
	   slash or null byte; skipping it would read past the end of
	   the string or leave the following segment unverified */
	const char *q = strchr(p, '/');
	return q != nullptr ? q : "";
}

bool
150
uri_safe_local(const char *uri) noexcept
151 152 153
{
	while (true) {
		uri = verify_uri_segment(uri);
Max Kellermann's avatar
Max Kellermann committed
154
		if (uri == nullptr)
155 156 157 158 159 160 161 162 163 164 165
			return false;

		if (*uri == 0)
			return true;

		assert(*uri == '/');

		++uri;
	}
}

166 167
/**
 * If the given URI starts with one of the prefixes "http://",
 * "https://" or "ftp://" (matched with StringAfterPrefixCaseASCII(),
 * presumably ignoring ASCII case), return the part after that
 * prefix.
 *
 * @return the result of the first matching prefix, or nullptr if
 * none of the prefixes matches
 */
gcc_pure
static const char *
SkipUriScheme(const char *uri) noexcept
{
	const char *const prefixes[] = { "http://", "https://", "ftp://" };
	const size_t n_prefixes = sizeof(prefixes) / sizeof(prefixes[0]);

	for (size_t i = 0; i < n_prefixes; ++i) {
		auto rest = StringAfterPrefixCaseASCII(uri, prefixes[i]);
		if (rest != nullptr)
			return rest;
	}

	return nullptr;
}

std::string
181
uri_remove_auth(const char *uri) noexcept
182 183 184
{
	const char *auth = SkipUriScheme(uri);
	if (auth == nullptr)
185
		/* unrecognized URI */
186
		return std::string();
187

188
	const char *slash = strchr(auth, '/');
Max Kellermann's avatar
Max Kellermann committed
189
	if (slash == nullptr)
190 191
		slash = auth + strlen(auth);

192
	const char *at = (const char *)memchr(auth, '@', slash - auth);
Max Kellermann's avatar
Max Kellermann committed
193
	if (at == nullptr)
194
		/* no auth info present, do nothing */
195
		return std::string();
196 197 198

	/* duplicate the full URI and then delete the auth
	   information */
199 200 201
	std::string result(uri);
	result.erase(auth - uri, at + 1 - auth);
	return result;
202
}
203 204

/**
 * Check whether #child is located below #parent, i.e. whether
 * #child starts with #parent, immediately followed by a slash.
 *
 * @param parent the parent URI (must not be nullptr)
 * @param child the URI to be checked (must not be nullptr)
 * @return true if #child is a (direct or indirect) child of
 * #parent; false otherwise, including when both are equal
 */
bool
uri_is_child(const char *parent, const char *child) noexcept
{
#if !CLANG_CHECK_VERSION(3,6)
	/* disabled on clang due to -Wtautological-pointer-compare */
	assert(parent != nullptr);
	assert(child != nullptr);
#endif

	const size_t parent_length = strlen(parent);

	/* strncmp() instead of memcmp(): it stops at the null
	   terminator of a child which is shorter than the parent
	   instead of reading beyond the end of that string; if it
	   reports equality, child is at least parent_length
	   characters long and child[parent_length] may be read */
	return strncmp(parent, child, parent_length) == 0 &&
		child[parent_length] == '/';
}


bool
220
uri_is_child_or_same(const char *parent, const char *child) noexcept
221 222 223
{
	return strcmp(parent, child) == 0 || uri_is_child(parent, child);
}
224 225

/**
 * Translate the given URI in the context of #base.
 *
 * If #uri is an absolute path (starts with a slash), it replaces the
 * path of #base, keeping only scheme and host of #base; if #base has
 * no scheme ("://"), #uri is returned unmodified.  Otherwise, #uri
 * is appended to #base, separated by exactly one slash.
 *
 * Empty strings are allowed: an empty #uri is treated as a relative
 * one, and an empty #base leaves a relative #uri unmodified.
 *
 * @param uri an absolute path or a relative URI
 * @param base the base URI
 * @return the combined URI
 */
std::string
uri_apply_base(const std::string &uri, const std::string &base) noexcept
{
	/* check empty() first: front() on an empty string is
	   undefined */
	if (!uri.empty() && uri.front() == '/') {
		/* absolute path: replace the whole URI path in base */

		auto i = base.find("://");
		if (i == base.npos)
			/* no scheme: override base completely */
			return uri;

		/* find the first slash after the host part */
		i = base.find('/', i + 3);
		if (i == base.npos)
			/* there's no URI path - simply append uri */
			i = base.length();

		return base.substr(0, i) + uri;
	}

	std::string out(base);

	/* check empty() first: back() on an empty string is
	   undefined; with an empty base, there is nothing to separate
	   the URI from */
	if (!out.empty() && out.back() != '/')
		out.push_back('/');

	out += uri;
	return out;
}