2 * URL utility functions
3 * Copyright (c) 2000, 2001, 2002 Fabrice Bellard
5 * This file is part of FFmpeg.
7 * FFmpeg is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2.1 of the License, or (at your option) any later version.
12 * FFmpeg is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Lesser General Public License for more details.
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with FFmpeg; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
30 #include "libavutil/avassert.h"
31 #include "libavutil/avstring.h"
35 * URL utility functions.
38 int ff_url_join(char *str, int size, const char *proto,
39 const char *authorization, const char *hostname,
40 int port, const char *fmt, ...)
43 struct addrinfo hints = { 0 }, *ai;
48 av_strlcatf(str, size, "%s://", proto);
49 if (authorization && authorization[0])
50 av_strlcatf(str, size, "%s@", authorization);
51 #if CONFIG_NETWORK && defined(AF_INET6)
52 /* Determine if hostname is a numerical IPv6 address,
53 * properly escape it within [] in that case. */
54 hints.ai_flags = AI_NUMERICHOST;
55 if (!getaddrinfo(hostname, NULL, &hints, &ai)) {
56 if (ai->ai_family == AF_INET6) {
57 av_strlcat(str, "[", size);
58 av_strlcat(str, hostname, size);
59 av_strlcat(str, "]", size);
61 av_strlcat(str, hostname, size);
66 /* Not an IPv6 address, just output the plain string. */
67 av_strlcat(str, hostname, size);
70 av_strlcatf(str, size, ":%d", port);
73 size_t len = strlen(str);
76 vsnprintf(str + len, size > len ? size - len : 0, fmt, vl);
82 static const char *find_delim(const char *delim, const char *cur, const char *end)
84 while (cur < end && !strchr(delim, *cur))
89 int ff_url_decompose(URLComponents *uc, const char *url, const char *end)
91 const char *cur, *aend, *p;
95 end = url + strlen(url);
100 p = find_delim(":/?#", cur, end); /* lavf "schemes" can contain options but not some RFC 3986 delimiters */
106 if (end - cur >= 2 && cur[0] == '/' && cur[1] == '/') {
108 aend = find_delim("/?#", cur, end);
112 p = find_delim("@", cur, aend);
118 if (*cur == '[') { /* hello IPv6, thanks for using colons! */
119 p = find_delim("]", cur, aend);
121 return AVERROR(EINVAL);
122 if (p + 1 < aend && p[1] != ':')
123 return AVERROR(EINVAL);
126 cur = find_delim(":", cur, aend);
133 uc->userinfo = uc->host = uc->port = cur;
138 cur = find_delim("?#", cur, end);
143 cur = find_delim("#", cur, end);
152 static int is_fq_dos_path(const char *path)
154 if ((path[0] >= 'a' && path[0] <= 'z' || path[0] >= 'A' && path[0] <= 'Z') &&
156 (path[2] == '/' || path[2] == '\\'))
158 if ((path[0] == '/' || path[0] == '\\') &&
159 (path[1] == '/' || path[1] == '\\'))
164 static int append_path(char *root, char *out_end, char **rout,
165 const char *in, const char *in_end)
168 const char *d, *next;
170 if (in < in_end && *in == '/')
171 in++; /* already taken care of */
172 while (in < in_end) {
173 d = find_delim("/", in, in_end);
174 next = d + (d < in_end && *d == '/');
175 if (d - in == 1 && in[0] == '.') {
177 } else if (d - in == 2 && in[0] == '.' && in[1] == '.') {
178 av_assert1(out[-1] == '/');
180 while (out > root && (--out)[-1] != '/');
182 if (out_end - out < next - in)
183 return AVERROR(ENOMEM);
184 memmove(out, in, next - in);
193 int ff_make_absolute_url(char *buf, int size, const char *base,
196 URLComponents ub, uc;
197 char *out, *out_end, *path;
198 const char *keep, *base_path_end;
199 int use_base_path, simplify_path = 0, ret;
200 const char *base_separators = "/";
203 For HTTP, http://server/site/page + ../media/file
204 should resolve into http://server/media/file
205 but for filesystem access, dir/playlist + ../media/file
206 should resolve into dir/../media/file
207 because dir could be a symlink, and .. points to
208 the actual parent of the target directory.
210 We'll consider that URLs with an actual scheme and authority,
211 i.e. starting with scheme://, need parent dir simplification,
212 while bare paths or pseudo-URLs starting with proto: without
213 the double slash do not.
215 For real URLs, the processing is similar to the algorithm described
217 https://tools.ietf.org/html/rfc3986#section-5
221 return AVERROR(ENOMEM);
223 out_end = buf + size - 1;
227 if (HAVE_DOS_PATHS) {
228 if ((ret = ff_url_decompose(&ub, base, NULL)) < 0)
230 if (is_fq_dos_path(base) || av_strstart(base, "file:", NULL) || ub.path == ub.url) {
231 base_separators = "/\\";
232 if (is_fq_dos_path(rel))
236 if ((ret = ff_url_decompose(&ub, base, NULL)) < 0 ||
237 (ret = ff_url_decompose(&uc, rel, NULL)) < 0)
241 #define KEEP(component, also) do { \
242 if (uc.url_component_end_##component == uc.url && \
243 ub.url_component_end_##component > keep) { \
244 keep = ub.url_component_end_##component; \
249 KEEP(authority_full, simplify_path = 1;);
254 #define COPY(start, end) do { \
255 size_t len = end - start; \
256 if (len > out_end - out) { \
257 ret = AVERROR(ENOMEM); \
260 memmove(out, start, len); \
264 COPY(uc.url, uc.path);
266 use_base_path = URL_COMPONENT_HAVE(ub, path) && keep <= ub.path;
267 if (uc.path > uc.url)
269 if (URL_COMPONENT_HAVE(uc, path) && uc.path[0] == '/')
272 base_path_end = ub.url_component_end_path;
273 if (URL_COMPONENT_HAVE(uc, path))
274 while (base_path_end > ub.path && !strchr(base_separators, base_path_end[-1]))
279 if (URL_COMPONENT_HAVE(uc, scheme))
281 if (URL_COMPONENT_HAVE(uc, authority))
283 /* No path at all, leave it */
284 if (!use_base_path && !URL_COMPONENT_HAVE(uc, path))
288 const char *root = "/";
289 COPY(root, root + 1);
292 ret = append_path(path, out_end, &out, ub.path, base_path_end);
296 if (URL_COMPONENT_HAVE(uc, path)) {
297 ret = append_path(path, out_end, &out, uc.path, uc.url_component_end_path);
303 COPY(ub.path, base_path_end);
304 COPY(uc.path, uc.url_component_end_path);
307 COPY(uc.url_component_end_path, uc.end);
313 snprintf(buf, size, "invalid:%s",
314 ret == AVERROR(ENOMEM) ? "truncated" :
315 ret == AVERROR(EINVAL) ? "syntax_error" : "");
319 AVIODirEntry *ff_alloc_dir_entry(void)
321 AVIODirEntry *entry = av_mallocz(sizeof(AVIODirEntry));
323 entry->type = AVIO_ENTRY_UNKNOWN;
325 entry->modification_timestamp = -1;
326 entry->access_timestamp = -1;
327 entry->status_change_timestamp = -1;
329 entry->group_id = -1;
330 entry->filemode = -1;