Skip site navigation (1)Skip section navigation (2)
Date:      Mon, 9 Apr 2012 16:50:51 -0400
From:      Ed Maste <emaste@freebsd.org>
To:        <freebsd-current@freebsd.org>
Subject:   [PATCH] percent-encoding for libfetch
Message-ID:  <20120409205051.GA27392@sandvine.com>

next in thread | raw e-mail | index | archive | help
--NDin8bjvE/0mNLFQ
Content-Type: text/plain; charset="us-ascii"
Content-Disposition: inline

Libfetch supports a username and password in a FTP or HTTP URL, but lacks
a method to specify '@' or ':' there, as they're used as URL component
separators.  I discovered this issue because I have an FTP server that
uses an email address as the username, and I can't use fetch(1) or
libfetch against it.

The attached patch adds decoding of percent-encoded usernames and
passwords, in order to use a URL like
ftp://foo%40example.com:password@host:port/file.bar .

Please review.  I plan to commit in the next few days.

-Ed

--NDin8bjvE/0mNLFQ
Content-Type: text/plain; charset="us-ascii"
Content-Disposition: attachment; filename="fetch.diff"

Index: fetch.c
===================================================================
--- fetch.c	(revision 233584)
+++ fetch.c	(working copy)
@@ -289,6 +289,49 @@
 }
 
 /*
+ * Return value of the given hex digit.
+ */
+static int
+fetch_hexval(char ch)
+{
+
+	if (ch >= '0' && ch <= '9')
+		return (ch - '0');
+	else if (ch >= 'a' && ch <= 'f')
+		return (ch - 'a' + 10);
+	else if (ch >= 'A' && ch <= 'F')
+		return (ch - 'A' + 10);
+	return (-1);
+}
+
+/*
+ * Decode percent-encoded URL component from src into dst, stopping at end
+ * of string, or at @ or : separators.  Returns a pointer to the unhandled
+ * part of the input string (null terminator, @, or :).  No terminator is
+ * written to dst (it is the caller's responsibility).
+ */
+static const char *
+fetch_pctdecode(char *dst, const char *src, size_t dlen)
+{
+	int d1, d2;
+	char c;
+	const char *s;
+
+	for (s = src; *s != '\0' && *s != '@' && *s != ':'; s++) {
+		if (s[0] == '%' && (d1 = fetch_hexval(s[1])) >= 0 &&
+		    (d2 = fetch_hexval(s[2])) >= 0) {
+			c = d1 << 4 | d2;
+			s += 2;
+		} else {
+			c = *s;
+		}
+		if (dlen-- > 0)
+			*dst++ = c;
+	}
+	return (s);
+}
+
+/*
  * Split an URL into components. URL syntax is:
  * [method:/][/[user[:pwd]@]host[:port]/][document]
  * This almost, but not quite, RFC1738 URL syntax.
@@ -329,15 +372,11 @@
 	p = strpbrk(URL, "/@");
 	if (p && *p == '@') {
 		/* username */
-		for (q = URL, i = 0; (*q != ':') && (*q != '@'); q++)
-			if (i < URL_USERLEN)
-				u->user[i++] = *q;
+		q = fetch_pctdecode(u->user, URL, URL_USERLEN);
 
 		/* password */
 		if (*q == ':')
-			for (q++, i = 0; (*q != ':') && (*q != '@'); q++)
-				if (i < URL_PWDLEN)
-					u->pwd[i++] = *q;
+			q = fetch_pctdecode(u->pwd, ++q, URL_PWDLEN);
 
 		p++;
 	} else {

--NDin8bjvE/0mNLFQ--



Want to link to this message? Use this URL: <https://mail-archive.FreeBSD.org/cgi/mid.cgi?20120409205051.GA27392>