From: Alex Schroeder Date: Wed, 4 Aug 2021 14:27:17 +0000 (+0200) Subject: Add IRI support X-Git-Tag: v3.3.0~22^2 X-Git-Url: https://thelambdalab.xyz/gitweb/index.cgi?p=elpher.git;a=commitdiff_plain;h=65621cde0534f742b5cbd9b523938b296bdd8080 Add IRI support When getting the address of a URL, use the current scheme as URL type, if one exists. If no scheme is provided for a URL, the current context specifies the scheme to use, so if we’re looking at a gemini page, then the default type is "gemini" even if elpher-default-url-type is "gopher". When creating the display-string for a page from a URL, use a new function that creates an IRI instead. It decodes percent-escapes and handles punycode in the host name. It also hides the password, if any, since that's what RFC 3986 says we should do. When getting the display-string of a Gemini link line without a text, do the same: don't just use the URL, use the corresponding IRI, decoding percent-escapes and handling punycode in the host name. When getting the URL of a Gemini link line, do the reverse: if this is an IRI instead of a URI, use punycode for the host; percent-escaping is already handled by url-generic-parse-url. --- diff --git a/elpher.el b/elpher.el index 2e3c5ec..925afa3 100644 --- a/elpher.el +++ b/elpher.el @@ -332,7 +332,7 @@ the start page." (unless (and (not (url-fullness url)) (url-type url)) (setf (url-fullness url) t) (unless (url-type url) - (setf (url-type url) elpher-default-url-type)) + (setf (url-type url) (elpher-get-default-url-type))) (unless (url-host url) (let ((p (split-string (url-filename url) "/" nil nil))) (setf (url-host url) (car p)) @@ -353,6 +353,18 @@ the start page." (elpher-remove-redundant-ports url)) (set-match-data data)))) +(defun elpher-get-default-url-type () + "Get the current URL type or `elpher-default-url-type'. 
+If no scheme is provided for a URL, the current context specifies +the scheme to use, so if we're looking at a gemini page, then the +default type is \"gemini\" even if `elpher-default-url-type' is +\"gopher\"." + (or (and elpher-current-page + (symbol-name + (elpher-address-type + (elpher-page-address elpher-current-page)))) + elpher-default-url-type)) + (defun elpher-remove-redundant-ports (address) "Remove redundant port specifiers from ADDRESS. Here 'redundant' means that the specified port matches the default @@ -502,9 +514,32 @@ If no address is defined, returns 0. (This is for compatibility with the URL li "Create a page with address and display string defined by URL. The URL is unhexed prior to its use as a display string to improve readability." - (elpher-make-page (elpher-decode (url-unhex-string url)) + (elpher-make-page (elpher-url-to-iri url) (elpher-address-from-url url))) +(defun elpher-url-to-iri (url) + "Return an IRI for URL. +Decode percent-escapes and handle punycode in the domain name. +Drop the password, if any." + (let* ((address (elpher-address-from-url (elpher-decode (url-unhex-string url)))) + (host (url-host address)) + (pass (url-password address))) + (when host + (setf (url-host address) (puny-decode-domain host))) + (when pass ; RFC 3986 says we should not render + (setf (url-password address) nil)) ; the password as clear text + (url-recreate-url address))) + +(defun elpher-encode-url (iri) + "Return an URL for the IRI. +Encode and use percent-escapes, use punycode for the domain name +if necessary." + (let* ((address (url-generic-parse-url iri)) + (host (url-host address))) + (when host + (setf (url-host address) (puny-encode-domain host))) + (url-recreate-url address))) + (defvar elpher-current-page nil "The current page for this Elpher buffer.") @@ -1416,7 +1451,7 @@ Returns nil in the event that the contents of the line following the => prefix are empty." 
(let ((l (split-string (substring link-line 2)))) (if l - (string-trim (elt l 0)) + (elpher-encode-url (string-trim (elt l 0))) nil))) (defun elpher-gemini-get-link-display-string (link-line) @@ -1426,7 +1461,7 @@ Returns the url portion in the event that the display-string portion is empty." (idx (string-match "[ \t]" rest))) (string-trim (if idx (substring rest (+ idx 1)) - rest)))) + (elpher-url-to-iri rest))))) (defun elpher-collapse-dot-sequences (filename) "Collapse dot sequences in FILENAME.