2013-01-05 10:08:07 -05:00
|
|
|
|
;;; GNU Guix --- Functional package management for GNU
|
2024-02-23 08:42:43 -05:00
|
|
|
|
;;; Copyright © 2012-2022, 2024 Ludovic Courtès <ludo@gnu.org>
|
2015-02-18 19:33:10 -05:00
|
|
|
|
;;; Copyright © 2015 Mark H Weaver <mhw@netris.org>
|
2017-08-28 09:46:10 -04:00
|
|
|
|
;;; Copyright © 2017 Tobias Geerinckx-Rice <me@tobias.gr>
|
2021-03-19 23:03:25 -04:00
|
|
|
|
;;; Copyright © 2021 Timothy Sample <samplet@ngyro.com>
|
2012-11-12 17:10:26 -05:00
|
|
|
|
;;;
|
2013-01-05 10:08:07 -05:00
|
|
|
|
;;; This file is part of GNU Guix.
|
2012-11-12 17:10:26 -05:00
|
|
|
|
;;;
|
2013-01-05 10:08:07 -05:00
|
|
|
|
;;; GNU Guix is free software; you can redistribute it and/or modify it
|
2012-11-12 17:10:26 -05:00
|
|
|
|
;;; under the terms of the GNU General Public License as published by
|
|
|
|
|
;;; the Free Software Foundation; either version 3 of the License, or (at
|
|
|
|
|
;;; your option) any later version.
|
|
|
|
|
;;;
|
2013-01-05 10:08:07 -05:00
|
|
|
|
;;; GNU Guix is distributed in the hope that it will be useful, but
|
2012-11-12 17:10:26 -05:00
|
|
|
|
;;; WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
|
;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
|
;;; GNU General Public License for more details.
|
|
|
|
|
;;;
|
|
|
|
|
;;; You should have received a copy of the GNU General Public License
|
2013-01-05 10:08:07 -05:00
|
|
|
|
;;; along with GNU Guix. If not, see <http://www.gnu.org/licenses/>.
|
2012-11-12 17:10:26 -05:00
|
|
|
|
|
|
|
|
|
(define-module (guix build download)
|
|
|
|
|
#:use-module (web uri)
|
2015-11-12 16:37:32 -05:00
|
|
|
|
#:use-module (web http)
|
2015-05-06 04:31:11 -04:00
|
|
|
|
#:use-module ((web client) #:hide (open-socket-for-uri))
|
2012-11-12 17:10:26 -05:00
|
|
|
|
#:use-module (web response)
|
2016-06-28 09:36:34 -04:00
|
|
|
|
#:use-module (guix base64)
|
2012-11-12 17:10:26 -05:00
|
|
|
|
#:use-module (guix ftp-client)
|
|
|
|
|
#:use-module (guix build utils)
|
Add (guix progress).
Among other things, this removes (guix utils), (guix ui), (guix config),
etc. from the closure of (guix build download), as was the case since
798648515b77507c242752457b4dc17c155bad6e.
* guix/utils.scm (<progress-reporter>, call-with-progress-reporter):
Move to...
* guix/progress.scm: ... here. New file.
* Makefile.am (MODULES): Add it.
* guix/build/download.scm (current-terminal-columns)
(nearest-exact-integer, duration->seconds, seconds->string)
(byte-count->string, progress-bar, string-pad-middle)
(rate-limited, progress-reporter/file, dump-port*)
(time-monotonic): Move to progress.scm.
* guix/scripts/download.scm: Adjust accordingly.
* guix/scripts/substitute.scm: Likewise.
2017-10-16 17:16:39 -04:00
|
|
|
|
#:use-module (guix progress)
|
2022-03-03 16:42:31 -05:00
|
|
|
|
#:use-module (guix memoization)
|
2012-11-12 17:10:26 -05:00
|
|
|
|
#:use-module (rnrs io ports)
|
2016-06-28 09:36:34 -04:00
|
|
|
|
#:use-module (rnrs bytevectors)
|
2012-11-12 17:20:06 -05:00
|
|
|
|
#:use-module (srfi srfi-1)
|
2012-11-12 17:10:26 -05:00
|
|
|
|
#:use-module (srfi srfi-11)
|
2015-02-27 09:00:38 -05:00
|
|
|
|
#:use-module (srfi srfi-19)
|
2012-11-12 17:20:06 -05:00
|
|
|
|
#:use-module (srfi srfi-26)
|
2016-11-07 17:07:08 -05:00
|
|
|
|
#:autoload (ice-9 ftw) (scandir)
|
2021-03-19 23:03:25 -04:00
|
|
|
|
#:autoload (guix base16) (bytevector->base16-string)
|
2021-10-14 08:54:49 -04:00
|
|
|
|
#:autoload (guix swh) (swh-download-directory %verify-swh-certificate?)
|
2012-11-12 17:10:26 -05:00
|
|
|
|
#:use-module (ice-9 match)
|
2013-01-06 12:24:53 -05:00
|
|
|
|
#:use-module (ice-9 format)
|
2024-02-23 08:42:43 -05:00
|
|
|
|
#:export (%download-methods
|
|
|
|
|
download-method-enabled?
|
|
|
|
|
|
|
|
|
|
open-socket-for-uri
|
2015-05-06 04:31:11 -04:00
|
|
|
|
open-connection-for-uri
|
2017-10-16 16:31:50 -04:00
|
|
|
|
http-fetch
|
2017-03-13 16:51:27 -04:00
|
|
|
|
%x509-certificate-directory
|
2016-03-17 16:34:33 -04:00
|
|
|
|
close-connection
|
2015-02-18 19:33:10 -05:00
|
|
|
|
resolve-uri-reference
|
2014-12-29 14:51:12 -05:00
|
|
|
|
maybe-expand-mirrors
|
2014-12-28 11:55:16 -05:00
|
|
|
|
url-fetch
|
2015-09-15 01:31:11 -04:00
|
|
|
|
byte-count->string
|
|
|
|
|
uri-abbreviation
|
2016-04-20 17:01:41 -04:00
|
|
|
|
nar-uri-abbreviation
|
2015-09-15 01:31:11 -04:00
|
|
|
|
store-path-abbreviation))
|
2012-11-12 17:10:26 -05:00
|
|
|
|
|
|
|
|
|
;;; Commentary:
|
|
|
|
|
;;;
|
|
|
|
|
;;; Fetch data such as tarballs over HTTP or FTP (builder-side code).
|
|
|
|
|
;;;
|
|
|
|
|
;;; Code:
|
|
|
|
|
|
2015-02-27 08:57:54 -05:00
|
|
|
|
;; Number of bytes used for the receive buffer of HTTP connections (64 KiB).
(define %http-receive-buffer-size
  (* 64 1024))
|
|
|
|
|
|
2015-10-01 05:28:58 -04:00
|
|
|
|
(define* (ellipsis #:optional (port (current-output-port)))
  "Return the string used to mark elided text written to PORT: Unicode's
HORIZONTAL ELLIPSIS when PORT's encoding is UTF-8, and three ASCII dots
otherwise.  This is only a rough guess at what PORT's encoding can represent."
  (let ((encoding (port-encoding port)))
    (cond ((equal? encoding "UTF-8") "…")
          (else "..."))))
|
|
|
|
|
|
2015-09-15 01:31:11 -04:00
|
|
|
|
(define* (store-path-abbreviation store-path #:optional (prefix-length 6))
  "If STORE-PATH is the file name of a store entry, return an abbreviation of
STORE-PATH for display, showing PREFIX-LENGTH characters of the hash.
Otherwise return STORE-PATH.  STORE-PATH is also returned unchanged when its
base name has fewer than 32 characters, since there is then nothing to elide."
  (if (string-prefix? (%store-directory) store-path)
      (let* ((base (basename store-path))
             (len  (string-length base)))
        ;; The first 32 characters of BASE are elided below; a shorter BASE
        ;; would make 'string-take' or 'string-drop' raise an out-of-range
        ;; error, so leave such names alone.
        (if (>= len 32)
            (string-append (string-take base (min prefix-length len))
                           (ellipsis)
                           (string-drop base 32))
            store-path))
      store-path))
|
2015-09-15 01:31:11 -04:00
|
|
|
|
|
2013-01-11 09:41:58 -05:00
|
|
|
|
(define* (uri-abbreviation uri #:optional (max-length 42))
  "Return a string representing URI that is suitable for display.  When URI's
string representation is longer than MAX-LENGTH, try an abbreviation showing
the scheme, the host, and the base name of the file; that abbreviation is
returned only when it is actually shorter than the full string."
  (define full
    (uri->string uri))

  (define (abbreviated)
    ;; Build "SCHEME://HOST/…/BASE"; when even that exceeds MAX-LENGTH, drop
    ;; the first half of BASE as well.
    (let* ((file      (basename (uri-path uri)))
           (head      (string-append (symbol->string (uri-scheme uri)) "://"

                                     ;; 'uri-host' is #f for `file' URIs.
                                     (or (uri-host uri) "")

                                     (string-append "/" (ellipsis) "/")))
           (too-long? (> (+ (string-length head) (string-length file))
                         max-length)))
      (string-append head
                     (if too-long?
                         (string-append
                          (ellipsis)
                          (string-drop file
                                       (quotient (string-length file) 2)))
                         file))))

  (cond ((<= (string-length full) max-length)
         full)
        (else
         (let ((short (abbreviated)))
           (if (< (string-length short) (string-length full))
               short
               full)))))
|
|
|
|
|
|
2016-04-20 17:01:41 -04:00
|
|
|
|
(define (nar-uri-abbreviation uri)
  "Return a short name for URI, a string or URI object assumed to designate a
nar as served by Hydra and 'guix publish', something like
\"http://example.org/nar/1ldrllwbna0aw5z8kpci4fsvbd2w8cw4-texlive-bin-2015\".
The result is the base name of URI's path, minus its first 33 characters when
the 33rd one is a dash."
  (define file
    (basename (uri-path (if (string? uri)
                            (string->uri uri)
                            uri))))

  (define hash-prefixed?
    (and (> (string-length file) 33)
         (char=? #\- (string-ref file 32))))

  (if hash-prefixed?
      (string-drop file 33)
      file))
|
|
|
|
|
|
2018-09-12 09:08:38 -04:00
|
|
|
|
(define* (ftp-fetch uri file #:key timeout print-build-trace?)
  "Download the data at URI, an FTP URI, and store it in FILE.  Return FILE on
success.  Give up if the connection could not be established in less than
TIMEOUT seconds.  When PRINT-BUILD-TRACE? is true, report progress with
'progress-reporter/trace' instead of 'progress-reporter/file'."
  (define path
    (uri-path uri))

  (define (connect . credentials)
    ;; Open the FTP connection, passing CREDENTIALS, a possibly empty list of
    ;; #:username/#:password keyword arguments.
    (apply ftp-open (uri-host uri) #:timeout timeout credentials))

  (let* ((conn (match (and=> (uri-userinfo uri)
                             (lambda (userinfo)
                               (string-split userinfo #\:)))
                 (((? string? user))
                  (connect #:username user))
                 (((? string? user) (? string? pass))
                  (connect #:username user #:password pass))
                 (_
                  (connect))))
         ;; The size is only used for progress reports, so it is fine if the
         ;; server cannot tell.
         (size (false-if-exception (ftp-size conn path)))
         (in   (ftp-retr conn (basename path) (dirname path)
                         #:timeout timeout)))
    (call-with-output-file file
      (lambda (out)
        (let ((reporter (if print-build-trace?
                            (progress-reporter/trace
                             file (uri->string uri) size)
                            (progress-reporter/file
                             (uri-abbreviation uri) size))))
          (dump-port* in out
                      #:buffer-size %http-receive-buffer-size
                      #:reporter reporter))))

    (ftp-close conn)
    (unless print-build-trace?
      (newline))
    file))
|
2012-11-12 17:10:26 -05:00
|
|
|
|
|
2013-01-20 16:28:38 -05:00
|
|
|
|
;; Autoload GnuTLS so that this module can be used even when GnuTLS is
|
|
|
|
|
;; not available. At compile time, this yields "possibly unbound
|
|
|
|
|
;; variable" warnings, but these are OK: we know that the variables will
|
|
|
|
|
;; be bound if we need them, because (guix download) adds GnuTLS as an
|
|
|
|
|
;; input in that case.
|
|
|
|
|
|
2020-01-06 09:14:09 -05:00
|
|
|
|
(define (load-gnutls)
  ;; XXX: Make the bindings of (gnutls) visible in this module at run time.
  ;; This hack is used instead of #:autoload to avoid compilation errors; see
  ;; <http://bugs.gnu.org/12202>.
  (let* ((this-module (resolve-module '(guix build download)))
         (gnutls      (resolve-interface '(gnutls))))
    (module-use! this-module gnutls))

  ;; The job is done: turn subsequent calls into no-ops.
  (set! load-gnutls (const #t)))
|
2013-01-20 16:28:38 -05:00
|
|
|
|
|
2016-11-07 17:07:08 -05:00
|
|
|
|
(define %x509-certificate-directory
  ;; Parameter holding the name of the directory where X.509 authority PEM
  ;; certificates are stored.  Its initial value comes from the environment,
  ;; with "/etc/ssl/certs" as the fallback.
  (make-parameter
   (cond ((getenv "GUIX_TLS_CERTIFICATE_DIRECTORY") => identity)
         ((getenv "SSL_CERT_DIR") => identity)    ;like OpenSSL
         (else "/etc/ssl/certs"))))
|
2016-11-07 17:07:08 -05:00
|
|
|
|
|
2017-05-30 04:11:13 -04:00
|
|
|
|
(define (set-certificate-credentials-x509-trust-file!* cred file format)
  "Add the certificates found in FILE, in the given FORMAT, to CRED.  This is
like 'set-certificate-credentials-x509-trust-file!', except that FILE is read
here and its contents are passed to GnuTLS, which avoids the file name
decoding bug described at
<https://debbugs.gnu.org/cgi/bugreport.cgi?bug=26948#17>."
  (set-certificate-credentials-x509-trust-data!
   cred
   (call-with-input-file file get-bytevector-all)
   format))
|
|
|
|
|
|
2022-03-03 16:44:25 -05:00
|
|
|
|
(define make-credentials-with-ca-trust-files
  (mlambda (directory)
    "Return certificate credentials holding the X.509 authority certificates
found in DIRECTORY.  Those authority certificates are checked when
'peer-certificate-status' is later called."
    ;; The procedure is memoized so that the certificates are not scanned
    ;; every time a connection is made.
    (let* ((pem-files (scandir directory
                               (lambda (name)
                                 (string-suffix? ".pem" name))))
           (files     (if (or (not pem-files) (null? pem-files))
                          ;; Some distros provide nothing but bundles (*.crt)
                          ;; under /etc/ssl/certs, so look for them.
                          (or (scandir directory
                                       (lambda (name)
                                         (string-suffix? ".crt" name)))
                              '())
                          pem-files))
           (cred      (make-certificate-credentials)))
      (for-each (lambda (name)
                  (let ((full-name (string-append directory "/" name)))
                    ;; 'file-exists?' is false for dangling symlinks; skip
                    ;; them.
                    (when (file-exists? full-name)
                      (set-certificate-credentials-x509-trust-file!*
                       cred full-name
                       x509-certificate-format/pem))))
                files)
      cred)))
|
2016-11-07 17:07:08 -05:00
|
|
|
|
|
|
|
|
|
(define (peer-certificate session)
  "Return the certificate of the remote peer in SESSION, imported from the
first (DER-encoded) element of SESSION's peer certificate chain."
  (let ((chain (session-peer-certificate-chain session)))
    (match chain
      ((leaf _ ...)
       (import-x509-certificate leaf x509-certificate-format/der)))))
|
|
|
|
|
|
|
|
|
|
(define (assert-valid-server-certificate session server)
  "Return #t if the certificate of the remote peer for SESSION is a valid
certificate for SERVER, where SERVER is the expected host name of peer.
Otherwise throw to 'tls-certificate-error', either with 'host-mismatch or
with 'invalid-certificate and the list of certificate statuses."
  (let ((cert (peer-certificate session)))
    (if (x509-certificate-matches-hostname? cert server)
        ;; The host name matches.  Now check the certificate's validity and
        ;; its reachability from the set of authority certificates loaded
        ;; into the session's credentials.
        (match (peer-certificate-status session)
          (()                                     ;certificate is valid
           #t)
          ((problems ...)
           (throw 'tls-certificate-error 'invalid-certificate cert server
                  problems)))
        (throw 'tls-certificate-error 'host-mismatch cert server))))
|
|
|
|
|
|
|
|
|
|
(define (print-tls-certificate-error port key args default-printer)
  "Print on PORT the TLS certificate error represented by ARGS in an
intelligible way.  ARGS is the list of arguments of a 'tls-certificate-error'
exception.  When ARGS has an unexpected shape, call DEFAULT-PRINTER, the thunk
passed by Guile's exception-printing machinery, instead of failing with a
match error."
  (match args
    (('host-mismatch cert server)
     (format port
             "X.509 server certificate for '~a' does not match: ~a~%"
             server (x509-certificate-dn cert)))
    (('invalid-certificate cert server statuses)
     (format port
             "X.509 certificate of '~a' could not be verified:~%~{  ~a~%~}"
             server
             (map certificate-status->string statuses)))
    (_
     ;; Unknown kind of certificate error: fall back to the generic message.
     (default-printer))))

;; Have 'print-exception' use the procedure above for our exceptions.
(set-exception-printer! 'tls-certificate-error
                        print-tls-certificate-error)
|
|
|
|
|
|
2022-08-01 05:01:52 -04:00
|
|
|
|
(define (wrap-record-port-for-gnutls<3.7.7 record port)
  "Return a port that wraps RECORD, a TLS session record port, such that
closing it also closes PORT, the actual socket port, and its file descriptor.
The returned port is unbuffered so that it does not introduce extra buffering
(custom ports are buffered by default as of Guile 3.0.5).

This wrapper is unnecessary with GnuTLS >= 3.7.7, which can automatically
close the underlying file descriptor when RECORD is closed."
  (define (read! bv start count)
    (let ((result
           (catch 'gnutls-error
             (lambda ()
               (get-bytevector-n! record bv start count))
             (lambda (key err proc . rest)
               ;; When responding to "Connection: close" requests, some
               ;; servers close the connection abruptly after sending the
               ;; response body, without doing a proper TLS connection
               ;; termination.  Treat it as EOF.  This is fixed in GnuTLS
               ;; 3.7.7.
               (if (eq? err error/premature-termination)
                   the-eof-object
                   (apply throw key err proc rest))))))
      ;; Custom binary ports signal end-of-file by returning zero.
      (if (eof-object? result)
          0
          result)))

  (define (write! bv start count)
    (put-bytevector record bv start count)
    (force-output record)
    count)

  (define (close)
    ;; Close the socket first, then the record port, skipping those already
    ;; closed.
    (for-each (lambda (p)
                (unless (port-closed? p)
                  (close-port p)))
              (list port record)))

  (let ((wrapped (make-custom-binary-input/output-port
                  "gnutls wrapped port" read! write!
                  (lambda ()
                    (port-position record))
                  (lambda (new-position)
                    (set-port-position! record new-position))
                  close)))
    (setvbuf wrapped 'none)
    wrapped))
|
|
|
|
|
|
2016-11-07 17:07:08 -05:00
|
|
|
|
(define* (tls-wrap port server #:key (verify-certificate? #t))
  "Return PORT wrapped in a TLS connection to SERVER.  SERVER must be a DNS
host name without trailing dot.  When VERIFY-CERTIFICATE? is true, check the
server's certificate once the handshake is complete; if that check fails,
close PORT and re-throw the 'tls-certificate-error' exception."
  (define (log level str)
    ;; Only referenced by the commented-out debugging lines below.
    (format (current-error-port)
            "gnutls: [~a|~a] ~a" (getpid) level str))

  (load-gnutls)
  (let ((session  (make-session connection-end/client))
        (ca-certs (%x509-certificate-directory)))

    ;; Some servers such as 'cloud.github.com' require the client to support
    ;; the 'SERVER NAME' extension.  However, 'set-session-server-name!' is
    ;; not available in older GnuTLS releases.  See
    ;; <http://bugs.gnu.org/18526> for details.
    (if (module-defined? (resolve-interface '(gnutls))
                         'set-session-server-name!)
        (set-session-server-name! session server-name-type/dns server)
        (format (current-error-port)
                "warning: TLS 'SERVER NAME' extension not supported~%"))

    (set-session-transport-fd! session (fileno port))
    (set-session-default-priority! session)

    ;; The "%COMPAT" bit allows us to work around firewall issues (info
    ;; "(gnutls) Priority Strings"); see <http://bugs.gnu.org/23311>.
    ;; Explicitly disable SSLv3, which is insecure:
    ;; <https://tools.ietf.org/html/rfc7568>.
    (set-session-priorities! session "NORMAL:%COMPAT:-VERS-SSL3.0")

    (set-session-credentials! session
                              (if (and verify-certificate? ca-certs)
                                  (make-credentials-with-ca-trust-files
                                   ca-certs)
                                  (make-certificate-credentials)))

    ;; Uncomment the following lines in case of debugging emergency.
    ;;(set-log-level! 10)
    ;;(set-log-procedure! log)

    ;; Perform the handshake, retrying a bounded number of times upon
    ;; non-fatal conditions.  Every retry goes through LOOP so that errors
    ;; raised by the retried handshake are handled here too, instead of
    ;; escaping from the handler.
    (let loop ((retries 5))
      (catch 'gnutls-error
        (lambda ()
          (handshake session))
        (lambda (key err proc . rest)
          (cond ((and (eq? err error/warning-alert-received)
                      (positive? retries))
                 ;; Like Wget, do not stop upon non-fatal alerts such as
                 ;; 'alert-description/unrecognized-name'.
                 (format (current-error-port)
                         "warning: TLS warning alert received: ~a~%"
                         (alert-description->string (alert-get session)))
                 (loop (- retries 1)))
                ((or (fatal-error? err) (zero? retries))
                 (apply throw key err proc rest))
                (else
                 ;; We got 'error/again' or similar; try again.
                 (format (current-error-port)
                         "warning: TLS non-fatal error: ~a~%"
                         (error->string err))
                 (loop (- retries 1)))))))

    ;; Verify the server's certificate if needed.
    (when verify-certificate?
      (catch 'tls-certificate-error
        (lambda ()
          (assert-valid-server-certificate session server))
        (lambda args
          ;; Do not leave the socket open behind us.
          (close-port port)
          (apply throw args))))

    (let ((record (session-record-port session)))
      (setvbuf record 'block)
      (if (module-defined? (resolve-interface '(gnutls))
                           'set-session-record-port-close!) ;GnuTLS >= 3.7.7
          ;; Arrange for PORT to be closed when RECORD is closed.
          (let ((close-wrapped-port (lambda (_) (close-port port))))
            (set-session-record-port-close! record close-wrapped-port)
            record)
          (wrap-record-port-for-gnutls<3.7.7 record port)))))
|
2013-01-20 16:28:38 -05:00
|
|
|
|
|
2015-11-12 16:37:32 -05:00
|
|
|
|
(define (ensure-uri uri-or-string)                ;XXX: copied from (web http)
  "Return URI-OR-STRING as a URI object: strings are parsed with
'string->uri' and URI objects are returned as is.  Raise an \"Invalid URI\"
error for any other kind of object, and for strings that cannot be parsed."
  (cond
   ((string? uri-or-string)
    ;; 'string->uri' returns #f for strings it cannot parse; report that here
    ;; rather than handing #f to the caller.
    (or (string->uri uri-or-string)
        (error "Invalid URI" uri-or-string)))
   ((uri? uri-or-string) uri-or-string)
   (else (error "Invalid URI" uri-or-string))))
|
|
|
|
|
|
|
|
|
|
(define* (open-socket-for-uri uri-or-string #:key timeout)
  "Return an open input/output port for a connection to URI-OR-STRING, or to
the current HTTP proxy when there is one.  When TIMEOUT is not #f, it must be
a (possibly inexact) number denoting the maximum duration in seconds to wait
for the connection to complete; once TIMEOUT has elapsed, an ETIMEDOUT error
is raised."
  ;; Includes a fix for <http://bugs.gnu.org/15368> which affects Guile's
  ;; 'open-socket-for-uri' up to 2.0.11 included, uses 'connect*' instead
  ;; of 'connect', and uses AI_ADDRCONFIG.

  (define http-proxy (current-http-proxy))
  (define uri (ensure-uri (or http-proxy uri-or-string)))

  (define (same-address? ai1 ai2)
    (equal? (addrinfo:addr ai1) (addrinfo:addr ai2)))

  (define addresses
    ;; Candidate addresses, without duplicates.
    (let* ((port    (uri-port uri))
           (service (if port
                        (number->string port)
                        (symbol->string (uri-scheme uri))))
           (flags   (if (number? port)
                        (logior AI_ADDRCONFIG AI_NUMERICSERV)
                        AI_ADDRCONFIG)))
      (delete-duplicates (getaddrinfo (uri-host uri) service flags)
                         same-address?)))

  ;; Try each address in turn; the error of the last attempt is the one that
  ;; is propagated.
  (let try ((remaining addresses))
    (let* ((ai     (car remaining))
           (others (cdr remaining))
           (sock   (with-fluids ((%default-port-encoding #f))
                     ;; Restrict ourselves to TCP.
                     (socket (addrinfo:fam ai) SOCK_STREAM IPPROTO_IP))))
      (catch 'system-error
        (lambda ()
          (connect* sock (addrinfo:addr ai) timeout)

          ;; Buffer input and output on this port.
          (setvbuf sock 'block)
          ;; If we're using a proxy, make a note of that.
          (when http-proxy (set-http-proxy-port?! sock #t))
          sock)
        (lambda args
          ;; Connection failed, so try one of the other addresses.
          (close sock)
          (if (null? others)
              (apply throw args)
              (try others)))))))
|
|
|
|
|
|
2019-05-10 09:27:40 -04:00
|
|
|
|
(define (setup-http-tunnel port uri)
  "Establish over PORT an HTTP tunnel to the destination server of URI: send
a 'CONNECT' request for URI's host and port (defaulting to 80 for 'http' and
443 for 'https') and return the response read back from PORT."
  (let* ((destination-port (or (uri-port uri)
                               (match (uri-scheme uri)
                                 ('http 80)
                                 ('https 443))))
         (target           (string-append (uri-host uri) ":"
                                          (number->string destination-port))))
    (format port "CONNECT ~a HTTP/1.1\r\n" target)
    (format port "Host: ~a\r\n\r\n" target)
    (force-output port)
    (read-response port)))
|
|
|
|
|
|
2016-11-07 17:07:08 -05:00
|
|
|
|
(define* (open-connection-for-uri uri
                                  #:key
                                  timeout
                                  (verify-certificate? #t))
  "Return an open port for a connection to URI.  This is like
'open-socket-for-uri', but HTTPS connections are handled as well: they are
wrapped in TLS, going through the proxy designated by the 'https_proxy'
environment variable if it is set.  When VERIFY-CERTIFICATE? is true, verify
HTTPS server certificates."
  ;; Note: Guile 2.2.0's (web client) has a same-named export that's actually
  ;; undefined.  See Guile commit 011669af3b428e5626f7bbf66b11d57d9768c047.

  (define https?
    (eq? 'https (uri-scheme uri)))

  (define https-proxy
    ;; Value of 'https_proxy', or #f if it is unset or empty.
    (let ((value (getenv "https_proxy")))
      (if (equal? value "")
          #f
          value)))

  (define (call-with-proxy-settings thunk)
    ;; For HTTPS URIs, honor 'https_proxy', not 'http_proxy'.
    (if (and https?
             (module-variable
              (resolve-interface '(web client))
              'current-http-proxy))
        (parameterize ((current-http-proxy https-proxy))
          (thunk))
        (thunk)))

  (define (connect)
    (let ((s (open-socket-for-uri uri #:timeout timeout)))
      ;; Buffer input and output on this port.
      (setvbuf s 'block %http-receive-buffer-size)

      ;; HTTPS through a proxy requires a tunnel to the actual server.
      (when (and https? https-proxy)
        (setup-http-tunnel s uri))

      (if https?
          (tls-wrap s (uri-host uri)
                    #:verify-certificate? verify-certificate?)
          s)))

  (call-with-proxy-settings connect))
|
2012-11-12 17:10:26 -05:00
|
|
|
|
|
2020-01-03 09:47:12 -05:00
|
|
|
|
(define (close-connection port)                   ;deprecated
  ;; Close PORT, unless that has already been done.
  (when (not (port-closed? port))
    (close-port port)))
|
2016-03-17 16:34:33 -04:00
|
|
|
|
|
2012-11-12 17:10:26 -05:00
|
|
|
|
;; XXX: Awful hack: define 'set-port-encoding!' as a no-op in the
;; (web response) module so that the (set-port-encoding! p "ISO-8859-1") call
;; in `read-response' passes, even during bootstrap where iconv is not
;; available.
(module-define! (resolve-module '(web response))
                'set-port-encoding!
                (lambda (port encoding)
                  #f))
|
|
|
|
|
|
2015-02-18 19:33:10 -05:00
|
|
|
|
(define (resolve-uri-reference ref base)
  "Return the target URI obtained by resolving the URI reference REF relative
to the BASE URI, according to the algorithm specified in RFC 3986 section
5.2.2."

  (define (merge-paths base-path rel-path)
    ;; Replace the last component of BASE-PATH with REL-PATH.
    (let ((directory (match (string-split base-path #\/)
                       ((leading ... _) leading)
                       (() '()))))
      (string-append (string-join directory "/") "/" rel-path)))

  (define (leading-dots? component)
    (match component
      ((or "." "..") #t)
      (_ #f)))

  (define (remove-dot-segments path)
    ;; Drop leading "." and ".." components from a relative path (absolute
    ;; paths will start with a "" component), then resolve the remaining "."
    ;; and ".." components.  KEPT holds the retained components in reverse
    ;; order.
    (let loop ((pending (drop-while leading-dots? (string-split path #\/)))
               (kept    '()))
      (match pending
        (()
         (string-join (reverse kept) "/"))
        (("." . tail)
         (loop tail kept))
        ((".." . tail)
         (match kept
           ((or () (""))
            (error "remove-dot-segments: too many '..' components" path))
           (_
            (loop tail (cdr kept)))))
        ((component . tail)
         (loop tail (cons component kept))))))

  (define (relative-to-base path query)
    ;; Build a URI with the scheme and authority of BASE, the given PATH and
    ;; QUERY, and the fragment of REF.
    (build-uri (uri-scheme base)
               #:userinfo (uri-userinfo base)
               #:host (uri-host base)
               #:port (uri-port base)
               #:path (remove-dot-segments path)
               #:query query
               #:fragment (uri-fragment ref)))

  (cond ((or (uri-scheme ref) (uri-host ref))
         ;; REF has its own scheme or authority: only the scheme may come
         ;; from BASE.
         (build-uri (or (uri-scheme ref) (uri-scheme base))
                    #:userinfo (uri-userinfo ref)
                    #:host (uri-host ref)
                    #:port (uri-port ref)
                    #:path (remove-dot-segments (uri-path ref))
                    #:query (uri-query ref)
                    #:fragment (uri-fragment ref)))
        ((string-null? (uri-path ref))
         ;; Empty path: keep that of BASE, and its query unless REF has one.
         (relative-to-base (uri-path base)
                           (or (uri-query ref) (uri-query base))))
        ((string-prefix? "/" (uri-path ref))
         ;; Absolute path.
         (relative-to-base (uri-path ref) (uri-query ref)))
        (else
         ;; Relative path: merge it with that of BASE.
         (relative-to-base (merge-paths (uri-path base) (uri-path ref))
                           (uri-query ref)))))
|
|
|
|
|
|
2017-10-16 16:31:50 -04:00
|
|
|
|
(define* (http-fetch uri #:key timeout (verify-certificate? #t))
  "Return an input port containing the data at URI, and the expected number of
bytes available or #f.  When TIMEOUT is true, bail out if the connection could
not be established in less than TIMEOUT seconds.  When VERIFY-CERTIFICATE? is
true, verify HTTPS certificates; otherwise simply ignore them.

Redirections (301, 302, 303, 307, 308) are followed.  For any other status
code, and for redirections that lack a 'Location' header, the connection is
closed and a \"download failed\" error is raised."

  (define headers
    `(;; Some web sites, such as http://dist.schmorp.de, would block you if
      ;; there's no 'User-Agent' header, presumably on the assumption that
      ;; you're a spammer.  So work around that.
      (User-Agent . "GNU Guile")

      ;; Some servers, such as https://alioth.debian.org, return "406 Not
      ;; Acceptable" when not explicitly told that everything is accepted.
      (Accept . "*/*")

      ;; Basic authentication, if needed.
      ,@(match (uri-userinfo uri)
          ((? string? str)
           `((Authorization . ,(string-append "Basic "
                                              (base64-encode
                                               (string->utf8 str))))))
          (_ '()))))

  (let*-values (((connection)
                 (open-connection-for-uri uri
                                          #:timeout timeout
                                          #:verify-certificate?
                                          verify-certificate?))
                ((resp port)
                 (http-get uri #:port connection #:decode-body? #f
                           #:streaming? #t
                           #:headers headers))
                ((code)
                 (response-code resp)))
    (case code
      ((200)                                      ; OK
       (values port (response-content-length resp)))
      ((301                                       ; moved permanently
        302                                       ; found (redirection)
        303                                       ; see other
        307                                       ; temporary redirection
        308)                                      ; permanent redirection
       (let ((location (response-location resp)))
         ;; A redirection without a 'Location' header cannot be followed;
         ;; report it as a download failure rather than passing #f to
         ;; 'resolve-uri-reference'.
         (unless location
           (false-if-exception (close-port connection))
           (error "download failed" (uri->string uri)
                  code "redirection without a 'Location' header"))
         (let ((uri (resolve-uri-reference location uri)))
           (format #t "following redirection to `~a'...~%"
                   (uri->string uri))
           (close connection)
           (http-fetch uri
                       #:timeout timeout
                       #:verify-certificate? verify-certificate?))))
      (else
       ;; Do not leak the connection when giving up.
       (false-if-exception (close-port connection))
       (error "download failed" (uri->string uri)
              code (response-reason-phrase resp))))))
|
2012-11-12 17:10:26 -05:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
(define-syntax-rule (false-if-exception* body ...)
  "Evaluate BODY... and return its result.  If an exception is raised, print
it on the current error port and return #f, like `false-if-exception' would."
  (catch #t
    (lambda ()
      body ...)
    ;; Handler: the exception was already reported by the pre-unwind handler
    ;; below, so just return #f.
    (lambda exception
      #f)
    ;; Pre-unwind handler: report the exception.
    (lambda (key . args)
      (print-exception (current-error-port) #f key args))))
|
|
|
|
|
|
2024-02-23 08:42:43 -05:00
|
|
|
|
(define %download-methods
  ;; Parameter whose value is either #f (the default) or a list of symbols
  ;; denoting the sequence of download methods to be used--e.g.,
  ;; '(swh nar upstream).  The initial value is taken from the
  ;; 'GUIX_DOWNLOAD_METHODS' environment variable when it is set: its value
  ;; is split with 'string-tokenize' and each token becomes a symbol.
  (let ((value (getenv "GUIX_DOWNLOAD_METHODS")))
    (make-parameter
     (if value
         (map string->symbol (string-tokenize value))
         #f))))
|
|
|
|
|
|
|
|
|
|
(define (download-method-enabled? method)
  "Return true if METHOD, a symbol such as 'swh, is part of the download
fallback sequence.  When '%download-methods' holds #f, every method is
considered enabled."
  (let ((methods (%download-methods)))
    (if methods
        (memq method methods)
        #t)))
|
|
|
|
|
|
2014-12-29 14:51:12 -05:00
|
|
|
|
(define (uri-vicinity dir file)
  "Return DIR and FILE joined by a single slash: trailing slashes of DIR and
leading slashes of FILE are removed before concatenating.  This is required by
some HTTP servers."
  (let ((base (string-trim-right dir #\/))
        (leaf (string-trim file #\/)))
    (string-append base "/" leaf)))
|
|
|
|
|
|
|
|
|
|
(define (maybe-expand-mirrors uri mirrors)
  "Return a list of URIs for URI.  If URI uses the 'mirror' scheme, its host
part names an entry of the MIRRORS alist and the result has one URI per mirror
listed there, each extended with the path of URI; an error is raised when
MIRRORS has no non-empty entry for it.  Any other URI is returned unchanged, as
a one-element list."
  (if (eq? 'mirror (uri-scheme uri))
      (let* ((kind (string->symbol (uri-host uri)))
             (path (uri-path uri)))
        (match (assoc-ref mirrors kind)
          ((urls ..1)
           (map (lambda (base)
                  (string->uri (uri-vicinity base path)))
                urls))
          (_
           (error "unsupported URL mirror kind" kind uri))))
      (list uri)))
|
|
|
|
|
|
2021-03-19 23:03:25 -04:00
|
|
|
|
(define* (disarchive-fetch/any uris file
                               #:key (timeout 10) (verify-certificate? #t))
  "Try each of URIS in turn until a Disarchive specification can be read from
one of them, then have Disarchive assemble it and write the output to FILE.
Return #f when the 'disarchive' module cannot be loaded, when no specification
could be fetched, or when assembly throws.  TIMEOUT and VERIFY-CERTIFICATE? are
passed to 'http-fetch'."
  (define (fetch-specification/one uri)
    ;; Read one datum from URI and return it, or #f if anything throws.
    (false-if-exception*
     (call-with-values
         (lambda ()
           (http-fetch uri
                       #:verify-certificate? verify-certificate?
                       #:timeout timeout))
       (lambda (port size)
         (format #t "Retrieving Disarchive spec from ~a ...~%"
                 (uri->string uri))
         (let ((specification (read port)))
           (close-port port)
           specification)))))

  (define (resolve-address address output)
    ;; Only addresses of the form (swhid "swh:1:dir:ID") are handled; they
    ;; are downloaded to OUTPUT with 'swh-download-directory'.
    (match address
      (('swhid swhid)
       (match (string-split swhid #\:)
         (("swh" "1" "dir" id)
          (format #t "Downloading ~a from Software Heritage...~%" file)
          (false-if-exception*
           (swh-download-directory id output)))
         (_ #f)))
      (_ #f)))

  (define (resolve addresses output)
    ;; Procedure passed as the #:resolver argument of 'disarchive-assemble':
    ;; return the first true result obtained from ADDRESSES, or #f.
    (any (lambda (address)
           (resolve-address address output))
         addresses))

  (format #t "Trying to use Disarchive to assemble ~a...~%" file)
  ;; Disarchive is looked up at run time so that it remains optional.
  (let ((disarchive (resolve-module '(disarchive) #:ensure #f)))
    (if (not disarchive)
        (begin
          (format #t "could not load Disarchive~%")
          #f)
        (let ((log-port (module-ref disarchive '%disarchive-log-port))
              (assemble (module-ref disarchive 'disarchive-assemble)))
          (let ((spec (any fetch-specification/one uris)))
            (if spec
                (parameterize ((log-port (current-output-port))
                               (%verify-swh-certificate? verify-certificate?))
                  (false-if-exception*
                   (assemble spec file #:resolver resolve)))
                (begin
                  (format #t "could not find its Disarchive specification~%")
                  #f)))))))
|
2021-03-19 23:03:25 -04:00
|
|
|
|
|
2021-09-22 06:27:41 -04:00
|
|
|
|
(define (internet-archive-uri uri)
  "Return a 'web.archive.org' URI pointing to an Internet Archive backup of
URI, or #f if the scheme of URI is neither 'http' nor 'https'."
  (if (memq (uri-scheme uri) '(http https))
      ;; Note: the date in the URL can be anything and web.archive.org
      ;; automatically redirects to the closest date.
      (let ((timestamp (date->string (time-utc->date (current-time time-utc))
                                     "~Y~m~d~H~M~S")))
        (build-uri 'https
                   #:host "web.archive.org"
                   #:path (string-append "/web/" timestamp "/"
                                         (uri->string uri))))
      #f))
|
|
|
|
|
|
2016-05-14 11:37:47 -04:00
|
|
|
|
(define* (url-fetch url file
                    #:key
                    (timeout 10) (verify-certificate? #t)
                    (mirrors '()) (content-addressed-mirrors '())
                    (disarchive-mirrors '())
                    (hashes '())
                    print-build-trace?)
  "Fetch FILE from URL; URL may be either a single string, or a list of
strings denoting alternate URLs for FILE.  Return #f on failure, and FILE
on success.

When MIRRORS is defined, it must be an alist of mirrors; it is used to resolve
'mirror://' URIs.

HASHES must be a list of algorithm/hash pairs, where each algorithm is a
symbol such as 'sha256 and each hash is a bytevector.
CONTENT-ADDRESSED-MIRRORS must be a list of procedures that, given a file
name, a hash algorithm, and a hash, return a URL where the specified data can
be retrieved or #f; mirrors that return #f are skipped.

DISARCHIVE-MIRRORS must be a list whose elements are either strings, to which
the hash algorithm name, a slash, and the base16-encoded hash are appended, or
procedures that, given a hash algorithm and a hash, return a URL.  They are
used as a last resort, once every other URI has failed.

TIMEOUT is passed to the HTTP, FTP, and Disarchive fetching procedures.  When
PRINT-BUILD-TRACE? is true, HTTP progress is reported with
'progress-reporter/trace' rather than 'progress-reporter/file'; it is also
passed to 'ftp-fetch'.

When VERIFY-CERTIFICATE? is true, validate HTTPS server certificates;
otherwise simply ignore them.

Each download method (upstream, content-addressed-mirrors, internet-archive,
disarchive) is used only if 'download-method-enabled?' returns true for it."
  ;; List of upstream URIs, with 'mirror://' URIs expanded.
  (define uri
    (append-map (cut maybe-expand-mirrors <> mirrors)
                (match url
                  ((_ ...) (map string->uri url))
                  (_       (list (string->uri url))))))

  ;; Download URI to FILE.  Return a true value on success and #f on failure;
  ;; exceptions are printed and turned into #f.
  (define (fetch uri file)
    (format #t "~%Starting download of ~a~%From ~a...~%"
            file (uri->string uri))
    (case (uri-scheme uri)
      ((http https)
       (false-if-exception*
        (let-values (((port size)
                      (http-fetch uri
                                  #:verify-certificate? verify-certificate?
                                  #:timeout timeout)))
          (call-with-output-file file
            (lambda (output)
              (dump-port* port output
                          #:buffer-size %http-receive-buffer-size
                          #:reporter (if print-build-trace?
                                         (progress-reporter/trace
                                          file (uri->string uri) size)
                                         (progress-reporter/file
                                          (uri-abbreviation uri) size)))
              (newline)))
          (close-port port)
          file)))
      ((ftp)
       (false-if-exception* (ftp-fetch uri file
                                       #:timeout timeout
                                       #:print-build-trace?
                                       print-build-trace?)))
      (else
       (format #t "skipping URI with unsupported scheme: ~s~%"
               uri)
       #f)))

  ;; URIs obtained by applying each content-addressed mirror to each hash.
  (define content-addressed-uris
    (append-map (lambda (make-url)
                  (filter-map (match-lambda
                                ((hash-algo . hash)
                                 (let ((file (strip-store-file-name file)))
                                   ;; MAKE-URL may return #f, in which case
                                   ;; 'filter-map' must drop the entry;
                                   ;; calling 'string->uri' on #f would throw.
                                   (and=> (make-url file hash-algo hash)
                                          string->uri))))
                              hashes))
                content-addressed-mirrors))

  ;; URIs of the Disarchive specifications, one per mirror and per hash.
  (define disarchive-uris
    (append-map (lambda (mirror)
                  (let ((make-url (match mirror
                                    ((? string?)
                                     (lambda (hash-algo hash)
                                       (string-append
                                        mirror
                                        (symbol->string hash-algo) "/"
                                        (bytevector->base16-string hash))))
                                    ((? procedure?)
                                     mirror))))
                    (map (match-lambda
                           ((hash-algo . hash)
                            (string->uri (make-url hash-algo hash))))
                         hashes)))
                disarchive-mirrors))

  ;; URIs to try, in order: upstream, content-addressed mirrors, then the
  ;; Internet Archive copy of the first upstream URI.
  (define initial-uris
    (append (if (download-method-enabled? 'upstream)
                uri
                '())
            (if (download-method-enabled? 'content-addressed-mirrors)
                content-addressed-uris
                '())
            (if (download-method-enabled? 'internet-archive)
                (match uri
                  ((first . _)
                   (or (and=> (internet-archive-uri first) list)
                       '()))
                  (() '()))
                '())))

  ;; Make this unbuffered so 'progress-reporter/file' works as expected.  'line
  ;; means '\n', not '\r', so it's not appropriate here.
  (setvbuf (current-output-port) 'none)

  (setvbuf (current-error-port) 'line)

  (let try ((uri initial-uris))
    (match uri
      ((uri tail ...)
       (or (fetch uri file)
           (try tail)))
      (()
       ;; If we are looking for a software archive, one last thing we
       ;; can try is to use Disarchive to assemble it.
       (or (and (download-method-enabled? 'disarchive)
                (disarchive-fetch/any disarchive-uris file
                                      #:verify-certificate? verify-certificate?
                                      #:timeout timeout))
           (begin
             (format (current-error-port) "failed to download ~s from ~s~%"
                     file url)
             ;; Remove FILE in case we made an incomplete download, for
             ;; example due to ENOSPC.
             (catch 'system-error
               (lambda ()
                 (delete-file file))
               (const #f))
             #f))))))
|
2012-11-12 17:10:26 -05:00
|
|
|
|
|
|
|
|
|
;;; download.scm ends here
|