daemon: Delegate deduplication to 'guix substitute'.

This removes the main source of latency between subsequent downloads.

* nix/libstore/build.cc (SubstitutionGoal::tryToRun): Add a
"deduplicate" key to ENV.
(SubstitutionGoal::finished): Remove call to 'optimisePath'.
* guix/scripts/substitute.scm (process-substitution)[destination-in-store?]
[dump-file/deduplicate*]: New variables.
Pass #:dump-file to 'restore-file'.
* guix/scripts/substitute.scm (guix-substitute)[deduplicate?]: New
variable.
Pass #:deduplicate? to 'process-substitution'.
* guix/serialization.scm (dump-file): Export and augment 'dump-file'.
This commit is contained in:
Ludovic Courtès 2020-12-14 17:59:32 +01:00
parent 3c799ccb98
commit c7c7f068c1
No known key found for this signature in database
GPG key ID: 090B11993D9AEBB5
3 changed files with 40 additions and 12 deletions

View file

@ -28,7 +28,8 @@ (define-module (guix scripts substitute)
#:use-module (guix records) #:use-module (guix records)
#:use-module (guix diagnostics) #:use-module (guix diagnostics)
#:use-module (guix i18n) #:use-module (guix i18n)
#:use-module ((guix serialization) #:select (restore-file)) #:use-module ((guix serialization) #:select (restore-file dump-file))
#:autoload (guix store deduplication) (dump-file/deduplicate)
#:autoload (guix scripts discover) (read-substitute-urls) #:autoload (guix scripts discover) (read-substitute-urls)
#:use-module (gcrypt hash) #:use-module (gcrypt hash)
#:use-module (guix base32) #:use-module (guix base32)
@ -1045,15 +1046,27 @@ (define-syntax-rule (with-cached-connection uri port exp ...)
(call-with-cached-connection uri (lambda (port) exp ...))) (call-with-cached-connection uri (lambda (port) exp ...)))
(define* (process-substitution store-item destination (define* (process-substitution store-item destination
#:key cache-urls acl print-build-trace?) #:key cache-urls acl
deduplicate? print-build-trace?)
"Substitute STORE-ITEM (a store file name) from CACHE-URLS, and write it to "Substitute STORE-ITEM (a store file name) from CACHE-URLS, and write it to
DESTINATION as a nar file. Verify the substitute against ACL, and verify its DESTINATION as a nar file. Verify the substitute against ACL, and verify its
hash against what appears in the narinfo. Print a status line on the current hash against what appears in the narinfo. When DEDUPLICATE? is true, and if
output port." DESTINATION is in the store, deduplicate its files. Print a status line on
the current output port."
(define narinfo (define narinfo
(lookup-narinfo cache-urls store-item (lookup-narinfo cache-urls store-item
(cut valid-narinfo? <> acl))) (cut valid-narinfo? <> acl)))
(define destination-in-store?
(string-prefix? (string-append (%store-prefix) "/")
destination))
(define (dump-file/deduplicate* . args)
;; Make sure deduplication looks at the right store (necessary in test
;; environments).
(apply dump-file/deduplicate
(append args (list #:store (%store-prefix)))))
(unless narinfo (unless narinfo
(leave (G_ "no valid substitute for '~a'~%") (leave (G_ "no valid substitute for '~a'~%")
store-item)) store-item))
@ -1100,7 +1113,11 @@ (define narinfo
((hashed get-hash) ((hashed get-hash)
(open-hash-input-port algorithm input))) (open-hash-input-port algorithm input)))
;; Unpack the Nar at INPUT into DESTINATION. ;; Unpack the Nar at INPUT into DESTINATION.
(restore-file hashed destination) (restore-file hashed destination
#:dump-file (if (and destination-in-store?
deduplicate?)
dump-file/deduplicate*
dump-file))
(close-port hashed) (close-port hashed)
(close-port input) (close-port input)
@ -1248,6 +1265,9 @@ (define print-build-trace?
((= string->number number) (> number 0)) ((= string->number number) (> number 0))
(_ #f))) (_ #f)))
(define deduplicate?
(find-daemon-option "deduplicate"))
;; The daemon's agent code opens file descriptor 4 for us and this is where ;; The daemon's agent code opens file descriptor 4 for us and this is where
;; stderr should go. ;; stderr should go.
(parameterize ((current-error-port (if (%error-to-file-descriptor-4?) (parameterize ((current-error-port (if (%error-to-file-descriptor-4?)
@ -1307,6 +1327,7 @@ (define print-build-trace?
(process-substitution store-path destination (process-substitution store-path destination
#:cache-urls (substitute-urls) #:cache-urls (substitute-urls)
#:acl (current-acl) #:acl (current-acl)
#:deduplicate? deduplicate?
#:print-build-trace? #:print-build-trace?
print-build-trace?) print-build-trace?)
(loop)))))) (loop))))))

View file

@ -51,7 +51,8 @@ (define-module (guix serialization)
write-file write-file
write-file-tree write-file-tree
fold-archive fold-archive
restore-file)) restore-file
dump-file))
;;; Comment: ;;; Comment:
;;; ;;;
@ -458,7 +459,10 @@ (define (read-eof-marker)
(&nar-read-error (port port) (file file) (token x))))))))) (&nar-read-error (port port) (file file) (token x)))))))))
(define (dump-file file input size type) (define (dump-file file input size type)
"Dump SIZE bytes from INPUT to FILE." "Dump SIZE bytes from INPUT to FILE.
This procedure is suitable for use as the #:dump-file argument to
'restore-file'."
(call-with-output-file file (call-with-output-file file
(lambda (output) (lambda (output)
(dump input output size)))) (dump input output size))))

View file

@ -2984,7 +2984,12 @@ void SubstitutionGoal::tryToRun()
if (!worker.substituter) { if (!worker.substituter) {
const Strings args = { "substitute", "--substitute" }; const Strings args = { "substitute", "--substitute" };
const std::map<string, string> env = { { "_NIX_OPTIONS", settings.pack() } }; const std::map<string, string> env = {
{ "_NIX_OPTIONS",
settings.pack() + "deduplicate="
+ (settings.autoOptimiseStore ? "yes" : "no")
}
};
worker.substituter = std::make_shared<Agent>(settings.guixProgram, args, env); worker.substituter = std::make_shared<Agent>(settings.guixProgram, args, env);
} }
@ -3085,10 +3090,8 @@ void SubstitutionGoal::finished()
if (repair) replaceValidPath(storePath, destPath); if (repair) replaceValidPath(storePath, destPath);
/* Note: 'guix substitute' takes care of resetting timestamps and /* Note: 'guix substitute' takes care of resetting timestamps and of
permissions on 'destPath', so no need to do it here. */ deduplicating 'destPath', so no need to do it here. */
worker.store.optimisePath(storePath); // FIXME: combine with hashPath()
ValidPathInfo info2; ValidPathInfo info2;
info2.path = storePath; info2.path = storePath;