123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483 |
- ;;; GNU Guix --- Functional package management for GNU
- ;;; Copyright © 2015, 2018, 2020 Ludovic Courtès <ludo@gnu.org>
- ;;;
- ;;; This file is part of GNU Guix.
- ;;;
- ;;; GNU Guix is free software; you can redistribute it and/or modify it
- ;;; under the terms of the GNU General Public License as published by
- ;;; the Free Software Foundation; either version 3 of the License, or (at
- ;;; your option) any later version.
- ;;;
- ;;; GNU Guix is distributed in the hope that it will be useful, but
- ;;; WITHOUT ANY WARRANTY; without even the implied warranty of
- ;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- ;;; GNU General Public License for more details.
- ;;;
- ;;; You should have received a copy of the GNU General Public License
- ;;; along with GNU Guix. If not, see <http://www.gnu.org/licenses/>.
- (define-module (guix build gremlin)
- #:use-module (guix elf)
- #:use-module ((guix build utils) #:select (store-file-name?))
- #:use-module (ice-9 match)
- #:use-module (srfi srfi-1)
- #:use-module (srfi srfi-9)
- #:use-module (srfi srfi-26)
- #:use-module (srfi srfi-34)
- #:use-module (srfi srfi-35)
- #:use-module (system foreign)
- #:use-module (rnrs bytevectors)
- #:use-module (rnrs io ports)
- #:export (elf-error?
- elf-error-elf
- invalid-segment-size?
- invalid-segment-size-segment
- elf-dynamic-info
- elf-dynamic-info?
- elf-dynamic-info-soname
- elf-dynamic-info-needed
- elf-dynamic-info-rpath
- elf-dynamic-info-runpath
- expand-origin
- file-dynamic-info
- file-runpath
- file-needed
- file-needed/recursive
- missing-runpath-error?
- missing-runpath-error-file
- runpath-too-long-error?
- runpath-too-long-error-file
- set-file-runpath
- validate-needed-in-runpath
- strip-runpath))
- ;;; Commentary:
- ;;;
- ;;; A gremlin is sort-of like an elf, you know, and this module provides tools
- ;;; to deal with dynamic-link information from ELF files.
- ;;;
- ;;; Code:
- (define-condition-type &elf-error &error
- elf-error?
- (elf elf-error-elf))
- (define-condition-type &invalid-segment-size &elf-error
- invalid-segment-size?
- (segment invalid-segment-size-segment))
- (define (dynamic-link-segment elf)
- "Return the 'PT_DYNAMIC' segment of ELF--i.e., the segment that contains
- dynamic linking information."
- (let ((size (bytevector-length (elf-bytes elf))))
- (find (lambda (segment)
- (unless (<= (+ (elf-segment-offset segment)
- (elf-segment-filesz segment))
- size)
- ;; This happens on separate debug output files created by
- ;; 'strip --only-keep-debug' (Binutils 2.25.)
- (raise (condition (&invalid-segment-size
- (elf elf)
- (segment segment)))))
- (= (elf-segment-type segment) PT_DYNAMIC))
- (elf-segments elf))))
- (define (word-reader size byte-order)
- "Return a procedure to read a word of SIZE bytes according to BYTE-ORDER."
- (case size
- ((8)
- (lambda (bv index)
- (bytevector-u64-ref bv index byte-order)))
- ((4)
- (lambda (bv index)
- (bytevector-u32-ref bv index byte-order)))))
- ;; Dynamic entry:
- ;;
- ;; typedef struct
- ;; {
- ;; Elf64_Sxword d_tag; /* Dynamic entry type */
- ;; union
- ;; {
- ;; Elf64_Xword d_val; /* Integer value */
- ;; Elf64_Addr d_ptr; /* Address value */
- ;; } d_un;
- ;; } Elf64_Dyn;
- (define-record-type <dynamic-entry>
- (dynamic-entry type value offset)
- dynamic-entry?
- (type dynamic-entry-type) ;DT_*
- (value dynamic-entry-value) ;string | number | ...
- (offset dynamic-entry-offset)) ;integer
- (define (raw-dynamic-entries elf segment)
- "Return as a list of <dynamic-entry> for the dynamic entries found in
- SEGMENT, the 'PT_DYNAMIC' segment of ELF."
- (define start
- (elf-segment-offset segment))
- (define bytes
- (elf-bytes elf))
- (define word-size
- (elf-word-size elf))
- (define byte-order
- (elf-byte-order elf))
- (define read-word
- (word-reader word-size byte-order))
- (let loop ((offset 0)
- (result '()))
- (if (>= offset (elf-segment-memsz segment))
- (reverse result)
- (let ((type (read-word bytes (+ start offset)))
- (value (read-word bytes (+ start offset word-size))))
- (if (= type DT_NULL) ;finished?
- (reverse result)
- (loop (+ offset (* 2 word-size))
- (cons (dynamic-entry type value
- (+ start offset word-size))
- result)))))))
- (define (vma->offset elf vma)
- "Convert VMA, a virtual memory address, to an offset within ELF.
- Do that by looking at the loadable program segment (PT_LOAD) of ELF that
- contains VMA and by taking into account that segment's virtual address and
- offset."
- ;; See 'offset_from_vma' in Binutils.
- (define loads
- (filter (lambda (segment)
- (= (elf-segment-type segment) PT_LOAD))
- (elf-segments elf)))
- (let ((load (find (lambda (segment)
- (let ((vaddr (elf-segment-vaddr segment)))
- (and (>= vma vaddr)
- (< vma (+ (elf-segment-memsz segment)
- vaddr)))))
- loads)))
- (+ (- vma (elf-segment-vaddr load))
- (elf-segment-offset load))))
- (define (dynamic-entries elf segment)
- "Return all the dynamic entries found in SEGMENT, the 'PT_DYNAMIC' segment
- of ELF, as a list of <dynamic-entry>. The value of each entry may be a string
- or an integer depending on the entry type (for instance, the value of
- DT_NEEDED entries is a string.) Likewise the offset is the offset within the
- string table if the type is a string."
- (define entries
- (raw-dynamic-entries elf segment))
- (define string-table-offset
- (any (lambda (entry)
- (and (= (dynamic-entry-type entry) DT_STRTAB)
- (dynamic-entry-value entry)))
- entries))
- (define (interpret-dynamic-entry entry)
- (let ((type (dynamic-entry-type entry))
- (value (dynamic-entry-value entry)))
- (cond ((memv type (list DT_NEEDED DT_SONAME DT_RPATH DT_RUNPATH))
- (if string-table-offset
- (let* ((offset (vma->offset elf (+ string-table-offset value)))
- (value (pointer->string
- (bytevector->pointer (elf-bytes elf) offset))))
- (dynamic-entry type value offset))
- (dynamic-entry type value (dynamic-entry-offset entry))))
- (else
- (dynamic-entry type value (dynamic-entry-offset entry))))))
- (map interpret-dynamic-entry entries))
- ;;;
- ;;; High-level interface.
- ;;;
- (define-record-type <elf-dynamic-info>
- (%elf-dynamic-info soname needed rpath runpath)
- elf-dynamic-info?
- (soname elf-dynamic-info-soname)
- (needed elf-dynamic-info-needed)
- (rpath elf-dynamic-info-rpath)
- (runpath elf-dynamic-info-runpath))
- (define search-path->list
- (let ((not-colon (char-set-complement (char-set #\:))))
- (lambda (str)
- "Split STR on ':' characters."
- (string-tokenize str not-colon))))
- (define (elf-dynamic-info elf)
- "Return dynamic-link information for ELF as an <elf-dynamic-info> object, or
- #f if ELF lacks dynamic-link information."
- (define (matching-entry type)
- (lambda (entry)
- (= type (dynamic-entry-type entry))))
- (match (dynamic-link-segment elf)
- (#f #f)
- ((? elf-segment? dynamic)
- (let ((entries (dynamic-entries elf dynamic)))
- (%elf-dynamic-info (and=> (find (matching-entry DT_SONAME)
- entries)
- dynamic-entry-value)
- (filter-map (lambda (entry)
- (and (= (dynamic-entry-type entry)
- DT_NEEDED)
- (dynamic-entry-value entry)))
- entries)
- (or (and=> (find (matching-entry DT_RPATH)
- entries)
- (compose search-path->list
- dynamic-entry-value))
- '())
- (or (and=> (find (matching-entry DT_RUNPATH)
- entries)
- (compose search-path->list
- dynamic-entry-value))
- '()))))))
- (define (file-dynamic-info file)
- "Return the <elf-dynamic-info> record of FILE, or #f if FILE lacks dynamic
- info."
- (call-with-input-file file
- (lambda (port)
- (elf-dynamic-info (parse-elf (get-bytevector-all port))))))
- (define (file-runpath file)
- "Return the DT_RUNPATH dynamic entry of FILE as a list of strings, or #f if
- FILE lacks dynamic info."
- (and=> (file-dynamic-info file) elf-dynamic-info-runpath))
- (define (file-needed file)
- "Return the list of DT_NEEDED dynamic entries of FILE, or #f if FILE lacks
- dynamic info."
- (and=> (file-dynamic-info file) elf-dynamic-info-needed))
- (define (file-needed/recursive file)
- "Return two values: the list of absolute .so file names FILE depends on,
- recursively, and the list of .so file names that could not be found. File
- names are resolved by searching the RUNPATH of the file that NEEDs them.
- This is similar to the info returned by the 'ldd' command."
- (let loop ((files (list file))
- (result '())
- (not-found '()))
- (match files
- (()
- (values (reverse result)
- (reverse (delete-duplicates not-found))))
- ((file . rest)
- (match (file-dynamic-info file)
- (#f
- (loop rest result not-found))
- (info
- (let ((runpath (elf-dynamic-info-runpath info))
- (needed (elf-dynamic-info-needed info)))
- (if (and runpath needed)
- (let* ((runpath (map (cute expand-origin <> (dirname file))
- runpath))
- (resolved (map (cut search-path runpath <>)
- needed))
- (failed (filter-map (lambda (needed resolved)
- (and (not resolved)
- (not (libc-library? needed))
- needed))
- needed resolved))
- (needed (remove (lambda (value)
- (or (not value)
- ;; XXX: quadratic
- (member value result)))
- resolved)))
- (loop (append rest needed)
- (append needed result)
- (append failed not-found)))
- (loop rest result not-found)))))))))
- (define %libc-libraries
- ;; List of libraries as of glibc 2.21 (there are more but those are
- ;; typically mean to be LD_PRELOADed and thus do not appear as NEEDED.)
- '("libanl.so"
- "libcrypt.so"
- "libc.so"
- "libdl.so"
- "libm.so"
- "libnsl.so" ;NEEDED by nscd
- "libpthread.so"
- "libresolv.so"
- "librt.so"
- "libutil.so"))
- (define (libc-library? lib)
- "Return #t if LIB is one of the libraries shipped with the GNU C Library."
- (find (lambda (libc-lib)
- (string-prefix? libc-lib lib))
- %libc-libraries))
- (define (expand-variable str variable value)
- "Replace occurrences of '$VARIABLE' or '${VARIABLE}' in STR with VALUE."
- (define variables
- (list (string-append "$" variable)
- (string-append "${" variable "}")))
- (let loop ((thing variables)
- (str str))
- (match thing
- (()
- str)
- ((head tail ...)
- (let ((index (string-contains str head))
- (len (string-length head)))
- (loop (if index variables tail)
- (if index
- (string-replace str value
- index (+ index len))
- str)))))))
- (define (expand-origin str directory)
- "Replace occurrences of '$ORIGIN' in STR with DIRECTORY."
- (expand-variable str "ORIGIN" directory))
- (define* (validate-needed-in-runpath file
- #:key (always-found? libc-library?))
- "Return #t if all the libraries listed as FILE's 'DT_NEEDED' entries are
- present in its RUNPATH, or if FILE lacks dynamic-link information. Return #f
- otherwise. Libraries whose name matches ALWAYS-FOUND? are considered to be
- always available."
- (guard (c ((invalid-segment-size? c)
- (let ((segment (invalid-segment-size-segment c)))
- (format (current-error-port)
- "~a: error: offset + size of segment ~a (type ~a) \
- exceeds total size~%"
- file
- (elf-segment-index segment)
- (elf-segment-type segment))
- #f)))
- (let* ((elf (call-with-input-file file
- (compose parse-elf get-bytevector-all)))
- (expand (cute expand-origin <> (dirname file)))
- (dyninfo (elf-dynamic-info elf)))
- (when dyninfo
- ;; XXX: In theory we should also expand $PLATFORM and $LIB, but these
- ;; appear to be really unused.
- (let* ((expanded (map expand (elf-dynamic-info-runpath dyninfo)))
- (runpath (filter store-file-name? expanded))
- (bogus (remove store-file-name? expanded))
- (needed (remove always-found?
- (elf-dynamic-info-needed dyninfo)))
- (not-found (remove (cut search-path runpath <>)
- needed)))
- (unless (null? bogus)
- (format (current-error-port)
- "~a: warning: RUNPATH contains bogus entries: ~s~%"
- file bogus))
- (for-each (lambda (lib)
- (format (current-error-port)
- "~a: error: depends on '~a', which cannot \
- be found in RUNPATH ~s~%"
- file lib runpath))
- not-found)
- ;; (when (null? not-found)
- ;; (format (current-error-port) "~a is OK~%" file))
- (null? not-found))))))
- (define (strip-runpath file)
- "Remove from the DT_RUNPATH of FILE any entries that are not necessary
- according to DT_NEEDED."
- (define (minimal-runpath needed runpath)
- (filter (lambda (directory)
- (and (string-prefix? "/" directory)
- (any (lambda (lib)
- (file-exists? (string-append directory "/" lib)))
- needed)))
- runpath))
- (define port
- (open-file file "r+b"))
- (catch #t
- (lambda ()
- (let* ((elf (parse-elf (get-bytevector-all port)))
- (entries (dynamic-entries elf (dynamic-link-segment elf)))
- (needed (filter-map (lambda (entry)
- (and (= (dynamic-entry-type entry)
- DT_NEEDED)
- (dynamic-entry-value entry)))
- entries))
- (runpath (find (lambda (entry)
- (= DT_RUNPATH (dynamic-entry-type entry)))
- entries))
- (old (search-path->list
- (dynamic-entry-value runpath)))
- (new (minimal-runpath needed old)))
- (unless (equal? old new)
- (format (current-error-port)
- "~a: stripping RUNPATH to ~s (removed ~s)~%"
- file new
- (lset-difference string=? old new))
- (seek port (dynamic-entry-offset runpath) SEEK_SET)
- (put-bytevector port (string->utf8 (string-join new ":")))
- (put-u8 port 0))
- (close-port port)
- new))
- (lambda (key . args)
- (false-if-exception (close-port port))
- (apply throw key args))))
- (define-condition-type &missing-runpath-error &elf-error
- missing-runpath-error?
- (file missing-runpath-error-file))
- (define-condition-type &runpath-too-long-error &elf-error
- runpath-too-long-error?
- (file runpath-too-long-error-file))
- (define (set-file-runpath file path)
- "Set the value of the DT_RUNPATH dynamic entry of FILE, which must name an
- ELF file, to PATH, a list of strings. Raise a &missing-runpath-error or
- &runpath-too-long-error when appropriate."
- (define (call-with-input+output-file file proc)
- (let ((port (open-file file "r+b")))
- (guard (c (#t (close-port port) (raise c)))
- (proc port)
- (close-port port))))
- (call-with-input+output-file file
- (lambda (port)
- (let* ((elf (parse-elf (get-bytevector-all port)))
- (entries (dynamic-entries elf (dynamic-link-segment elf)))
- (runpath (find (lambda (entry)
- (= DT_RUNPATH (dynamic-entry-type entry)))
- entries))
- (path (string->utf8 (string-join path ":"))))
- (unless runpath
- (raise (condition (&missing-runpath-error (elf elf)
- (file file)))))
- ;; There might be padding left beyond RUNPATH in the string table, but
- ;; we don't know, so assume there's no padding.
- (unless (<= (bytevector-length path)
- (bytevector-length
- (string->utf8 (dynamic-entry-value runpath))))
- (raise (condition (&runpath-too-long-error (elf #f #;elf)
- (file file)))))
- (seek port (dynamic-entry-offset runpath) SEEK_SET)
- (put-bytevector port path)
- (put-u8 port 0)))))
- ;;; Local Variables:
- ;;; eval: (put 'call-with-input+output-file 'scheme-indent-function 1)
- ;;; End:
|