mirror of
https://git.in.rschanz.org/ryan77627/guix.git
synced 2025-01-08 20:30:05 -05:00
1010171280
* guix/build/gremlin.scm (elf-dynamic-info): Return the dynamic entry value, not the dynamic entry. * tests/gremlin.scm ("elf-dynamic-info-soname"): New test. Signed-off-by: Ludovic Courtès <ludo@gnu.org>
482 lines
18 KiB
Scheme
482 lines
18 KiB
Scheme
;;; GNU Guix --- Functional package management for GNU
|
||
;;; Copyright © 2015, 2018, 2020 Ludovic Courtès <ludo@gnu.org>
|
||
;;;
|
||
;;; This file is part of GNU Guix.
|
||
;;;
|
||
;;; GNU Guix is free software; you can redistribute it and/or modify it
|
||
;;; under the terms of the GNU General Public License as published by
|
||
;;; the Free Software Foundation; either version 3 of the License, or (at
|
||
;;; your option) any later version.
|
||
;;;
|
||
;;; GNU Guix is distributed in the hope that it will be useful, but
|
||
;;; WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
;;; GNU General Public License for more details.
|
||
;;;
|
||
;;; You should have received a copy of the GNU General Public License
|
||
;;; along with GNU Guix. If not, see <http://www.gnu.org/licenses/>.
|
||
|
||
(define-module (guix build gremlin)
|
||
#:use-module (guix elf)
|
||
#:use-module ((guix build utils) #:select (store-file-name?))
|
||
#:use-module (ice-9 match)
|
||
#:use-module (srfi srfi-1)
|
||
#:use-module (srfi srfi-9)
|
||
#:use-module (srfi srfi-26)
|
||
#:use-module (srfi srfi-34)
|
||
#:use-module (srfi srfi-35)
|
||
#:use-module (system foreign)
|
||
#:use-module (rnrs bytevectors)
|
||
#:use-module (rnrs io ports)
|
||
#:export (elf-error?
|
||
elf-error-elf
|
||
invalid-segment-size?
|
||
invalid-segment-size-segment
|
||
|
||
elf-dynamic-info
|
||
elf-dynamic-info?
|
||
elf-dynamic-info-soname
|
||
elf-dynamic-info-needed
|
||
elf-dynamic-info-rpath
|
||
elf-dynamic-info-runpath
|
||
expand-origin
|
||
|
||
file-dynamic-info
|
||
file-runpath
|
||
file-needed
|
||
file-needed/recursive
|
||
|
||
missing-runpath-error?
|
||
missing-runpath-error-file
|
||
runpath-too-long-error?
|
||
runpath-too-long-error-file
|
||
set-file-runpath
|
||
|
||
validate-needed-in-runpath
|
||
strip-runpath))
|
||
|
||
;;; Commentary:
|
||
;;;
|
||
;;; A gremlin is sort-of like an elf, you know, and this module provides tools
|
||
;;; to deal with dynamic-link information from ELF files.
|
||
;;;
|
||
;;; Code:
|
||
|
||
(define-condition-type &elf-error &error
|
||
elf-error?
|
||
(elf elf-error-elf))
|
||
|
||
(define-condition-type &invalid-segment-size &elf-error
|
||
invalid-segment-size?
|
||
(segment invalid-segment-size-segment))
|
||
|
||
|
||
(define (dynamic-link-segment elf)
|
||
"Return the 'PT_DYNAMIC' segment of ELF--i.e., the segment that contains
|
||
dynamic linking information."
|
||
(let ((size (bytevector-length (elf-bytes elf))))
|
||
(find (lambda (segment)
|
||
(unless (<= (+ (elf-segment-offset segment)
|
||
(elf-segment-filesz segment))
|
||
size)
|
||
;; This happens on separate debug output files created by
|
||
;; 'strip --only-keep-debug' (Binutils 2.25.)
|
||
(raise (condition (&invalid-segment-size
|
||
(elf elf)
|
||
(segment segment)))))
|
||
|
||
(= (elf-segment-type segment) PT_DYNAMIC))
|
||
(elf-segments elf))))
|
||
|
||
(define (word-reader size byte-order)
|
||
"Return a procedure to read a word of SIZE bytes according to BYTE-ORDER."
|
||
(case size
|
||
((8)
|
||
(lambda (bv index)
|
||
(bytevector-u64-ref bv index byte-order)))
|
||
((4)
|
||
(lambda (bv index)
|
||
(bytevector-u32-ref bv index byte-order)))))
|
||
|
||
|
||
;; Dynamic entry:
|
||
;;
|
||
;; typedef struct
|
||
;; {
|
||
;; Elf64_Sxword d_tag; /* Dynamic entry type */
|
||
;; union
|
||
;; {
|
||
;; Elf64_Xword d_val; /* Integer value */
|
||
;; Elf64_Addr d_ptr; /* Address value */
|
||
;; } d_un;
|
||
;; } Elf64_Dyn;
|
||
|
||
(define-record-type <dynamic-entry>
|
||
(dynamic-entry type value offset)
|
||
dynamic-entry?
|
||
(type dynamic-entry-type) ;DT_*
|
||
(value dynamic-entry-value) ;string | number | ...
|
||
(offset dynamic-entry-offset)) ;integer
|
||
|
||
(define (raw-dynamic-entries elf segment)
|
||
"Return as a list of <dynamic-entry> for the dynamic entries found in
|
||
SEGMENT, the 'PT_DYNAMIC' segment of ELF."
|
||
(define start
|
||
(elf-segment-offset segment))
|
||
(define bytes
|
||
(elf-bytes elf))
|
||
(define word-size
|
||
(elf-word-size elf))
|
||
(define byte-order
|
||
(elf-byte-order elf))
|
||
(define read-word
|
||
(word-reader word-size byte-order))
|
||
|
||
(let loop ((offset 0)
|
||
(result '()))
|
||
(if (>= offset (elf-segment-memsz segment))
|
||
(reverse result)
|
||
(let ((type (read-word bytes (+ start offset)))
|
||
(value (read-word bytes (+ start offset word-size))))
|
||
(if (= type DT_NULL) ;finished?
|
||
(reverse result)
|
||
(loop (+ offset (* 2 word-size))
|
||
(cons (dynamic-entry type value
|
||
(+ start offset word-size))
|
||
result)))))))
|
||
|
||
(define (vma->offset elf vma)
|
||
"Convert VMA, a virtual memory address, to an offset within ELF.
|
||
|
||
Do that by looking at the loadable program segment (PT_LOAD) of ELF that
|
||
contains VMA and by taking into account that segment's virtual address and
|
||
offset."
|
||
;; See 'offset_from_vma' in Binutils.
|
||
(define loads
|
||
(filter (lambda (segment)
|
||
(= (elf-segment-type segment) PT_LOAD))
|
||
(elf-segments elf)))
|
||
|
||
(let ((load (find (lambda (segment)
|
||
(let ((vaddr (elf-segment-vaddr segment)))
|
||
(and (>= vma vaddr)
|
||
(< vma (+ (elf-segment-memsz segment)
|
||
vaddr)))))
|
||
loads)))
|
||
(+ (- vma (elf-segment-vaddr load))
|
||
(elf-segment-offset load))))
|
||
|
||
(define (dynamic-entries elf segment)
|
||
"Return all the dynamic entries found in SEGMENT, the 'PT_DYNAMIC' segment
|
||
of ELF, as a list of <dynamic-entry>. The value of each entry may be a string
|
||
or an integer depending on the entry type (for instance, the value of
|
||
DT_NEEDED entries is a string.) Likewise the offset is the offset within the
|
||
string table if the type is a string."
|
||
(define entries
|
||
(raw-dynamic-entries elf segment))
|
||
|
||
(define string-table-offset
|
||
(any (lambda (entry)
|
||
(and (= (dynamic-entry-type entry) DT_STRTAB)
|
||
(dynamic-entry-value entry)))
|
||
entries))
|
||
|
||
(define (interpret-dynamic-entry entry)
|
||
(let ((type (dynamic-entry-type entry))
|
||
(value (dynamic-entry-value entry)))
|
||
(cond ((memv type (list DT_NEEDED DT_SONAME DT_RPATH DT_RUNPATH))
|
||
(if string-table-offset
|
||
(let* ((offset (vma->offset elf (+ string-table-offset value)))
|
||
(value (pointer->string
|
||
(bytevector->pointer (elf-bytes elf) offset))))
|
||
(dynamic-entry type value offset))
|
||
(dynamic-entry type value (dynamic-entry-offset entry))))
|
||
(else
|
||
(dynamic-entry type value (dynamic-entry-offset entry))))))
|
||
|
||
(map interpret-dynamic-entry entries))
|
||
|
||
|
||
;;;
|
||
;;; High-level interface.
|
||
;;;
|
||
|
||
(define-record-type <elf-dynamic-info>
|
||
(%elf-dynamic-info soname needed rpath runpath)
|
||
elf-dynamic-info?
|
||
(soname elf-dynamic-info-soname)
|
||
(needed elf-dynamic-info-needed)
|
||
(rpath elf-dynamic-info-rpath)
|
||
(runpath elf-dynamic-info-runpath))
|
||
|
||
(define search-path->list
|
||
(let ((not-colon (char-set-complement (char-set #\:))))
|
||
(lambda (str)
|
||
"Split STR on ':' characters."
|
||
(string-tokenize str not-colon))))
|
||
|
||
(define (elf-dynamic-info elf)
|
||
"Return dynamic-link information for ELF as an <elf-dynamic-info> object, or
|
||
#f if ELF lacks dynamic-link information."
|
||
(define (matching-entry type)
|
||
(lambda (entry)
|
||
(= type (dynamic-entry-type entry))))
|
||
|
||
(match (dynamic-link-segment elf)
|
||
(#f #f)
|
||
((? elf-segment? dynamic)
|
||
(let ((entries (dynamic-entries elf dynamic)))
|
||
(%elf-dynamic-info (and=> (find (matching-entry DT_SONAME)
|
||
entries)
|
||
dynamic-entry-value)
|
||
(filter-map (lambda (entry)
|
||
(and (= (dynamic-entry-type entry)
|
||
DT_NEEDED)
|
||
(dynamic-entry-value entry)))
|
||
entries)
|
||
(or (and=> (find (matching-entry DT_RPATH)
|
||
entries)
|
||
(compose search-path->list
|
||
dynamic-entry-value))
|
||
'())
|
||
(or (and=> (find (matching-entry DT_RUNPATH)
|
||
entries)
|
||
(compose search-path->list
|
||
dynamic-entry-value))
|
||
'()))))))
|
||
|
||
(define (file-dynamic-info file)
|
||
"Return the <elf-dynamic-info> record of FILE, or #f if FILE lacks dynamic
|
||
info."
|
||
(call-with-input-file file
|
||
(lambda (port)
|
||
(elf-dynamic-info (parse-elf (get-bytevector-all port))))))
|
||
|
||
(define (file-runpath file)
|
||
"Return the DT_RUNPATH dynamic entry of FILE as a list of strings, or #f if
|
||
FILE lacks dynamic info."
|
||
(and=> (file-dynamic-info file) elf-dynamic-info-runpath))
|
||
|
||
(define (file-needed file)
|
||
"Return the list of DT_NEEDED dynamic entries of FILE, or #f if FILE lacks
|
||
dynamic info."
|
||
(and=> (file-dynamic-info file) elf-dynamic-info-needed))
|
||
|
||
(define (file-needed/recursive file)
|
||
"Return two values: the list of absolute .so file names FILE depends on,
|
||
recursively, and the list of .so file names that could not be found. File
|
||
names are resolved by searching the RUNPATH of the file that NEEDs them.
|
||
|
||
This is similar to the info returned by the 'ldd' command."
|
||
(let loop ((files (list file))
|
||
(result '())
|
||
(not-found '()))
|
||
(match files
|
||
(()
|
||
(values (reverse result)
|
||
(reverse (delete-duplicates not-found))))
|
||
((file . rest)
|
||
(match (file-dynamic-info file)
|
||
(#f
|
||
(loop rest result not-found))
|
||
(info
|
||
(let ((runpath (elf-dynamic-info-runpath info))
|
||
(needed (elf-dynamic-info-needed info)))
|
||
(if (and runpath needed)
|
||
(let* ((runpath (map (cute expand-origin <> (dirname file))
|
||
runpath))
|
||
(resolved (map (cut search-path runpath <>)
|
||
needed))
|
||
(failed (filter-map (lambda (needed resolved)
|
||
(and (not resolved)
|
||
(not (libc-library? needed))
|
||
needed))
|
||
needed resolved))
|
||
(needed (remove (lambda (value)
|
||
(or (not value)
|
||
;; XXX: quadratic
|
||
(member value result)))
|
||
resolved)))
|
||
(loop (append rest needed)
|
||
(append needed result)
|
||
(append failed not-found)))
|
||
(loop rest result not-found)))))))))
|
||
|
||
(define %libc-libraries
|
||
;; List of libraries as of glibc 2.21 (there are more but those are
|
||
;; typically mean to be LD_PRELOADed and thus do not appear as NEEDED.)
|
||
'("libanl.so"
|
||
"libcrypt.so"
|
||
"libc.so"
|
||
"libdl.so"
|
||
"libm.so"
|
||
"libnsl.so" ;NEEDED by nscd
|
||
"libpthread.so"
|
||
"libresolv.so"
|
||
"librt.so"
|
||
"libutil.so"))
|
||
|
||
(define (libc-library? lib)
|
||
"Return #t if LIB is one of the libraries shipped with the GNU C Library."
|
||
(find (lambda (libc-lib)
|
||
(string-prefix? libc-lib lib))
|
||
%libc-libraries))
|
||
|
||
(define (expand-variable str variable value)
|
||
"Replace occurrences of '$VARIABLE' or '${VARIABLE}' in STR with VALUE."
|
||
(define variables
|
||
(list (string-append "$" variable)
|
||
(string-append "${" variable "}")))
|
||
|
||
(let loop ((thing variables)
|
||
(str str))
|
||
(match thing
|
||
(()
|
||
str)
|
||
((head tail ...)
|
||
(let ((index (string-contains str head))
|
||
(len (string-length head)))
|
||
(loop (if index variables tail)
|
||
(if index
|
||
(string-replace str value
|
||
index (+ index len))
|
||
str)))))))
|
||
|
||
(define (expand-origin str directory)
|
||
"Replace occurrences of '$ORIGIN' in STR with DIRECTORY."
|
||
(expand-variable str "ORIGIN" directory))
|
||
|
||
(define* (validate-needed-in-runpath file
|
||
#:key (always-found? libc-library?))
|
||
"Return #t if all the libraries listed as FILE's 'DT_NEEDED' entries are
|
||
present in its RUNPATH, or if FILE lacks dynamic-link information. Return #f
|
||
otherwise. Libraries whose name matches ALWAYS-FOUND? are considered to be
|
||
always available."
|
||
(guard (c ((invalid-segment-size? c)
|
||
(let ((segment (invalid-segment-size-segment c)))
|
||
(format (current-error-port)
|
||
"~a: error: offset + size of segment ~a (type ~a) \
|
||
exceeds total size~%"
|
||
file
|
||
(elf-segment-index segment)
|
||
(elf-segment-type segment))
|
||
#f)))
|
||
|
||
(let* ((elf (call-with-input-file file
|
||
(compose parse-elf get-bytevector-all)))
|
||
(expand (cute expand-origin <> (dirname file)))
|
||
(dyninfo (elf-dynamic-info elf)))
|
||
(when dyninfo
|
||
;; XXX: In theory we should also expand $PLATFORM and $LIB, but these
|
||
;; appear to be really unused.
|
||
(let* ((expanded (map expand (elf-dynamic-info-runpath dyninfo)))
|
||
(runpath (filter store-file-name? expanded))
|
||
(bogus (remove store-file-name? expanded))
|
||
(needed (remove always-found?
|
||
(elf-dynamic-info-needed dyninfo)))
|
||
(not-found (remove (cut search-path runpath <>)
|
||
needed)))
|
||
(unless (null? bogus)
|
||
(format (current-error-port)
|
||
"~a: warning: RUNPATH contains bogus entries: ~s~%"
|
||
file bogus))
|
||
|
||
(for-each (lambda (lib)
|
||
(format (current-error-port)
|
||
"~a: error: depends on '~a', which cannot \
|
||
be found in RUNPATH ~s~%"
|
||
file lib runpath))
|
||
not-found)
|
||
;; (when (null? not-found)
|
||
;; (format (current-error-port) "~a is OK~%" file))
|
||
(null? not-found))))))
|
||
|
||
(define (strip-runpath file)
|
||
"Remove from the DT_RUNPATH of FILE any entries that are not necessary
|
||
according to DT_NEEDED."
|
||
(define (minimal-runpath needed runpath)
|
||
(filter (lambda (directory)
|
||
(and (string-prefix? "/" directory)
|
||
(any (lambda (lib)
|
||
(file-exists? (string-append directory "/" lib)))
|
||
needed)))
|
||
runpath))
|
||
|
||
(define port
|
||
(open-file file "r+b"))
|
||
|
||
(catch #t
|
||
(lambda ()
|
||
(let* ((elf (parse-elf (get-bytevector-all port)))
|
||
(entries (dynamic-entries elf (dynamic-link-segment elf)))
|
||
(needed (filter-map (lambda (entry)
|
||
(and (= (dynamic-entry-type entry)
|
||
DT_NEEDED)
|
||
(dynamic-entry-value entry)))
|
||
entries))
|
||
(runpath (find (lambda (entry)
|
||
(= DT_RUNPATH (dynamic-entry-type entry)))
|
||
entries))
|
||
(old (search-path->list
|
||
(dynamic-entry-value runpath)))
|
||
(new (minimal-runpath needed old)))
|
||
(unless (equal? old new)
|
||
(format (current-error-port)
|
||
"~a: stripping RUNPATH to ~s (removed ~s)~%"
|
||
file new
|
||
(lset-difference string=? old new))
|
||
(seek port (dynamic-entry-offset runpath) SEEK_SET)
|
||
(put-bytevector port (string->utf8 (string-join new ":")))
|
||
(put-u8 port 0))
|
||
(close-port port)
|
||
new))
|
||
(lambda (key . args)
|
||
(false-if-exception (close-port port))
|
||
(apply throw key args))))
|
||
|
||
|
||
(define-condition-type &missing-runpath-error &elf-error
|
||
missing-runpath-error?
|
||
(file missing-runpath-error-file))
|
||
|
||
(define-condition-type &runpath-too-long-error &elf-error
|
||
runpath-too-long-error?
|
||
(file runpath-too-long-error-file))
|
||
|
||
(define (set-file-runpath file path)
|
||
"Set the value of the DT_RUNPATH dynamic entry of FILE, which must name an
|
||
ELF file, to PATH, a list of strings. Raise a &missing-runpath-error or
|
||
&runpath-too-long-error when appropriate."
|
||
(define (call-with-input+output-file file proc)
|
||
(let ((port (open-file file "r+b")))
|
||
(guard (c (#t (close-port port) (raise c)))
|
||
(proc port)
|
||
(close-port port))))
|
||
|
||
(call-with-input+output-file file
|
||
(lambda (port)
|
||
(let* ((elf (parse-elf (get-bytevector-all port)))
|
||
(entries (dynamic-entries elf (dynamic-link-segment elf)))
|
||
(runpath (find (lambda (entry)
|
||
(= DT_RUNPATH (dynamic-entry-type entry)))
|
||
entries))
|
||
(path (string->utf8 (string-join path ":"))))
|
||
(unless runpath
|
||
(raise (condition (&missing-runpath-error (elf elf)
|
||
(file file)))))
|
||
|
||
;; There might be padding left beyond RUNPATH in the string table, but
|
||
;; we don't know, so assume there's no padding.
|
||
(unless (<= (bytevector-length path)
|
||
(bytevector-length
|
||
(string->utf8 (dynamic-entry-value runpath))))
|
||
(raise (condition (&runpath-too-long-error (elf #f #;elf)
|
||
(file file)))))
|
||
|
||
(seek port (dynamic-entry-offset runpath) SEEK_SET)
|
||
(put-bytevector port path)
|
||
(put-u8 port 0)))))
|
||
|
||
;;; Local Variables:
|
||
;;; eval: (put 'call-with-input+output-file 'scheme-indent-function 1)
|
||
;;; End:
|