mirror of
https://github.com/anchore/syft.git
synced 2025-11-17 08:23:15 +01:00
* follow convention for naming catalogers Signed-off-by: Alex Goodman <wagoodman@users.noreply.github.com> * fix cataloger name example Signed-off-by: Alex Goodman <wagoodman@users.noreply.github.com> --------- Signed-off-by: Alex Goodman <wagoodman@users.noreply.github.com>
283 lines
8.5 KiB
Go
283 lines
8.5 KiB
Go
package debian
|
|
|
|
import (
|
|
"fmt"
|
|
"io"
|
|
"path"
|
|
"path/filepath"
|
|
"sort"
|
|
"strings"
|
|
|
|
"github.com/anchore/packageurl-go"
|
|
"github.com/anchore/syft/internal"
|
|
"github.com/anchore/syft/internal/log"
|
|
"github.com/anchore/syft/syft/file"
|
|
"github.com/anchore/syft/syft/linux"
|
|
"github.com/anchore/syft/syft/pkg"
|
|
)
|
|
|
|
const (
|
|
md5sumsExt = ".md5sums"
|
|
conffilesExt = ".conffiles"
|
|
docsPath = "/usr/share/doc"
|
|
)
|
|
|
|
func newDpkgPackage(d pkg.DpkgDBEntry, dbLocation file.Location, resolver file.Resolver, release *linux.Release) pkg.Package {
|
|
// TODO: separate pr to license refactor, but explore extracting dpkg-specific license parsing into a separate function
|
|
licenses := make([]pkg.License, 0)
|
|
p := pkg.Package{
|
|
Name: d.Package,
|
|
Version: d.Version,
|
|
Licenses: pkg.NewLicenseSet(licenses...),
|
|
Locations: file.NewLocationSet(dbLocation.WithAnnotation(pkg.EvidenceAnnotationKey, pkg.PrimaryEvidenceAnnotation)),
|
|
PURL: packageURL(d, release),
|
|
Type: pkg.DebPkg,
|
|
Metadata: d,
|
|
}
|
|
|
|
if resolver != nil {
|
|
// the current entry only has what may have been listed in the status file, however, there are additional
|
|
// files that are listed in multiple other locations. We should retrieve them all and merge the file lists
|
|
// together.
|
|
mergeFileListing(resolver, dbLocation, &p)
|
|
|
|
// fetch additional data from the copyright file to derive the license information
|
|
addLicenses(resolver, dbLocation, &p)
|
|
}
|
|
|
|
p.SetID()
|
|
|
|
return p
|
|
}
|
|
|
|
// PackageURL returns the PURL for the specific Debian package (see https://github.com/package-url/purl-spec)
|
|
func packageURL(m pkg.DpkgDBEntry, distro *linux.Release) string {
|
|
if distro == nil {
|
|
return ""
|
|
}
|
|
|
|
if distro.ID != "debian" && !internal.StringInSlice("debian", distro.IDLike) {
|
|
return ""
|
|
}
|
|
|
|
qualifiers := map[string]string{
|
|
pkg.PURLQualifierArch: m.Architecture,
|
|
}
|
|
|
|
if m.Source != "" {
|
|
if m.SourceVersion != "" {
|
|
qualifiers[pkg.PURLQualifierUpstream] = fmt.Sprintf("%s@%s", m.Source, m.SourceVersion)
|
|
} else {
|
|
qualifiers[pkg.PURLQualifierUpstream] = m.Source
|
|
}
|
|
}
|
|
|
|
return packageurl.NewPackageURL(
|
|
packageurl.TypeDebian,
|
|
distro.ID,
|
|
m.Package,
|
|
m.Version,
|
|
pkg.PURLQualifiers(
|
|
qualifiers,
|
|
distro,
|
|
),
|
|
"",
|
|
).ToString()
|
|
}
|
|
|
|
func addLicenses(resolver file.Resolver, dbLocation file.Location, p *pkg.Package) {
|
|
metadata, ok := p.Metadata.(pkg.DpkgDBEntry)
|
|
if !ok {
|
|
log.WithFields("package", p).Warn("unable to extract DPKG metadata to add licenses")
|
|
return
|
|
}
|
|
|
|
// get license information from the copyright file
|
|
copyrightReader, copyrightLocation := fetchCopyrightContents(resolver, dbLocation, metadata)
|
|
|
|
if copyrightReader != nil && copyrightLocation != nil {
|
|
defer internal.CloseAndLogError(copyrightReader, copyrightLocation.VirtualPath)
|
|
// attach the licenses
|
|
licenseStrs := parseLicensesFromCopyright(copyrightReader)
|
|
for _, licenseStr := range licenseStrs {
|
|
p.Licenses.Add(pkg.NewLicenseFromLocations(licenseStr, copyrightLocation.WithoutAnnotations()))
|
|
}
|
|
// keep a record of the file where this was discovered
|
|
p.Locations.Add(*copyrightLocation)
|
|
}
|
|
}
|
|
|
|
func mergeFileListing(resolver file.Resolver, dbLocation file.Location, p *pkg.Package) {
|
|
metadata, ok := p.Metadata.(pkg.DpkgDBEntry)
|
|
if !ok {
|
|
log.WithFields("package", p).Warn("unable to extract DPKG metadata to file listing")
|
|
return
|
|
}
|
|
|
|
// get file listing (package files + additional config files)
|
|
files, infoLocations := getAdditionalFileListing(resolver, dbLocation, metadata)
|
|
loopNewFiles:
|
|
for _, newFile := range files {
|
|
for _, existingFile := range metadata.Files {
|
|
if existingFile.Path == newFile.Path {
|
|
// skip adding this file since it already exists
|
|
continue loopNewFiles
|
|
}
|
|
}
|
|
metadata.Files = append(metadata.Files, newFile)
|
|
}
|
|
|
|
// sort files by path
|
|
sort.SliceStable(metadata.Files, func(i, j int) bool {
|
|
return metadata.Files[i].Path < metadata.Files[j].Path
|
|
})
|
|
|
|
// persist alterations
|
|
p.Metadata = metadata
|
|
|
|
// persist location information from each new source of information
|
|
p.Locations.Add(infoLocations...)
|
|
}
|
|
|
|
func getAdditionalFileListing(resolver file.Resolver, dbLocation file.Location, m pkg.DpkgDBEntry) ([]pkg.DpkgFileRecord, []file.Location) {
|
|
// ensure the default value for a collection is never nil since this may be shown as JSON
|
|
var files = make([]pkg.DpkgFileRecord, 0)
|
|
var locations []file.Location
|
|
|
|
md5Reader, md5Location := fetchMd5Contents(resolver, dbLocation, m)
|
|
|
|
if md5Reader != nil && md5Location != nil {
|
|
defer internal.CloseAndLogError(md5Reader, md5Location.VirtualPath)
|
|
// attach the file list
|
|
files = append(files, parseDpkgMD5Info(md5Reader)...)
|
|
|
|
// keep a record of the file where this was discovered
|
|
locations = append(locations, *md5Location)
|
|
}
|
|
|
|
conffilesReader, conffilesLocation := fetchConffileContents(resolver, dbLocation, m)
|
|
|
|
if conffilesReader != nil && conffilesLocation != nil {
|
|
defer internal.CloseAndLogError(conffilesReader, conffilesLocation.VirtualPath)
|
|
// attach the file list
|
|
files = append(files, parseDpkgConffileInfo(conffilesReader)...)
|
|
|
|
// keep a record of the file where this was discovered
|
|
locations = append(locations, *conffilesLocation)
|
|
}
|
|
|
|
return files, locations
|
|
}
|
|
|
|
//nolint:dupl
|
|
func fetchMd5Contents(resolver file.Resolver, dbLocation file.Location, m pkg.DpkgDBEntry) (io.ReadCloser, *file.Location) {
|
|
var md5Reader io.ReadCloser
|
|
var err error
|
|
|
|
if resolver == nil {
|
|
return nil, nil
|
|
}
|
|
|
|
// for typical debian-base distributions, the installed package info is at /var/lib/dpkg/status
|
|
// and the md5sum information is under /var/lib/dpkg/info/; however, for distroless the installed
|
|
// package info is across multiple files under /var/lib/dpkg/status.d/ and the md5sums are contained in
|
|
// the same directory
|
|
searchPath := filepath.Dir(dbLocation.RealPath)
|
|
|
|
if !strings.HasSuffix(searchPath, "status.d") {
|
|
searchPath = path.Join(searchPath, "info")
|
|
}
|
|
|
|
// look for /var/lib/dpkg/info/NAME:ARCH.md5sums
|
|
name := md5Key(m)
|
|
location := resolver.RelativeFileByPath(dbLocation, path.Join(searchPath, name+md5sumsExt))
|
|
|
|
if location == nil {
|
|
// the most specific key did not work, fallback to just the name
|
|
// look for /var/lib/dpkg/info/NAME.md5sums
|
|
location = resolver.RelativeFileByPath(dbLocation, path.Join(searchPath, m.Package+md5sumsExt))
|
|
}
|
|
|
|
if location == nil {
|
|
return nil, nil
|
|
}
|
|
|
|
// this is unexpected, but not a show-stopper
|
|
md5Reader, err = resolver.FileContentsByLocation(*location)
|
|
if err != nil {
|
|
log.Warnf("failed to fetch deb md5 contents (package=%s): %+v", m.Package, err)
|
|
}
|
|
|
|
l := location.WithAnnotation(pkg.EvidenceAnnotationKey, pkg.SupportingEvidenceAnnotation)
|
|
|
|
return md5Reader, &l
|
|
}
|
|
|
|
//nolint:dupl
|
|
func fetchConffileContents(resolver file.Resolver, dbLocation file.Location, m pkg.DpkgDBEntry) (io.ReadCloser, *file.Location) {
|
|
var reader io.ReadCloser
|
|
var err error
|
|
|
|
if resolver == nil {
|
|
return nil, nil
|
|
}
|
|
|
|
parentPath := filepath.Dir(dbLocation.RealPath)
|
|
|
|
// look for /var/lib/dpkg/info/NAME:ARCH.conffiles
|
|
name := md5Key(m)
|
|
location := resolver.RelativeFileByPath(dbLocation, path.Join(parentPath, "info", name+conffilesExt))
|
|
|
|
if location == nil {
|
|
// the most specific key did not work, fallback to just the name
|
|
// look for /var/lib/dpkg/info/NAME.conffiles
|
|
location = resolver.RelativeFileByPath(dbLocation, path.Join(parentPath, "info", m.Package+conffilesExt))
|
|
}
|
|
|
|
if location == nil {
|
|
return nil, nil
|
|
}
|
|
|
|
// this is unexpected, but not a show-stopper
|
|
reader, err = resolver.FileContentsByLocation(*location)
|
|
if err != nil {
|
|
log.Warnf("failed to fetch deb conffiles contents (package=%s): %+v", m.Package, err)
|
|
}
|
|
|
|
l := location.WithAnnotation(pkg.EvidenceAnnotationKey, pkg.SupportingEvidenceAnnotation)
|
|
|
|
return reader, &l
|
|
}
|
|
|
|
func fetchCopyrightContents(resolver file.Resolver, dbLocation file.Location, m pkg.DpkgDBEntry) (io.ReadCloser, *file.Location) {
|
|
if resolver == nil {
|
|
return nil, nil
|
|
}
|
|
|
|
// look for /usr/share/docs/NAME/copyright files
|
|
copyrightPath := path.Join(docsPath, m.Package, "copyright")
|
|
location := resolver.RelativeFileByPath(dbLocation, copyrightPath)
|
|
|
|
// we may not have a copyright file for each package, ignore missing files
|
|
if location == nil {
|
|
return nil, nil
|
|
}
|
|
|
|
reader, err := resolver.FileContentsByLocation(*location)
|
|
if err != nil {
|
|
log.Warnf("failed to fetch deb copyright contents (package=%s): %w", m.Package, err)
|
|
}
|
|
|
|
l := location.WithAnnotation(pkg.EvidenceAnnotationKey, pkg.SupportingEvidenceAnnotation)
|
|
|
|
return reader, &l
|
|
}
|
|
|
|
func md5Key(metadata pkg.DpkgDBEntry) string {
|
|
contentKey := metadata.Package
|
|
if metadata.Architecture != "" && metadata.Architecture != "all" {
|
|
contentKey = contentKey + ":" + metadata.Architecture
|
|
}
|
|
return contentKey
|
|
}
|