Skip to content

Commit

Permalink
Improve frequency-based upgrade heuristics, add flag to disable (#342)
Browse files Browse the repository at this point in the history
* Improve frequency-based upgrade heuristics, add flag to disable

* Update samples

* Increase score of unusually small binaries

* add period at end of godoc line

* Rename flag to --quantity-increases-risk

* tighten up the upgrade numbers

* tighten up the upgrade numbers

---------

Co-authored-by: Evan Gibler <[email protected]>
  • Loading branch information
tstromberg and egibs authored Jul 9, 2024
1 parent e1a894f commit 246762a
Show file tree
Hide file tree
Showing 17 changed files with 184 additions and 109 deletions.
30 changes: 16 additions & 14 deletions bincapz.go
Original file line number Diff line number Diff line change
Expand Up @@ -70,6 +70,7 @@ func main() {
errFirstHitFlag := flag.Bool("err-first-hit", false, "exit with error if scan source has matching capabilities")
ociFlag := flag.Bool("oci", false, "Scan an OCI image")
omitEmptyFlag := flag.Bool("omit-empty", false, "Omit files that contain no matches")
quantityIncreasesRiskFlag := flag.Bool("quantity-increases-risk", true, "increase file risk score based on behavior quantity")
profileFlag := flag.Bool("profile", false, "Generate profile and trace files")
statsFlag := flag.Bool("stats", false, "Show statistics about the scan")
thirdPartyFlag := flag.Bool("third-party", true, "Include third-party rules, which may have licensing restrictions")
Expand Down Expand Up @@ -178,20 +179,21 @@ func main() {
return
}

bc := action.Config{
IgnoreSelf: *ignoreSelfFlag,
IgnoreTags: ignoreTags,
IncludeDataFiles: includeDataFiles,
MinFileRisk: minFileRisk,
MinRisk: minRisk,
OCI: *ociFlag,
OmitEmpty: *omitEmptyFlag,
Renderer: renderer,
Rules: yrs,
ScanPaths: args,
Stats: stats,
ErrFirstHit: *errFirstHitFlag,
ErrFirstMiss: *errFirstMissFlag,
bc := bincapz.Config{
IgnoreSelf: *ignoreSelfFlag,
IgnoreTags: ignoreTags,
IncludeDataFiles: includeDataFiles,
MinFileRisk: minFileRisk,
MinRisk: minRisk,
QuantityIncreasesFisk: *quantityIncreasesRiskFlag,
OCI: *ociFlag,
OmitEmpty: *omitEmptyFlag,
Renderer: renderer,
Rules: yrs,
ScanPaths: args,
Stats: stats,
ErrFirstHit: *errFirstHitFlag,
ErrFirstMiss: *errFirstMissFlag,
}

var res *bincapz.Report
Expand Down
24 changes: 0 additions & 24 deletions pkg/action/action.go
Original file line number Diff line number Diff line change
Expand Up @@ -2,27 +2,3 @@
// SPDX-License-Identifier: Apache-2.0

package action

import (
"io"

"github.com/chainguard-dev/bincapz/pkg/render"
"github.com/hillu/go-yara/v4"
)

type Config struct {
IgnoreSelf bool
IgnoreTags []string
IncludeDataFiles bool
MinFileRisk int
MinRisk int
OCI bool
OmitEmpty bool
Output io.Writer
Renderer render.Renderer
Rules *yara.Rules
ScanPaths []string
Stats bool
ErrFirstMiss bool
ErrFirstHit bool
}
3 changes: 2 additions & 1 deletion pkg/action/archive_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,7 @@ import (
"strings"
"testing"

"github.com/chainguard-dev/bincapz/pkg/bincapz"
"github.com/chainguard-dev/bincapz/pkg/compile"
"github.com/chainguard-dev/bincapz/pkg/render"
"github.com/chainguard-dev/bincapz/rules"
Expand Down Expand Up @@ -228,7 +229,7 @@ func TestScanArchive(t *testing.T) {
if err != nil {
t.Fatalf("render: %v", err)
}
bc := Config{
bc := bincapz.Config{
IgnoreSelf: false,
IgnoreTags: []string{"harmless"},
Renderer: simple,
Expand Down
16 changes: 8 additions & 8 deletions pkg/action/diff.go
Original file line number Diff line number Diff line change
Expand Up @@ -16,7 +16,7 @@ import (
"github.com/chainguard-dev/clog"
)

func relFileReport(ctx context.Context, c Config, fromPath string) (map[string]*bincapz.FileReport, error) {
func relFileReport(ctx context.Context, c bincapz.Config, fromPath string) (map[string]*bincapz.FileReport, error) {
fromConfig := c
fromConfig.Renderer = nil
fromConfig.ScanPaths = []string{fromPath}
Expand All @@ -40,7 +40,7 @@ func relFileReport(ctx context.Context, c Config, fromPath string) (map[string]*
return fromRelPath, nil
}

func Diff(ctx context.Context, c Config) (*bincapz.Report, error) {
func Diff(ctx context.Context, c bincapz.Config) (*bincapz.Report, error) {
if len(c.ScanPaths) != 2 {
return nil, fmt.Errorf("diff mode requires 2 paths, you passed in %d path(s)", len(c.ScanPaths))
}
Expand Down Expand Up @@ -68,7 +68,7 @@ func Diff(ctx context.Context, c Config) (*bincapz.Report, error) {
return &bincapz.Report{Diff: d}, err
}

func processSrc(ctx context.Context, c Config, src, dest map[string]*bincapz.FileReport, d *bincapz.DiffReport) {
func processSrc(ctx context.Context, c bincapz.Config, src, dest map[string]*bincapz.FileReport, d *bincapz.DiffReport) {
// things that appear in the source
for relPath, fr := range src {
tr, exists := dest[relPath]
Expand All @@ -80,7 +80,7 @@ func processSrc(ctx context.Context, c Config, src, dest map[string]*bincapz.Fil
}
}

func handleFile(ctx context.Context, c Config, fr, tr *bincapz.FileReport, relPath string, d *bincapz.DiffReport) {
func handleFile(ctx context.Context, c bincapz.Config, fr, tr *bincapz.FileReport, relPath string, d *bincapz.DiffReport) {
// We've now established that file exists in both source & destination
if fr.RiskScore < c.MinFileRisk && tr.RiskScore < c.MinFileRisk {
clog.FromContext(ctx).Info("diff does not meet min trigger level", slog.Any("path", tr.Path))
Expand Down Expand Up @@ -120,7 +120,7 @@ func behaviorExists(b *bincapz.Behavior, behaviors []*bincapz.Behavior) bool {
return false
}

func processDest(ctx context.Context, c Config, from, to map[string]*bincapz.FileReport, d *bincapz.DiffReport) {
func processDest(ctx context.Context, c bincapz.Config, from, to map[string]*bincapz.FileReport, d *bincapz.DiffReport) {
// things that exist in the destination
for relPath, tr := range to {
fr, exists := from[relPath]
Expand All @@ -133,7 +133,7 @@ func processDest(ctx context.Context, c Config, from, to map[string]*bincapz.Fil
}
}

func fileDestination(ctx context.Context, c Config, fr, tr *bincapz.FileReport, relPath string, d *bincapz.DiffReport) {
func fileDestination(ctx context.Context, c bincapz.Config, fr, tr *bincapz.FileReport, relPath string, d *bincapz.DiffReport) {
// We've now established that this file exists in both source and destination
if fr.RiskScore < c.MinFileRisk && tr.RiskScore < c.MinFileRisk {
clog.FromContext(ctx).Info("diff does not meet min trigger level", slog.Any("path", tr.Path))
Expand All @@ -158,7 +158,7 @@ func fileDestination(ctx context.Context, c Config, fr, tr *bincapz.FileReport,
}
}

func inferMoves(ctx context.Context, c Config, d *bincapz.DiffReport) {
func inferMoves(ctx context.Context, c bincapz.Config, d *bincapz.DiffReport) {
// Walk over the added/removed paths and infer moves based on the
// levenshtein distance of the file names. If the distance is a 90+% match,
// then treat it as a move.
Expand All @@ -184,7 +184,7 @@ func inferMoves(ctx context.Context, c Config, d *bincapz.DiffReport) {
}
}

func fileMove(ctx context.Context, c Config, fr, tr *bincapz.FileReport, rpath, apath string, score float64, d *bincapz.DiffReport) {
func fileMove(ctx context.Context, c bincapz.Config, fr, tr *bincapz.FileReport, rpath, apath string, score float64, d *bincapz.DiffReport) {
if fr.RiskScore < c.MinFileRisk && tr.RiskScore < c.MinFileRisk {
clog.FromContext(ctx).Info("diff does not meet min trigger level", slog.Any("path", tr.Path))
return
Expand Down
3 changes: 2 additions & 1 deletion pkg/action/oci_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,7 @@ import (
"regexp"
"testing"

"github.com/chainguard-dev/bincapz/pkg/bincapz"
"github.com/chainguard-dev/bincapz/pkg/compile"
"github.com/chainguard-dev/bincapz/pkg/render"
"github.com/chainguard-dev/bincapz/rules"
Expand Down Expand Up @@ -45,7 +46,7 @@ func TestOCI(t *testing.T) {
t.Fatalf("oci: %v", err)
}

bc := Config{
bc := bincapz.Config{
IgnoreSelf: false,
IgnoreTags: []string{"harmless"},
Renderer: simple,
Expand Down
12 changes: 6 additions & 6 deletions pkg/action/scan.go
Original file line number Diff line number Diff line change
Expand Up @@ -69,7 +69,7 @@ func formatPath(path string) string {
}

// scanSinglePath YARA scans a single path and converts it to a fileReport.
func scanSinglePath(ctx context.Context, c Config, yrs *yara.Rules, path string, absPath string, archiveRoot string) (*bincapz.FileReport, error) {
func scanSinglePath(ctx context.Context, c bincapz.Config, yrs *yara.Rules, path string, absPath string, archiveRoot string) (*bincapz.FileReport, error) {
logger := clog.FromContext(ctx)
var mrs yara.MatchRules
logger = logger.With("path", path)
Expand All @@ -87,7 +87,7 @@ func scanSinglePath(ctx context.Context, c Config, yrs *yara.Rules, path string,
return &bincapz.FileReport{Path: path, Error: fmt.Sprintf("scanfile: %v", err)}, nil
}

fr, err := report.Generate(ctx, path, mrs, c.IgnoreTags, c.MinRisk, c.IgnoreSelf)
fr, err := report.Generate(ctx, path, mrs, c)
if err != nil {
return nil, err
}
Expand Down Expand Up @@ -148,7 +148,7 @@ func errIfHitOrMiss(frs map[string]*bincapz.FileReport, kind string, scanPath st
}

// recursiveScan recursively YARA scans the configured paths - handling archives and OCI images.
func recursiveScan(ctx context.Context, c Config) (*bincapz.Report, error) {
func recursiveScan(ctx context.Context, c bincapz.Config) (*bincapz.Report, error) {
logger := clog.FromContext(ctx)
logger.Debug("recursive scan", slog.Any("config", c))
r := &bincapz.Report{
Expand Down Expand Up @@ -255,7 +255,7 @@ func recursiveScan(ctx context.Context, c Config) (*bincapz.Report, error) {
}

// processArchive extracts and scans a single archive file.
func processArchive(ctx context.Context, c Config, yrs *yara.Rules, archivePath string, logger *clog.Logger) (map[string]*bincapz.FileReport, error) {
func processArchive(ctx context.Context, c bincapz.Config, yrs *yara.Rules, archivePath string, logger *clog.Logger) (map[string]*bincapz.FileReport, error) {
logger = logger.With("archivePath", archivePath)

var err error
Expand Down Expand Up @@ -288,7 +288,7 @@ func processArchive(ctx context.Context, c Config, yrs *yara.Rules, archivePath
}

// processFile scans a single output file, rendering live output if available.
func processFile(ctx context.Context, c Config, yrs *yara.Rules, path string, scanPath string, archiveRoot string, logger *clog.Logger) (*bincapz.FileReport, error) {
func processFile(ctx context.Context, c bincapz.Config, yrs *yara.Rules, path string, scanPath string, archiveRoot string, logger *clog.Logger) (*bincapz.FileReport, error) {
logger = logger.With("path", path)

fr, err := scanSinglePath(ctx, c, yrs, path, scanPath, archiveRoot)
Expand Down Expand Up @@ -321,7 +321,7 @@ func processFile(ctx context.Context, c Config, yrs *yara.Rules, path string, sc
}

// Scan YARA scans a data source, applying output filters if necessary.
func Scan(ctx context.Context, c Config) (*bincapz.Report, error) {
func Scan(ctx context.Context, c bincapz.Config) (*bincapz.Report, error) {
r, err := recursiveScan(ctx, c)
if err != nil {
return r, err
Expand Down
32 changes: 32 additions & 0 deletions pkg/bincapz/bincapz.go
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,37 @@

package bincapz

import (
"context"
"io"

"github.com/hillu/go-yara/v4"
)

// Renderer is a common interface for Renderers.
type Renderer interface {
File(context.Context, *FileReport) error
Full(context.Context, *Report) error
}

type Config struct {
IgnoreSelf bool
IgnoreTags []string
IncludeDataFiles bool
QuantityIncreasesFisk bool
MinFileRisk int
MinRisk int
OCI bool
OmitEmpty bool
Output io.Writer
Renderer Renderer
Rules *yara.Rules
ScanPaths []string
Stats bool
ErrFirstMiss bool
ErrFirstHit bool
}

type Behavior struct {
Description string `json:",omitempty" yaml:",omitempty"`
// MatchStrings are all strings found relating to this behavior
Expand All @@ -29,6 +60,7 @@ type Behavior struct {
type FileReport struct {
Path string
SHA256 string
Size int64
// compiler -> x
Error string `json:",omitempty" yaml:",omitempty"`
Skipped string `json:",omitempty" yaml:",omitempty"`
Expand Down
9 changes: 1 addition & 8 deletions pkg/render/render.go
Original file line number Diff line number Diff line change
Expand Up @@ -4,21 +4,14 @@
package render

import (
"context"
"fmt"
"io"

"github.com/chainguard-dev/bincapz/pkg/bincapz"
)

// Renderer is a common interface for Renderers.
type Renderer interface {
File(context.Context, *bincapz.FileReport) error
Full(context.Context, *bincapz.Report) error
}

// New returns a new Renderer.
func New(kind string, w io.Writer) (Renderer, error) {
func New(kind string, w io.Writer) (bincapz.Renderer, error) {
switch kind {
case "", "auto", "terminal":
return NewTerminal(w), nil
Expand Down
Loading

0 comments on commit 246762a

Please sign in to comment.