Docker layer caching #2696
base: main
Changes from all commits: bff60ef, 1dade6c, e5b691b, 1e14c68, 9b09684, e3cb083
@@ -28,6 +28,7 @@ import (
	"github.com/trufflesecurity/trufflehog/v3/pkg/pb/source_metadatapb"
	"github.com/trufflesecurity/trufflehog/v3/pkg/pb/sourcespb"
	"github.com/trufflesecurity/trufflehog/v3/pkg/sources"
	"github.com/trufflesecurity/trufflehog/v3/pkg/sources/docker"
)

var overlapError = errors.New("More than one detector has found this result. For your safety, verification has been disabled. You can override this behavior by using the --allow-verification-overlap flag.")
@@ -105,6 +106,10 @@ type Engine struct {
	// verify determines whether the scanner will attempt to verify candidate secrets
	verify bool

	// dockerCache and dockerCacheDb are used to cache the results of scanning docker layers.
	dockerCache bool
	dockerCacheDb string

	// Note: bad hack only used for testing
	verificationOverlapTracker *verificationOverlapTracker
}
@@ -239,6 +244,14 @@ func WithVerificationOverlap(verificationOverlap bool) Option {
	}
}

// WithDockerCache enables caching of the results of scanning docker layers.
func WithDockerCache(dockerCache bool, dockerCacheDb string) Option {
	return func(e *Engine) {
		e.dockerCache = dockerCache
		e.dockerCacheDb = dockerCacheDb
	}
}

func filterDetectors(filterFunc func(detectors.Detector) bool, input []detectors.Detector) []detectors.Detector {
	var out []detectors.Detector
	for _, detector := range input {
@@ -864,6 +877,32 @@ func (e *Engine) processResult(ctx context.Context, data detectableChunk, res de

func (e *Engine) notifyResults(ctx context.Context) {
	for r := range e.ResultsChan() {

		// Handle docker layer caching if applicable
		if e.dockerCache && r.SourceType == sourcespb.SourceType_SOURCE_TYPE_DOCKER {
			layer := r.SourceMetadata.GetDocker().Layer
			db, err := docker.ConnectToLayersDB(e.dockerCacheDb)
Review thread on the ConnectToLayersDB call above:

suggestion: I noticed that the code creates and closes a new database connection for each result processed in notifyResults. Establishing and tearing down a connection for every result could introduce significant performance overhead, especially when the number of results is large. To mitigate this, I suggest establishing the database connection earlier in the engine's lifecycle and leveraging connection pooling, so multiple goroutines can share and reuse a pool of pre-established connections instead of opening and closing one per operation. Concretely, we could create the pool when initializing the engine, acquire a connection from it for each result, perform the database operations, and release the connection back to the pool when finished. What are your thoughts? Do you think it's feasible to establish connections earlier and use connection pooling here?

Author reply: As I authored the code, I did think it was creating/closing db connections a lot, but I honestly wasn't sure of the most efficient way to implement it. I think connection pooling would be a good addition, but I could use a hand with it since I haven't implemented anything like that before.

Reviewer reply: Sure thing. Maybe we can do something like:
// Add the pool to the engine.
// Connect during init.
// Use the pool for operations.
			if err != nil {
				ctx.Logger().Error(err, "error connecting to docker cache")
				err = docker.UpdateCompleted(db, layer, false)
				if err != nil {
					ctx.Logger().Error(err, "error updating docker cache")
				}
			}
			if r.Verified {
				err = docker.UpdateVerified(db, layer, true)
			} else if r.VerificationError() != nil {
				err = docker.UpdateUnverified(db, layer, true)
			}
			if err != nil {
				ctx.Logger().Error(err, "error adding to docker cache")
				err = docker.UpdateCompleted(db, layer, false)
				if err != nil {
					ctx.Logger().Error(err, "error updating docker cache")
				}
			}
		}

		// Filter unwanted results, based on `--results`.
		if !r.Verified {
			if r.VerificationError() != nil {
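For reference, here is a rough sketch (not part of this PR) of what the connection-reuse suggestion from the thread above could look like in Go. A *sql.DB from database/sql is already a concurrency-safe connection pool, so the engine could open it once during initialization and share it across results; the driver, table, type, and helper names below are illustrative assumptions rather than TruffleHog's actual code.

package enginecache

import (
	"context"
	"database/sql"
	"time"

	_ "github.com/mattn/go-sqlite3" // assumed sqlite driver; the PR may use another
)

// Engine mirrors only the fields relevant to this sketch.
type Engine struct {
	dockerCache   bool
	dockerCacheDB *sql.DB // shared pool, opened once during engine init
}

// openDockerCache opens the cache database a single time; *sql.DB then
// manages pooled connections internally and is safe for concurrent use.
func openDockerCache(path string) (*sql.DB, error) {
	db, err := sql.Open("sqlite3", path)
	if err != nil {
		return nil, err
	}
	// SQLite tolerates few concurrent writers, so keep the pool small.
	db.SetMaxOpenConns(1)
	db.SetMaxIdleConns(1)
	db.SetConnMaxLifetime(time.Hour)
	return db, db.Ping()
}

// markLayerVerified reuses the shared pool for each result instead of
// dialing a fresh connection inside notifyResults.
func (e *Engine) markLayerVerified(ctx context.Context, layer string) error {
	_, err := e.dockerCacheDB.ExecContext(ctx,
		`UPDATE layers SET verified = 1 WHERE digest = ?`, layer)
	return err
}

With something like this in place, notifyResults would only touch the shared e.dockerCacheDB rather than calling docker.ConnectToLayersDB once per result.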
A second review thread discusses the scope of the cache:

If we're persisting data, it may be prudent to make the name more generic in case there's other stuff worth caching in the future, e.g. caching binary files rather than re-scanning them.
Are you thinking about data caching outside of the Docker source or within it?
I was thinking about data caching in general. I've previously experimented with using sqlite to do things like skip duplicate docker layers, binary files, and commits; cache GitHub API E-Tags; track progress so that scans can be resumed; etc.
Then again, based on @rosecodym's comment about performance it may not be desirable to re-use the same database for multiple purposes.
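To make the "more generic" idea concrete, here is a loose sketch (again, not code from this PR or from TruffleHog) of a single sqlite table keyed by artifact kind and digest that could cover docker layers, binary files, and commits alike; every name below is hypothetical.

package scancache

import (
	"database/sql"

	_ "github.com/mattn/go-sqlite3" // assumed sqlite driver
)

const schema = `
CREATE TABLE IF NOT EXISTS scanned_artifacts (
	kind      TEXT NOT NULL, -- "docker_layer", "binary_file", "commit", ...
	digest    TEXT NOT NULL, -- layer digest, file hash, or commit SHA
	completed INTEGER NOT NULL DEFAULT 0,
	verified  INTEGER NOT NULL DEFAULT 0,
	PRIMARY KEY (kind, digest)
);`

// Open prepares the shared cache database and ensures the schema exists.
func Open(path string) (*sql.DB, error) {
	db, err := sql.Open("sqlite3", path)
	if err != nil {
		return nil, err
	}
	if _, err := db.Exec(schema); err != nil {
		db.Close()
		return nil, err
	}
	return db, nil
}

// Seen reports whether an artifact has already been fully scanned, letting a
// source skip it (e.g. a duplicate layer or binary file).
func Seen(db *sql.DB, kind, digest string) (bool, error) {
	var completed int
	err := db.QueryRow(
		`SELECT completed FROM scanned_artifacts WHERE kind = ? AND digest = ?`,
		kind, digest).Scan(&completed)
	if err == sql.ErrNoRows {
		return false, nil
	}
	return completed == 1, err
}

Whether such a general-purpose cache should share a database with the docker layer cache is exactly the open question raised above, given the per-result write traffic discussed in the performance thread.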