Skip to content

Commit

Permalink
update ConditionalDetector logic
Browse files Browse the repository at this point in the history
  • Loading branch information
rgmz authored and Richard Gomez committed Jun 5, 2024
1 parent 799bbda commit 907da3a
Show file tree
Hide file tree
Showing 4 changed files with 48 additions and 17 deletions.
16 changes: 10 additions & 6 deletions pkg/detectors/detectors.go
Original file line number Diff line number Diff line change
Expand Up @@ -30,18 +30,22 @@ type Detector interface {
// ConditionalDetector is an optional interface that a detector can implement to
// skip chunks based on specific criteria.
type ConditionalDetector interface {
// ScanChunk determines whether the detector should run.
ScanChunk(chunk sources.Chunk) bool
// ShouldScanChunk determines whether the detector should run.
ShouldScanChunk(chunk sources.Chunk) bool
}

// FilenameConditions is a set of common conditions to be used by ConditionalDetector.
var lockFilePat = regexp.MustCompile(`(^|/)(package(-lock)?\.json|yarn\.lock)$`)

// Conditions is a set of common conditions to be used by ConditionalDetector.
// (Using anonymous structs is weird, but Go has no concept of static members... https://stackoverflow.com/a/55390104)
var FilenameConditions = struct {
var Conditions = struct {
// LockFiles are a common source of false-positives.
// https://github.com/trufflesecurity/trufflehog/issues/1460
LockFiles *regexp.Regexp
IsLockFile func(path string) bool
}{
LockFiles: regexp.MustCompile(`(^|/)(package(-lock)?\.json|yarn\.lock)$`),
IsLockFile: func(path string) bool {
return lockFilePat.MatchString(path)
},
}

// Versioner is an optional interface that a detector can implement to
Expand Down
7 changes: 3 additions & 4 deletions pkg/detectors/parseur/parseur.go
Original file line number Diff line number Diff line change
Expand Up @@ -35,10 +35,9 @@ func (s Scanner) Keywords() []string {
return []string{"parseur"}
}

func (s Scanner) ScanChunk(chunk sources.Chunk) bool {
// TODO: Can |chunk.SourceMetadata| be nil?
if m, ok := chunk.SourceMetadata.GetData().(sources.GitSourceMetadata); ok {
return !detectors.FilenameConditions.LockFiles.MatchString(m.GetFile())
func (s Scanner) ShouldScanChunk(chunk sources.Chunk) bool {
if m, ok := sources.NewGitSourceMetadata(chunk.SourceType, chunk.SourceMetadata); ok {
return !detectors.Conditions.IsLockFile(m.File)
}
return true
}
Expand Down
2 changes: 1 addition & 1 deletion pkg/engine/engine.go
Original file line number Diff line number Diff line change
Expand Up @@ -637,7 +637,7 @@ func (e *Engine) detectorWorker(ctx context.Context) {
}

for k, detector := range chunkSpecificDetectors {
if d, ok := detector.(detectors.ConditionalDetector); ok && !d.ScanChunk(*chunk) {
if d, ok := detector.(detectors.ConditionalDetector); ok && !d.ShouldScanChunk(*chunk) {
ctx.Logger().V(4).Info("skipping detector for chunk", "detector", detector.Type().String(), "chunk", chunk)
delete(chunkSpecificDetectors, k)
continue
Expand Down
40 changes: 34 additions & 6 deletions pkg/sources/sources.go
Original file line number Diff line number Diff line change
Expand Up @@ -45,12 +45,40 @@ type Chunk struct {
Verify bool
}

// GitSourceMetadata defines a common interface for Git-based source metadata.
// For example, this should match Git, Azure, Bitbucket, GitHub, and Gitlab.
type GitSourceMetadata interface {
GetRepository() string
GetCommit() string
GetFile() string
// GitSourceMetadata defines a common struct for Git-based source metadata.
type GitSourceMetadata struct {
Repository string
Commit string
File string
}

func NewGitSourceMetadata(source sourcespb.SourceType, data *source_metadatapb.MetaData) (*GitSourceMetadata, bool) {
if data == nil {
return nil, false
}

switch source {
case sourcespb.SourceType_SOURCE_TYPE_GIT:
md := data.GetGit()
return &GitSourceMetadata{md.GetRepository(), md.GetCommit(), md.GetFile()}, true
case sourcespb.SourceType_SOURCE_TYPE_AZURE_REPOS:
md := data.GetAzureRepos()
return &GitSourceMetadata{md.GetRepository(), md.GetCommit(), md.GetFile()}, true
case sourcespb.SourceType_SOURCE_TYPE_BITBUCKET:
md := data.GetBitbucket()
return &GitSourceMetadata{md.GetRepository(), md.GetCommit(), md.GetFile()}, true
case sourcespb.SourceType_SOURCE_TYPE_GERRIT:
md := data.GetGerrit()
return &GitSourceMetadata{md.GetProject(), md.GetCommit(), md.GetFile()}, true
case sourcespb.SourceType_SOURCE_TYPE_GITHUB:
md := data.GetGithub()
return &GitSourceMetadata{md.GetRepository(), md.GetCommit(), md.GetFile()}, true
case sourcespb.SourceType_SOURCE_TYPE_GITLAB:
md := data.GetGitlab()
return &GitSourceMetadata{md.GetRepository(), md.GetCommit(), md.GetFile()}, true
default:
return nil, false
}
}

// ChunkingTarget specifies criteria for a targeted chunking process.
Expand Down

0 comments on commit 907da3a

Please sign in to comment.