vulncheck/source.go - vuln - Git at Google

 // Copyright 2021 The Go Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.

 package vulncheck

 import (
 	"golang.org/x/tools/go/callgraph"
 	"golang.org/x/tools/go/ssa"
 	"golang.org/x/vulndb/osv"
 )

 // Source detects vulnerabilities in pkgs and computes slices of
 //  - imports graph related to an import of a package with some
 //    known vulnerabilities
 //  - requires graph related to a require of a module with a
 //    package that has some known vulnerabilities
 //  - call graph leading to the use of a known vulnerable function
 //    or method
 func Source(pkgs []*Package, cfg *Config) (*Result, error) {
 	modVulns, err := fetchVulnerabilities(cfg.Client, extractModules(pkgs))
 	if err != nil {
 		return nil, err
 	}

 	result := &Result{
 		Imports:  &ImportGraph{Packages: make(map[int]*PkgNode)},
 		Requires: &RequireGraph{Modules: make(map[int]*ModNode)},
 		Calls:    &CallGraph{Funcs: make(map[int]*FuncNode)},
 	}

 	vulnPkgModSlice(pkgs, modVulns, result)

 	if cfg.ImportsOnly {
 		return result, nil
 	}

 	prog, ssaPkgs := buildSSA(pkgs)
 	entries := entryPoints(ssaPkgs)
 	cg := callGraph(prog, entries)
 	vulnCallGraphSlice(entries, modVulns, cg, result)

 	return result, nil
 }

 // pkgID is an id counter for nodes of Imports graph.
 var pkgID int = 0

 func nextPkgID() int {
 	pkgID++
 	return pkgID
 }

 // vulnPkgModSlice computes the slice of pkgs imports and requires graph
 // leading to imports/requires of vulnerable packages/modules in modVulns
 // and stores the computed slices to result.
 func vulnPkgModSlice(pkgs []*Package, modVulns moduleVulnerabilities, result *Result) {
 	// analyzedPkgs contains information on packages analyzed thus far.
 	// If a package is mapped to nil, this means it has been visited
 	// but it does not lead to a vulnerable imports. Otherwise, a
 	// visited package is mapped to Imports package node.
 	analyzedPkgs := make(map[*Package]*PkgNode)
 	for _, pkg := range pkgs {
 		// Top level packages that lead to vulnerable imports are
 		// stored as result.Imports graph entry points.
 		if e := vulnImportSlice(pkg, modVulns, result, analyzedPkgs); e != nil {
 			result.Imports.Entries = append(result.Imports.Entries, e)
 		}
 	}

 	// Populate module requires slice as an overlay
 	// of package imports slice.
 	vulnModuleSlice(result)
 }

 // vulnImportSlice checks if pkg has some vulnerabilities or transitively imports
 // a package with known vulnerabilities. If that is the case, populates result.Imports
 // graph with this reachability information and returns the result.Imports package
 // node for pkg. Otherwise, returns nil.
 func vulnImportSlice(pkg *Package, modVulns moduleVulnerabilities, result *Result, analyzed map[*Package]*PkgNode) *PkgNode {
 	if pn, ok := analyzed[pkg]; ok {
 		return pn
 	}
 	analyzed[pkg] = nil
 	// Recursively compute which direct dependencies lead to an import of
 	// a vulnerable package and remember the nodes of such dependencies.
 	var onSlice []*PkgNode
 	for _, imp := range pkg.Imports {
 		if impNode := vulnImportSlice(imp, modVulns, result, analyzed); impNode != nil {
 			onSlice = append(onSlice, impNode)
 		}
 	}

 	// Check if pkg has known vulnerabilities.
 	vulns := modVulns.VulnsForPackage(pkg.PkgPath)

 	// If pkg is not vulnerable nor it transitively leads
 	// to vulnerabilities, jump out.
 	if len(onSlice) == 0 && len(vulns) == 0 {
 		return nil
 	}

 	// Module id gets populated later.
 	id := nextPkgID()
 	pkgNode := &PkgNode{
 		ID:   id,
 		Name: pkg.Name,
 		Path: pkg.PkgPath,
 		pkg:  pkg,
 	}
 	analyzed[pkg] = pkgNode

 	result.Imports.Packages[id] = pkgNode

 	// Save node predecessor information.
 	for _, impSliceNode := range onSlice {
 		impSliceNode.ImportedBy = append(impSliceNode.ImportedBy, id)
 	}

 	// Create Vuln entry for each symbol of known OSV entries for pkg.
 	for _, osv := range vulns {
 		for _, affected := range osv.Affected {
 			if affected.Package.Name != pkgNode.Path {
 				continue
 			}
 			for _, symbol := range affected.EcosystemSpecific.Symbols {
 				vuln := &Vuln{
 					OSV:        osv,
 					Symbol:     symbol,
 					PkgPath:    pkgNode.Path,
 					ImportSink: id,
 				}
 				result.Vulns = append(result.Vulns, vuln)
 			}
 		}
 	}
 	return pkgNode
 }

 // vulnModuleSlice populates result.Requires as an overlay
 // of result.Imports.
 func vulnModuleSlice(result *Result) {
 	// Map from module nodes, identified with their
 	// path and version, to their unique ids.
 	modNodeIDs := make(map[string]int)
 	// We first collect inverse requires by (predecessor)
 	// relation on module node ids.
 	modPredRelation := make(map[int]map[int]bool)
 	for _, pkgNode := range result.Imports.Packages {
 		// Create or get module node for pkgNode.
 		pkgModID := moduleNodeID(pkgNode, result, modNodeIDs)
 		pkgNode.Module = pkgModID

 		// Get the set of predecessors.
 		predSet := make(map[int]bool)
 		for _, predPkgID := range pkgNode.ImportedBy {
 			predModID := moduleNodeID(result.Imports.Packages[predPkgID], result, modNodeIDs)
 			predSet[predModID] = true
 		}
 		modPredRelation[pkgModID] = predSet
 	}

 	// Store the predecessor requires relation to result.
 	for modID := range modPredRelation {
 		if modID == 0 {
 			continue
 		}

 		var predIDs []int
 		for predID := range modPredRelation[modID] {
 			predIDs = append(predIDs, predID)
 		}
 		modNode := result.Requires.Modules[modID]
 		modNode.RequiredBy = predIDs
 	}

 	// And finally update Vulns with module information.
 	for _, vuln := range result.Vulns {
 		pkgNode := result.Imports.Packages[vuln.ImportSink]
 		modNode := result.Requires.Modules[pkgNode.Module]

 		vuln.RequireSink = pkgNode.Module
 		vuln.ModPath = modNode.Path
 	}
 }

 // modID is an id counter for nodes of Requires graph.
 var modID int = 0

 func nextModID() int {
 	modID++
 	return modID
 }

 // moduleNode creates a module node associated with pkgNode, if one does
 // not exist already, and returns id of the module node. The actual module
 // node is stored to result.
 func moduleNodeID(pkgNode *PkgNode, result *Result, modNodeIDs map[string]int) int {
 	mod := pkgNode.pkg.Module
 	if mod == nil {
 		return 0
 	}

 	mk := modKey(mod)
 	if id, ok := modNodeIDs[mk]; ok {
 		return id
 	}

 	id := nextModID()
 	n := &ModNode{
 		ID:      id,
 		Path:    mod.Path,
 		Version: mod.Version,
 	}
 	result.Requires.Modules[id] = n
 	modNodeIDs[mk] = id

 	// Create a replace module too when applicable.
 	if mod.Replace != nil {
 		rmk := modKey(mod.Replace)
 		if rid, ok := modNodeIDs[rmk]; ok {
 			n.Replace = rid
 		} else {
 			rid := nextModID()
 			rn := &ModNode{
 				Path:    mod.Replace.Path,
 				Version: mod.Replace.Version,
 			}
 			result.Requires.Modules[rid] = rn
 			modNodeIDs[rmk] = rid
 			n.Replace = rid
 		}
 	}
 	return id
 }

 func vulnCallGraphSlice(entries []*ssa.Function, modVulns moduleVulnerabilities, cg *callgraph.Graph, result *Result) {
 	// analyzedFuncs contains information on functions analyzed thus far.
 	// If a function is mapped to nil, this means it has been visited
 	// but it does not lead to a vulnerable call. Otherwise, a visited
 	// function is mapped to Calls function node.
 	analyzedFuncs := make(map[*ssa.Function]*FuncNode)
 	for _, entry := range entries {
 		// Top level entries that lead to vulnerable calls
 		// are stored as result.Calls graph entry points.
 		if e := vulnCallSlice(entry, modVulns, cg, result, analyzedFuncs); e != nil {
 			result.Calls.Entries = append(result.Calls.Entries, e)
 		}
 	}
 }

 // funID is an id counter for nodes of Calls graph.
 var funID int = 0

 func nextFunID() int {
 	funID++
 	return funID
 }

 // vulnCallSlice checks if f has some vulnerabilities or transitively calls
 // a function with known vulnerabilities. If so, populates result.Calls
 // graph with this reachability information and returns the result.Call
 // function node. Otherwise, returns nil.
 func vulnCallSlice(f *ssa.Function, modVulns moduleVulnerabilities, cg *callgraph.Graph, result *Result, analyzed map[*ssa.Function]*FuncNode) *FuncNode {
 	if fn, ok := analyzed[f]; ok {
 		return fn
 	}

 	fn := cg.Nodes[f]
 	if fn == nil {
 		return nil
 	}

 	// Check if f has known vulnerabilities.
 	vulns := modVulns.VulnsForSymbol(f.Package().Pkg.Path(), dbFuncName(f))

 	var funNode *FuncNode
 	// If there are vulnerabilities for f, create node for f and
 	// save it immediatelly. This allows us to include F in the
 	// slice when analyzing chain V -> F -> V where V is vulnerable.
 	if len(vulns) > 0 {
 		funNode = funcNode(f)
 	}
 	analyzed[f] = funNode

 	// Recursively compute which callees lead to a call of a
 	// vulnerable function. Remember the nodes of such callees.
 	type siteNode struct {
 		call ssa.CallInstruction
 		fn   *FuncNode
 	}
 	var onSlice []siteNode
 	for _, edge := range fn.Out {
 		if calleeNode := vulnCallSlice(edge.Callee.Func, modVulns, cg, result, analyzed); calleeNode != nil {
 			onSlice = append(onSlice, siteNode{call: edge.Site, fn: calleeNode})
 		}
 	}

 	// If f is not vulnerable nor it transitively leads
 	// to vulnerable calls, jump out.
 	if len(onSlice) == 0 && len(vulns) == 0 {
 		return nil
 	}

 	// If f is not vulnerable, then at this point it has
 	// to be on the path leading to a vulnerable call.
 	if funNode == nil {
 		funNode = funcNode(f)
 		analyzed[f] = funNode
 	}
 	result.Calls.Funcs[funNode.ID] = funNode

 	// Save node predecessor information.
 	for _, calleeSliceInfo := range onSlice {
 		call, node := calleeSliceInfo.call, calleeSliceInfo.fn
 		cs := &CallSite{
 			Parent:   funNode.ID,
 			Name:     call.Common().Value.Name(),
 			RecvType: callRecvType(call),
 			Resolved: resolved(call),
 			Pos:      instrPosition(call),
 		}
 		node.CallSites = append(node.CallSites, cs)
 	}

 	// Populate CallSink field for each detected vuln symbol.
 	for _, osv := range vulns {
 		for _, affected := range osv.Affected {
 			if affected.Package.Name != funNode.PkgPath {
 				continue
 			}
 			for _, symbol := range affected.EcosystemSpecific.Symbols {
 				addCallSinkForVuln(funNode.ID, osv, symbol, funNode.PkgPath, result)
 			}
 		}
 	}
 	return funNode
 }

 func funcNode(f *ssa.Function) *FuncNode {
 	id := nextFunID()
 	return &FuncNode{
 		ID:       id,
 		Name:     f.Name(),
 		PkgPath:  f.Package().Pkg.Path(),
 		RecvType: funcRecvType(f),
 		Pos:      funcPosition(f),
 	}
 }

 // addCallSinkForVuln adds callID as call sink to vuln of result.Vulns
 // identified with <osv, symbol, pkg>.
 func addCallSinkForVuln(callID int, osv *osv.Entry, symbol, pkg string, result *Result) {
 	for _, vuln := range result.Vulns {
 		if vuln.OSV == osv && vuln.Symbol == symbol && vuln.PkgPath == pkg {
 			vuln.CallSink = callID
 			return
 		}
 	}
 }
	// Copyright 2021 The Go Authors. All rights reserved.
	// Use of this source code is governed by a BSD-style
	// license that can be found in the LICENSE file.

	package vulncheck

	import (
	"golang.org/x/tools/go/callgraph"
	"golang.org/x/tools/go/ssa"
	"golang.org/x/vulndb/osv"
	)

	// Source detects vulnerabilities in pkgs and computes slices of
	// - imports graph related to an import of a package with some
	// known vulnerabilities
	// - requires graph related to a require of a module with a
	// package that has some known vulnerabilities
	// - call graph leading to the use of a known vulnerable function
	// or method
	func Source(pkgs []Package, cfg Config) (*Result, error) {
	modVulns, err := fetchVulnerabilities(cfg.Client, extractModules(pkgs))
	if err != nil {
	return nil, err
	}

	result := &Result{
	Imports: &ImportGraph{Packages: make(map[int]*PkgNode)},
	Requires: &RequireGraph{Modules: make(map[int]*ModNode)},
	Calls: &CallGraph{Funcs: make(map[int]*FuncNode)},
	}

	vulnPkgModSlice(pkgs, modVulns, result)

	if cfg.ImportsOnly {
	return result, nil
	}

	prog, ssaPkgs := buildSSA(pkgs)
	entries := entryPoints(ssaPkgs)
	cg := callGraph(prog, entries)
	vulnCallGraphSlice(entries, modVulns, cg, result)

	return result, nil
	}

	// pkgID is an id counter for nodes of Imports graph.
	var pkgID int = 0

	func nextPkgID() int {
	pkgID++
	return pkgID
	}

	// vulnPkgModSlice computes the slice of pkgs imports and requires graph
	// leading to imports/requires of vulnerable packages/modules in modVulns
	// and stores the computed slices to result.
	func vulnPkgModSlice(pkgs []Package, modVulns moduleVulnerabilities, result Result) {
	// analyzedPkgs contains information on packages analyzed thus far.
	// If a package is mapped to nil, this means it has been visited
	// but it does not lead to a vulnerable imports. Otherwise, a
	// visited package is mapped to Imports package node.
	analyzedPkgs := make(map[Package]PkgNode)
	for _, pkg := range pkgs {
	// Top level packages that lead to vulnerable imports are
	// stored as result.Imports graph entry points.
	if e := vulnImportSlice(pkg, modVulns, result, analyzedPkgs); e != nil {
	result.Imports.Entries = append(result.Imports.Entries, e)
	}
	}

	// Populate module requires slice as an overlay
	// of package imports slice.
	vulnModuleSlice(result)
	}

	// vulnImportSlice checks if pkg has some vulnerabilities or transitively imports
	// a package with known vulnerabilities. If that is the case, populates result.Imports
	// graph with this reachability information and returns the result.Imports package
	// node for pkg. Otherwise, returns nil.
	func vulnImportSlice(pkg Package, modVulns moduleVulnerabilities, result Result, analyzed map[Package]PkgNode) *PkgNode {
	if pn, ok := analyzed[pkg]; ok {
	return pn
	}
	analyzed[pkg] = nil
	// Recursively compute which direct dependencies lead to an import of
	// a vulnerable package and remember the nodes of such dependencies.
	var onSlice []*PkgNode
	for _, imp := range pkg.Imports {
	if impNode := vulnImportSlice(imp, modVulns, result, analyzed); impNode != nil {
	onSlice = append(onSlice, impNode)
	}
	}

	// Check if pkg has known vulnerabilities.
	vulns := modVulns.VulnsForPackage(pkg.PkgPath)

	// If pkg is not vulnerable nor it transitively leads
	// to vulnerabilities, jump out.
	if len(onSlice) == 0 && len(vulns) == 0 {
	return nil
	}

	// Module id gets populated later.
	id := nextPkgID()
	pkgNode := &PkgNode{
	ID: id,
	Name: pkg.Name,
	Path: pkg.PkgPath,
	pkg: pkg,
	}
	analyzed[pkg] = pkgNode

	result.Imports.Packages[id] = pkgNode

	// Save node predecessor information.
	for _, impSliceNode := range onSlice {
	impSliceNode.ImportedBy = append(impSliceNode.ImportedBy, id)
	}

	// Create Vuln entry for each symbol of known OSV entries for pkg.
	for _, osv := range vulns {
	for _, affected := range osv.Affected {
	if affected.Package.Name != pkgNode.Path {
	continue
	}
	for _, symbol := range affected.EcosystemSpecific.Symbols {
	vuln := &Vuln{
	OSV: osv,
	Symbol: symbol,
	PkgPath: pkgNode.Path,
	ImportSink: id,
	}
	result.Vulns = append(result.Vulns, vuln)
	}
	}
	}
	return pkgNode
	}

	// vulnModuleSlice populates result.Requires as an overlay
	// of result.Imports.
	func vulnModuleSlice(result *Result) {
	// Map from module nodes, identified with their
	// path and version, to their unique ids.
	modNodeIDs := make(map[string]int)
	// We first collect inverse requires by (predecessor)
	// relation on module node ids.
	modPredRelation := make(map[int]map[int]bool)
	for _, pkgNode := range result.Imports.Packages {
	// Create or get module node for pkgNode.
	pkgModID := moduleNodeID(pkgNode, result, modNodeIDs)
	pkgNode.Module = pkgModID

	// Get the set of predecessors.
	predSet := make(map[int]bool)
	for _, predPkgID := range pkgNode.ImportedBy {
	predModID := moduleNodeID(result.Imports.Packages[predPkgID], result, modNodeIDs)
	predSet[predModID] = true
	}
	modPredRelation[pkgModID] = predSet
	}

	// Store the predecessor requires relation to result.
	for modID := range modPredRelation {
	if modID == 0 {
	continue
	}

	var predIDs []int
	for predID := range modPredRelation[modID] {
	predIDs = append(predIDs, predID)
	}
	modNode := result.Requires.Modules[modID]
	modNode.RequiredBy = predIDs
	}

	// And finally update Vulns with module information.
	for _, vuln := range result.Vulns {
	pkgNode := result.Imports.Packages[vuln.ImportSink]
	modNode := result.Requires.Modules[pkgNode.Module]

	vuln.RequireSink = pkgNode.Module
	vuln.ModPath = modNode.Path
	}
	}

	// modID is an id counter for nodes of Requires graph.
	var modID int = 0

	func nextModID() int {
	modID++
	return modID
	}

	// moduleNode creates a module node associated with pkgNode, if one does
	// not exist already, and returns id of the module node. The actual module
	// node is stored to result.
	func moduleNodeID(pkgNode PkgNode, result Result, modNodeIDs map[string]int) int {
	mod := pkgNode.pkg.Module
	if mod == nil {
	return 0
	}

	mk := modKey(mod)
	if id, ok := modNodeIDs[mk]; ok {
	return id
	}

	id := nextModID()
	n := &ModNode{
	ID: id,
	Path: mod.Path,
	Version: mod.Version,
	}
	result.Requires.Modules[id] = n
	modNodeIDs[mk] = id

	// Create a replace module too when applicable.
	if mod.Replace != nil {
	rmk := modKey(mod.Replace)
	if rid, ok := modNodeIDs[rmk]; ok {
	n.Replace = rid
	} else {
	rid := nextModID()
	rn := &ModNode{
	Path: mod.Replace.Path,
	Version: mod.Replace.Version,
	}
	result.Requires.Modules[rid] = rn
	modNodeIDs[rmk] = rid
	n.Replace = rid
	}
	}
	return id
	}

	func vulnCallGraphSlice(entries []ssa.Function, modVulns moduleVulnerabilities, cg callgraph.Graph, result *Result) {
	// analyzedFuncs contains information on functions analyzed thus far.
	// If a function is mapped to nil, this means it has been visited
	// but it does not lead to a vulnerable call. Otherwise, a visited
	// function is mapped to Calls function node.
	analyzedFuncs := make(map[ssa.Function]FuncNode)
	for _, entry := range entries {
	// Top level entries that lead to vulnerable calls
	// are stored as result.Calls graph entry points.
	if e := vulnCallSlice(entry, modVulns, cg, result, analyzedFuncs); e != nil {
	result.Calls.Entries = append(result.Calls.Entries, e)
	}
	}
	}

	// funID is an id counter for nodes of Calls graph.
	var funID int = 0

	func nextFunID() int {
	funID++
	return funID
	}

	// vulnCallSlice checks if f has some vulnerabilities or transitively calls
	// a function with known vulnerabilities. If so, populates result.Calls
	// graph with this reachability information and returns the result.Call
	// function node. Otherwise, returns nil.
	func vulnCallSlice(f ssa.Function, modVulns moduleVulnerabilities, cg callgraph.Graph, result Result, analyzed map[ssa.Function]FuncNode) FuncNode {
	if fn, ok := analyzed[f]; ok {
	return fn
	}

	fn := cg.Nodes[f]
	if fn == nil {
	return nil
	}

	// Check if f has known vulnerabilities.
	vulns := modVulns.VulnsForSymbol(f.Package().Pkg.Path(), dbFuncName(f))

	var funNode *FuncNode
	// If there are vulnerabilities for f, create node for f and
	// save it immediatelly. This allows us to include F in the
	// slice when analyzing chain V -> F -> V where V is vulnerable.
	if len(vulns) > 0 {
	funNode = funcNode(f)
	}
	analyzed[f] = funNode

	// Recursively compute which callees lead to a call of a
	// vulnerable function. Remember the nodes of such callees.
	type siteNode struct {
	call ssa.CallInstruction
	fn *FuncNode
	}
	var onSlice []siteNode
	for _, edge := range fn.Out {
	if calleeNode := vulnCallSlice(edge.Callee.Func, modVulns, cg, result, analyzed); calleeNode != nil {
	onSlice = append(onSlice, siteNode{call: edge.Site, fn: calleeNode})
	}
	}

	// If f is not vulnerable nor it transitively leads
	// to vulnerable calls, jump out.
	if len(onSlice) == 0 && len(vulns) == 0 {
	return nil
	}

	// If f is not vulnerable, then at this point it has
	// to be on the path leading to a vulnerable call.
	if funNode == nil {
	funNode = funcNode(f)
	analyzed[f] = funNode
	}
	result.Calls.Funcs[funNode.ID] = funNode

	// Save node predecessor information.
	for _, calleeSliceInfo := range onSlice {
	call, node := calleeSliceInfo.call, calleeSliceInfo.fn
	cs := &CallSite{
	Parent: funNode.ID,
	Name: call.Common().Value.Name(),
	RecvType: callRecvType(call),
	Resolved: resolved(call),
	Pos: instrPosition(call),
	}
	node.CallSites = append(node.CallSites, cs)
	}

	// Populate CallSink field for each detected vuln symbol.
	for _, osv := range vulns {
	for _, affected := range osv.Affected {
	if affected.Package.Name != funNode.PkgPath {
	continue
	}
	for _, symbol := range affected.EcosystemSpecific.Symbols {
	addCallSinkForVuln(funNode.ID, osv, symbol, funNode.PkgPath, result)
	}
	}
	}
	return funNode
	}

	func funcNode(f ssa.Function) FuncNode {
	id := nextFunID()
	return &FuncNode{
	ID: id,
	Name: f.Name(),
	PkgPath: f.Package().Pkg.Path(),
	RecvType: funcRecvType(f),
	Pos: funcPosition(f),
	}
	}

	// addCallSinkForVuln adds callID as call sink to vuln of result.Vulns
	// identified with <osv, symbol, pkg>.
	func addCallSinkForVuln(callID int, osv osv.Entry, symbol, pkg string, result Result) {
	for _, vuln := range result.Vulns {
	if vuln.OSV == osv && vuln.Symbol == symbol && vuln.PkgPath == pkg {
	vuln.CallSink = callID
	return
	}
	}
	}