refactor/eg/eg.go - tools - Git at Google

 // Copyright 2014 The Go Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.

 // Package eg implements the example-based refactoring tool whose
 // command-line is defined in golang.org/x/tools/cmd/eg.
 package eg // import "golang.org/x/tools/refactor/eg"

 import (
 	"bytes"
 	"fmt"
 	"go/ast"
 	"go/format"
 	"go/printer"
 	"go/token"
 	"go/types"
 	"os"
 )

 const Help = `
 This tool implements example-based refactoring of expressions.

 The transformation is specified as a Go file defining two functions,
 'before' and 'after', of identical types.  Each function body consists
 of a single statement: either a return statement with a single
 (possibly multi-valued) expression, or an expression statement.  The
 'before' expression specifies a pattern and the 'after' expression its
 replacement.

 	package P
  	import ( "errors"; "fmt" )
  	func before(s string) error { return fmt.Errorf("%s", s) }
  	func after(s string)  error { return errors.New(s) }

 The expression statement form is useful when the expression has no
 result, for example:

  	func before(msg string) { log.Fatalf("%s", msg) }
  	func after(msg string)  { log.Fatal(msg) }

 The parameters of both functions are wildcards that may match any
 expression assignable to that type.  If the pattern contains multiple
 occurrences of the same parameter, each must match the same expression
 in the input for the pattern to match.  If the replacement contains
 multiple occurrences of the same parameter, the expression will be
 duplicated, possibly changing the side-effects.

 The tool analyses all Go code in the packages specified by the
 arguments, replacing all occurrences of the pattern with the
 substitution.

 So, the transform above would change this input:
 	err := fmt.Errorf("%s", "error: " + msg)
 to this output:
 	err := errors.New("error: " + msg)

 Identifiers, including qualified identifiers (p.X) are considered to
 match only if they denote the same object.  This allows correct
 matching even in the presence of dot imports, named imports and
 locally shadowed package names in the input program.

 Matching of type syntax is semantic, not syntactic: type syntax in the
 pattern matches type syntax in the input if the types are identical.
 Thus, func(x int) matches func(y int).

 This tool was inspired by other example-based refactoring tools,
 'gofmt -r' for Go and Refaster for Java.


 LIMITATIONS
 ===========

 EXPRESSIVENESS

 Only refactorings that replace one expression with another, regardless
 of the expression's context, may be expressed.  Refactoring arbitrary
 statements (or sequences of statements) is a less well-defined problem
 and is less amenable to this approach.

 A pattern that contains a function literal (and hence statements)
 never matches.

 There is no way to generalize over related types, e.g. to express that
 a wildcard may have any integer type, for example.

 It is not possible to replace an expression by one of a different
 type, even in contexts where this is legal, such as x in fmt.Print(x).

 The struct literals T{x} and T{K: x} cannot both be matched by a single
 template.


 SAFETY

 Verifying that a transformation does not introduce type errors is very
 complex in the general case.  An innocuous-looking replacement of one
 constant by another (e.g. 1 to 2) may cause type errors relating to
 array types and indices, for example.  The tool performs only very
 superficial checks of type preservation.


 IMPORTS

 Although the matching algorithm is fully aware of scoping rules, the
 replacement algorithm is not, so the replacement code may contain
 incorrect identifier syntax for imported objects if there are dot
 imports, named imports or locally shadowed package names in the input
 program.

 Imports are added as needed, but they are not removed as needed.
 Run 'goimports' on the modified file for now.

 Dot imports are forbidden in the template.


 TIPS
 ====

 Sometimes a little creativity is required to implement the desired
 migration.  This section lists a few tips and tricks.

 To remove the final parameter from a function, temporarily change the
 function signature so that the final parameter is variadic, as this
 allows legal calls both with and without the argument.  Then use eg to
 remove the final argument from all callers, and remove the variadic
 parameter by hand.  The reverse process can be used to add a final
 parameter.

 To add or remove parameters other than the final one, you must do it in
 stages: (1) declare a variant function f' with a different name and the
 desired parameters; (2) use eg to transform calls to f into calls to f',
 changing the arguments as needed; (3) change the declaration of f to
 match f'; (4) use eg to rename f' to f in all calls; (5) delete f'.
 `

 // TODO(adonovan): expand upon the above documentation as an HTML page.

 // A Transformer represents a single example-based transformation.
 type Transformer struct {
 	fset           *token.FileSet
 	verbose        bool
 	info           *types.Info // combined type info for template/input/output ASTs
 	seenInfos      map[*types.Info]bool
 	wildcards      map[*types.Var]bool                // set of parameters in func before()
 	env            map[string]ast.Expr                // maps parameter name to wildcard binding
 	importedObjs   map[types.Object]*ast.SelectorExpr // objects imported by after().
 	before, after  ast.Expr
 	afterStmts     []ast.Stmt
 	allowWildcards bool

 	// Working state of Transform():
 	nsubsts    int            // number of substitutions made
 	currentPkg *types.Package // package of current call
 }

 // NewTransformer returns a transformer based on the specified template,
 // a single-file package containing "before" and "after" functions as
 // described in the package documentation.
 // tmplInfo is the type information for tmplFile.
 func NewTransformer(fset *token.FileSet, tmplPkg *types.Package, tmplFile *ast.File, tmplInfo *types.Info, verbose bool) (*Transformer, error) {
 	// Check the template.
 	beforeSig := funcSig(tmplPkg, "before")
 	if beforeSig == nil {
 		return nil, fmt.Errorf("no 'before' func found in template")
 	}
 	afterSig := funcSig(tmplPkg, "after")
 	if afterSig == nil {
 		return nil, fmt.Errorf("no 'after' func found in template")
 	}

 	// TODO(adonovan): should we also check the names of the params match?
 	if !types.Identical(afterSig, beforeSig) {
 		return nil, fmt.Errorf("before %s and after %s functions have different signatures",
 			beforeSig, afterSig)
 	}

 	for _, imp := range tmplFile.Imports {
 		if imp.Name != nil && imp.Name.Name == "." {
 			// Dot imports are currently forbidden.  We
 			// make the simplifying assumption that all
 			// imports are regular, without local renames.
 			return nil, fmt.Errorf("dot-import (of %s) in template", imp.Path.Value)
 		}
 	}
 	var beforeDecl, afterDecl *ast.FuncDecl
 	for _, decl := range tmplFile.Decls {
 		if decl, ok := decl.(*ast.FuncDecl); ok {
 			switch decl.Name.Name {
 			case "before":
 				beforeDecl = decl
 			case "after":
 				afterDecl = decl
 			}
 		}
 	}

 	before, err := soleExpr(beforeDecl)
 	if err != nil {
 		return nil, fmt.Errorf("before: %s", err)
 	}
 	afterStmts, after, err := stmtAndExpr(afterDecl)
 	if err != nil {
 		return nil, fmt.Errorf("after: %s", err)
 	}

 	wildcards := make(map[*types.Var]bool)
 	for i := 0; i < beforeSig.Params().Len(); i++ {
 		wildcards[beforeSig.Params().At(i)] = true
 	}

 	// checkExprTypes returns an error if Tb (type of before()) is not
 	// safe to replace with Ta (type of after()).
 	//
 	// Only superficial checks are performed, and they may result in both
 	// false positives and negatives.
 	//
 	// Ideally, we would only require that the replacement be assignable
 	// to the context of a specific pattern occurrence, but the type
 	// checker doesn't record that information and it's complex to deduce.
 	// A Go type cannot capture all the constraints of a given expression
 	// context, which may include the size, constness, signedness,
 	// namedness or constructor of its type, and even the specific value
 	// of the replacement.  (Consider the rule that array literal keys
 	// must be unique.)  So we cannot hope to prove the safety of a
 	// transformation in general.
 	Tb := tmplInfo.TypeOf(before)
 	Ta := tmplInfo.TypeOf(after)
 	if types.AssignableTo(Tb, Ta) {
 		// safe: replacement is assignable to pattern.
 	} else if tuple, ok := Tb.(*types.Tuple); ok && tuple.Len() == 0 {
 		// safe: pattern has void type (must appear in an ExprStmt).
 	} else {
 		return nil, fmt.Errorf("%s is not a safe replacement for %s", Ta, Tb)
 	}

 	tr := &Transformer{
 		fset:           fset,
 		verbose:        verbose,
 		wildcards:      wildcards,
 		allowWildcards: true,
 		seenInfos:      make(map[*types.Info]bool),
 		importedObjs:   make(map[types.Object]*ast.SelectorExpr),
 		before:         before,
 		after:          after,
 		afterStmts:     afterStmts,
 	}

 	// Combine type info from the template and input packages, and
 	// type info for the synthesized ASTs too.  This saves us
 	// having to book-keep where each ast.Node originated as we
 	// construct the resulting hybrid AST.
 	tr.info = &types.Info{
 		Types:      make(map[ast.Expr]types.TypeAndValue),
 		Defs:       make(map[*ast.Ident]types.Object),
 		Uses:       make(map[*ast.Ident]types.Object),
 		Selections: make(map[*ast.SelectorExpr]*types.Selection),
 	}
 	mergeTypeInfo(tr.info, tmplInfo)

 	// Compute set of imported objects required by after().
 	// TODO(adonovan): reject dot-imports in pattern
 	ast.Inspect(after, func(n ast.Node) bool {
 		if n, ok := n.(*ast.SelectorExpr); ok {
 			if _, ok := tr.info.Selections[n]; !ok {
 				// qualified ident
 				obj := tr.info.Uses[n.Sel]
 				tr.importedObjs[obj] = n
 				return false // prune
 			}
 		}
 		return true // recur
 	})

 	return tr, nil
 }

 // WriteAST is a convenience function that writes AST f to the specified file.
 func WriteAST(fset *token.FileSet, filename string, f *ast.File) (err error) {
 	fh, err := os.Create(filename)
 	if err != nil {
 		return err
 	}

 	defer func() {
 		if err2 := fh.Close(); err != nil {
 			err = err2 // prefer earlier error
 		}
 	}()
 	return format.Node(fh, fset, f)
 }

 // -- utilities --------------------------------------------------------

 // funcSig returns the signature of the specified package-level function.
 func funcSig(pkg *types.Package, name string) *types.Signature {
 	if f, ok := pkg.Scope().Lookup(name).(*types.Func); ok {
 		return f.Type().(*types.Signature)
 	}
 	return nil
 }

 // soleExpr returns the sole expression in the before/after template function.
 func soleExpr(fn *ast.FuncDecl) (ast.Expr, error) {
 	if fn.Body == nil {
 		return nil, fmt.Errorf("no body")
 	}
 	if len(fn.Body.List) != 1 {
 		return nil, fmt.Errorf("must contain a single statement")
 	}
 	switch stmt := fn.Body.List[0].(type) {
 	case *ast.ReturnStmt:
 		if len(stmt.Results) != 1 {
 			return nil, fmt.Errorf("return statement must have a single operand")
 		}
 		return stmt.Results[0], nil

 	case *ast.ExprStmt:
 		return stmt.X, nil
 	}

 	return nil, fmt.Errorf("must contain a single return or expression statement")
 }

 // stmtAndExpr returns the expression in the last return statement as well as the preceding lines.
 func stmtAndExpr(fn *ast.FuncDecl) ([]ast.Stmt, ast.Expr, error) {
 	if fn.Body == nil {
 		return nil, nil, fmt.Errorf("no body")
 	}

 	n := len(fn.Body.List)
 	if n == 0 {
 		return nil, nil, fmt.Errorf("must contain at least one statement")
 	}

 	stmts, last := fn.Body.List[:n-1], fn.Body.List[n-1]

 	switch last := last.(type) {
 	case *ast.ReturnStmt:
 		if len(last.Results) != 1 {
 			return nil, nil, fmt.Errorf("return statement must have a single operand")
 		}
 		return stmts, last.Results[0], nil

 	case *ast.ExprStmt:
 		return stmts, last.X, nil
 	}

 	return nil, nil, fmt.Errorf("must end with a single return or expression statement")
 }

 // mergeTypeInfo adds type info from src to dst.
 func mergeTypeInfo(dst, src *types.Info) {
 	for k, v := range src.Types {
 		dst.Types[k] = v
 	}
 	for k, v := range src.Defs {
 		dst.Defs[k] = v
 	}
 	for k, v := range src.Uses {
 		dst.Uses[k] = v
 	}
 	for k, v := range src.Selections {
 		dst.Selections[k] = v
 	}
 }

 // (debugging only)
 func astString(fset *token.FileSet, n ast.Node) string {
 	var buf bytes.Buffer
 	printer.Fprint(&buf, fset, n)
 	return buf.String()
 }
	// Copyright 2014 The Go Authors. All rights reserved.
	// Use of this source code is governed by a BSD-style
	// license that can be found in the LICENSE file.

	// Package eg implements the example-based refactoring tool whose
	// command-line is defined in golang.org/x/tools/cmd/eg.
	package eg // import "golang.org/x/tools/refactor/eg"

	import (
	"bytes"
	"fmt"
	"go/ast"
	"go/format"
	"go/printer"
	"go/token"
	"go/types"
	"os"
	)

	const Help = `
	This tool implements example-based refactoring of expressions.

	The transformation is specified as a Go file defining two functions,
	'before' and 'after', of identical types. Each function body consists
	of a single statement: either a return statement with a single
	(possibly multi-valued) expression, or an expression statement. The
	'before' expression specifies a pattern and the 'after' expression its
	replacement.

	package P
	import ( "errors"; "fmt" )
	func before(s string) error { return fmt.Errorf("%s", s) }
	func after(s string) error { return errors.New(s) }

	The expression statement form is useful when the expression has no
	result, for example:

	func before(msg string) { log.Fatalf("%s", msg) }
	func after(msg string) { log.Fatal(msg) }

	The parameters of both functions are wildcards that may match any
	expression assignable to that type. If the pattern contains multiple
	occurrences of the same parameter, each must match the same expression
	in the input for the pattern to match. If the replacement contains
	multiple occurrences of the same parameter, the expression will be
	duplicated, possibly changing the side-effects.

	The tool analyses all Go code in the packages specified by the
	arguments, replacing all occurrences of the pattern with the
	substitution.

	So, the transform above would change this input:
	err := fmt.Errorf("%s", "error: " + msg)
	to this output:
	err := errors.New("error: " + msg)

	Identifiers, including qualified identifiers (p.X) are considered to
	match only if they denote the same object. This allows correct
	matching even in the presence of dot imports, named imports and
	locally shadowed package names in the input program.

	Matching of type syntax is semantic, not syntactic: type syntax in the
	pattern matches type syntax in the input if the types are identical.
	Thus, func(x int) matches func(y int).

	This tool was inspired by other example-based refactoring tools,
	'gofmt -r' for Go and Refaster for Java.


	LIMITATIONS
	===========

	EXPRESSIVENESS

	Only refactorings that replace one expression with another, regardless
	of the expression's context, may be expressed. Refactoring arbitrary
	statements (or sequences of statements) is a less well-defined problem
	and is less amenable to this approach.

	A pattern that contains a function literal (and hence statements)
	never matches.

	There is no way to generalize over related types, e.g. to express that
	a wildcard may have any integer type, for example.

	It is not possible to replace an expression by one of a different
	type, even in contexts where this is legal, such as x in fmt.Print(x).

	The struct literals T{x} and T{K: x} cannot both be matched by a single
	template.


	SAFETY

	Verifying that a transformation does not introduce type errors is very
	complex in the general case. An innocuous-looking replacement of one
	constant by another (e.g. 1 to 2) may cause type errors relating to
	array types and indices, for example. The tool performs only very
	superficial checks of type preservation.


	IMPORTS

	Although the matching algorithm is fully aware of scoping rules, the
	replacement algorithm is not, so the replacement code may contain
	incorrect identifier syntax for imported objects if there are dot
	imports, named imports or locally shadowed package names in the input
	program.

	Imports are added as needed, but they are not removed as needed.
	Run 'goimports' on the modified file for now.

	Dot imports are forbidden in the template.


	TIPS
	====

	Sometimes a little creativity is required to implement the desired
	migration. This section lists a few tips and tricks.

	To remove the final parameter from a function, temporarily change the
	function signature so that the final parameter is variadic, as this
	allows legal calls both with and without the argument. Then use eg to
	remove the final argument from all callers, and remove the variadic
	parameter by hand. The reverse process can be used to add a final
	parameter.

	To add or remove parameters other than the final one, you must do it in
	stages: (1) declare a variant function f' with a different name and the
	desired parameters; (2) use eg to transform calls to f into calls to f',
	changing the arguments as needed; (3) change the declaration of f to
	match f'; (4) use eg to rename f' to f in all calls; (5) delete f'.
	`

	// TODO(adonovan): expand upon the above documentation as an HTML page.

	// A Transformer represents a single example-based transformation.
	type Transformer struct {
	fset *token.FileSet
	verbose bool
	info *types.Info // combined type info for template/input/output ASTs
	seenInfos map[*types.Info]bool
	wildcards map[*types.Var]bool // set of parameters in func before()
	env map[string]ast.Expr // maps parameter name to wildcard binding
	importedObjs map[types.Object]*ast.SelectorExpr // objects imported by after().
	before, after ast.Expr
	afterStmts []ast.Stmt
	allowWildcards bool

	// Working state of Transform():
	nsubsts int // number of substitutions made
	currentPkg *types.Package // package of current call
	}

	// NewTransformer returns a transformer based on the specified template,
	// a single-file package containing "before" and "after" functions as
	// described in the package documentation.
	// tmplInfo is the type information for tmplFile.
	func NewTransformer(fset token.FileSet, tmplPkg types.Package, tmplFile ast.File, tmplInfo types.Info, verbose bool) (*Transformer, error) {
	// Check the template.
	beforeSig := funcSig(tmplPkg, "before")
	if beforeSig == nil {
	return nil, fmt.Errorf("no 'before' func found in template")
	}
	afterSig := funcSig(tmplPkg, "after")
	if afterSig == nil {
	return nil, fmt.Errorf("no 'after' func found in template")
	}

	// TODO(adonovan): should we also check the names of the params match?
	if !types.Identical(afterSig, beforeSig) {
	return nil, fmt.Errorf("before %s and after %s functions have different signatures",
	beforeSig, afterSig)
	}

	for _, imp := range tmplFile.Imports {
	if imp.Name != nil && imp.Name.Name == "." {
	// Dot imports are currently forbidden. We
	// make the simplifying assumption that all
	// imports are regular, without local renames.
	return nil, fmt.Errorf("dot-import (of %s) in template", imp.Path.Value)
	}
	}
	var beforeDecl, afterDecl *ast.FuncDecl
	for _, decl := range tmplFile.Decls {
	if decl, ok := decl.(*ast.FuncDecl); ok {
	switch decl.Name.Name {
	case "before":
	beforeDecl = decl
	case "after":
	afterDecl = decl
	}
	}
	}

	before, err := soleExpr(beforeDecl)
	if err != nil {
	return nil, fmt.Errorf("before: %s", err)
	}
	afterStmts, after, err := stmtAndExpr(afterDecl)
	if err != nil {
	return nil, fmt.Errorf("after: %s", err)
	}

	wildcards := make(map[*types.Var]bool)
	for i := 0; i < beforeSig.Params().Len(); i++ {
	wildcards[beforeSig.Params().At(i)] = true
	}

	// checkExprTypes returns an error if Tb (type of before()) is not
	// safe to replace with Ta (type of after()).
	//
	// Only superficial checks are performed, and they may result in both
	// false positives and negatives.
	//
	// Ideally, we would only require that the replacement be assignable
	// to the context of a specific pattern occurrence, but the type
	// checker doesn't record that information and it's complex to deduce.
	// A Go type cannot capture all the constraints of a given expression
	// context, which may include the size, constness, signedness,
	// namedness or constructor of its type, and even the specific value
	// of the replacement. (Consider the rule that array literal keys
	// must be unique.) So we cannot hope to prove the safety of a
	// transformation in general.
	Tb := tmplInfo.TypeOf(before)
	Ta := tmplInfo.TypeOf(after)
	if types.AssignableTo(Tb, Ta) {
	// safe: replacement is assignable to pattern.
	} else if tuple, ok := Tb.(*types.Tuple); ok && tuple.Len() == 0 {
	// safe: pattern has void type (must appear in an ExprStmt).
	} else {
	return nil, fmt.Errorf("%s is not a safe replacement for %s", Ta, Tb)
	}

	tr := &Transformer{
	fset: fset,
	verbose: verbose,
	wildcards: wildcards,
	allowWildcards: true,
	seenInfos: make(map[*types.Info]bool),
	importedObjs: make(map[types.Object]*ast.SelectorExpr),
	before: before,
	after: after,
	afterStmts: afterStmts,
	}

	// Combine type info from the template and input packages, and
	// type info for the synthesized ASTs too. This saves us
	// having to book-keep where each ast.Node originated as we
	// construct the resulting hybrid AST.
	tr.info = &types.Info{
	Types: make(map[ast.Expr]types.TypeAndValue),
	Defs: make(map[*ast.Ident]types.Object),
	Uses: make(map[*ast.Ident]types.Object),
	Selections: make(map[ast.SelectorExpr]types.Selection),
	}
	mergeTypeInfo(tr.info, tmplInfo)

	// Compute set of imported objects required by after().
	// TODO(adonovan): reject dot-imports in pattern
	ast.Inspect(after, func(n ast.Node) bool {
	if n, ok := n.(*ast.SelectorExpr); ok {
	if _, ok := tr.info.Selections[n]; !ok {
	// qualified ident
	obj := tr.info.Uses[n.Sel]
	tr.importedObjs[obj] = n
	return false // prune
	}
	}
	return true // recur
	})

	return tr, nil
	}

	// WriteAST is a convenience function that writes AST f to the specified file.
	func WriteAST(fset token.FileSet, filename string, f ast.File) (err error) {
	fh, err := os.Create(filename)
	if err != nil {
	return err
	}

	defer func() {
	if err2 := fh.Close(); err != nil {
	err = err2 // prefer earlier error
	}
	}()
	return format.Node(fh, fset, f)
	}

	// -- utilities --------------------------------------------------------

	// funcSig returns the signature of the specified package-level function.
	func funcSig(pkg types.Package, name string) types.Signature {
	if f, ok := pkg.Scope().Lookup(name).(*types.Func); ok {
	return f.Type().(*types.Signature)
	}
	return nil
	}

	// soleExpr returns the sole expression in the before/after template function.
	func soleExpr(fn *ast.FuncDecl) (ast.Expr, error) {
	if fn.Body == nil {
	return nil, fmt.Errorf("no body")
	}
	if len(fn.Body.List) != 1 {
	return nil, fmt.Errorf("must contain a single statement")
	}
	switch stmt := fn.Body.List[0].(type) {
	case *ast.ReturnStmt:
	if len(stmt.Results) != 1 {
	return nil, fmt.Errorf("return statement must have a single operand")
	}
	return stmt.Results[0], nil

	case *ast.ExprStmt:
	return stmt.X, nil
	}

	return nil, fmt.Errorf("must contain a single return or expression statement")
	}

	// stmtAndExpr returns the expression in the last return statement as well as the preceding lines.
	func stmtAndExpr(fn *ast.FuncDecl) ([]ast.Stmt, ast.Expr, error) {
	if fn.Body == nil {
	return nil, nil, fmt.Errorf("no body")
	}

	n := len(fn.Body.List)
	if n == 0 {
	return nil, nil, fmt.Errorf("must contain at least one statement")
	}

	stmts, last := fn.Body.List[:n-1], fn.Body.List[n-1]

	switch last := last.(type) {
	case *ast.ReturnStmt:
	if len(last.Results) != 1 {
	return nil, nil, fmt.Errorf("return statement must have a single operand")
	}
	return stmts, last.Results[0], nil

	case *ast.ExprStmt:
	return stmts, last.X, nil
	}

	return nil, nil, fmt.Errorf("must end with a single return or expression statement")
	}

	// mergeTypeInfo adds type info from src to dst.
	func mergeTypeInfo(dst, src *types.Info) {
	for k, v := range src.Types {
	dst.Types[k] = v
	}
	for k, v := range src.Defs {
	dst.Defs[k] = v
	}
	for k, v := range src.Uses {
	dst.Uses[k] = v
	}
	for k, v := range src.Selections {
	dst.Selections[k] = v
	}
	}

	// (debugging only)
	func astString(fset *token.FileSet, n ast.Node) string {
	var buf bytes.Buffer
	printer.Fprint(&buf, fset, n)
	return buf.String()
	}