Commit 912ec199, authored by Dmitri Shuralyov and committed by Robert Griesemer

go/format, cmd/gofmt: fix issues with partial Go code with indent

Fixes #5551.
Fixes #4449.

Adds tests for both issues.

Note that the two issues occur only when formatting partial Go code
with indent.

The best way to understand the change is as follows: I took the code
of cmd/gofmt and go/format, combined it into one unified implementation
that suffers from neither issue 4449 nor issue 5551, and then applied
that code to both cmd/gofmt and go/format.

As a result, there is now much more identical code between the two
packages, making future code deduplication easier (it was not possible
to do that now without adding public APIs, which I was advised not to
do at this time).

More specifically, I took the parse() of cmd/gofmt, which correctly
preserves comments (issue 5551), and modified it to fix the issue where
it would sometimes modify literal values (issue 4449).

I ended up removing the matchSpace() function because some of its work
(inserting the indent) is no longer needed, and another part of its work
(determining the indentation of the first code line) has to be done in
advance, because that calculation is required for cfg.Fprint() to run.

indentAdj is used to adjust the indent of cfg.Fprint() to compensate
for the body of the wrapper func being indented by one level. This makes
it possible to get rid of the bytes.Replace text manipulation of the
inner content, which was problematic and sometimes altered raw string
literals (issue 4449). This means that the value of cfg.Indent is
sometimes negative, but that works as expected.

So now the algorithm for formatting partial Go code is:

1. Determine and prepend leading space of original source.
2. Determine and prepend indentation of first code line.
3. Format and write partial Go code (with all of its leading &
   trailing space trimmed).
4. Determine and append trailing space of original source.

LGTM=gri
R=golang-codereviews, bradfitz, gri
CC=golang-codereviews
https://golang.org/cl/142360043
parent 0b36211c
...@@ -87,13 +87,13 @@ func processFile(filename string, in io.Reader, out io.Writer, stdin bool) error ...@@ -87,13 +87,13 @@ func processFile(filename string, in io.Reader, out io.Writer, stdin bool) error
return err return err
} }
file, adjust, err := parse(fileSet, filename, src, stdin) file, sourceAdj, indentAdj, err := parse(fileSet, filename, src, stdin)
if err != nil { if err != nil {
return err return err
} }
if rewrite != nil { if rewrite != nil {
if adjust == nil { if sourceAdj == nil {
file = rewrite(file) file = rewrite(file)
} else { } else {
fmt.Fprintf(os.Stderr, "warning: rewrite ignored for incomplete programs\n") fmt.Fprintf(os.Stderr, "warning: rewrite ignored for incomplete programs\n")
...@@ -106,15 +106,10 @@ func processFile(filename string, in io.Reader, out io.Writer, stdin bool) error ...@@ -106,15 +106,10 @@ func processFile(filename string, in io.Reader, out io.Writer, stdin bool) error
simplify(file) simplify(file)
} }
var buf bytes.Buffer res, err := format(fileSet, file, sourceAdj, indentAdj, src)
err = (&printer.Config{Mode: printerMode, Tabwidth: tabWidth}).Fprint(&buf, fileSet, file)
if err != nil { if err != nil {
return err return err
} }
res := buf.Bytes()
if adjust != nil {
res = adjust(src, res)
}
if !bytes.Equal(src, res) { if !bytes.Equal(src, res) {
// formatting has changed // formatting has changed
...@@ -242,17 +237,19 @@ func diff(b1, b2 []byte) (data []byte, err error) { ...@@ -242,17 +237,19 @@ func diff(b1, b2 []byte) (data []byte, err error) {
// parse parses src, which was read from filename, // parse parses src, which was read from filename,
// as a Go source file or statement list. // as a Go source file or statement list.
func parse(fset *token.FileSet, filename string, src []byte, stdin bool) (*ast.File, func(orig, src []byte) []byte, error) { func parse(fset *token.FileSet, filename string, src []byte, fragmentOk bool) (
file *ast.File,
sourceAdj func(src []byte, indent int) []byte,
indentAdj int,
err error,
) {
// Try as whole source file. // Try as whole source file.
file, err := parser.ParseFile(fset, filename, src, parserMode) file, err = parser.ParseFile(fset, filename, src, parserMode)
if err == nil { // If there's no error, return. If the error is that the source file didn't begin with a
return file, nil, nil // package line and source fragments are ok, fall through to
}
// If the error is that the source file didn't begin with a
// package line and this is standard input, fall through to
// try as a source fragment. Stop and return on any other error. // try as a source fragment. Stop and return on any other error.
if !stdin || !strings.Contains(err.Error(), "expected 'package'") { if err == nil || !fragmentOk || !strings.Contains(err.Error(), "expected 'package'") {
return nil, nil, err return
} }
// If this is a declaration list, make it a source file // If this is a declaration list, make it a source file
...@@ -262,19 +259,19 @@ func parse(fset *token.FileSet, filename string, src []byte, stdin bool) (*ast.F ...@@ -262,19 +259,19 @@ func parse(fset *token.FileSet, filename string, src []byte, stdin bool) (*ast.F
psrc := append([]byte("package p;"), src...) psrc := append([]byte("package p;"), src...)
file, err = parser.ParseFile(fset, filename, psrc, parserMode) file, err = parser.ParseFile(fset, filename, psrc, parserMode)
if err == nil { if err == nil {
adjust := func(orig, src []byte) []byte { sourceAdj = func(src []byte, indent int) []byte {
// Remove the package clause. // Remove the package clause.
// Gofmt has turned the ; into a \n. // Gofmt has turned the ; into a \n.
src = src[len("package p\n"):] src = src[indent+len("package p\n"):]
return matchSpace(orig, src) return bytes.TrimSpace(src)
} }
return file, adjust, nil return
} }
// If the error is that the source file didn't begin with a // If the error is that the source file didn't begin with a
// declaration, fall through to try as a statement list. // declaration, fall through to try as a statement list.
// Stop and return on any other error. // Stop and return on any other error.
if !strings.Contains(err.Error(), "expected declaration") { if !strings.Contains(err.Error(), "expected declaration") {
return nil, nil, err return
} }
// If this is a statement list, make it a source file // If this is a statement list, make it a source file
...@@ -285,65 +282,89 @@ func parse(fset *token.FileSet, filename string, src []byte, stdin bool) (*ast.F ...@@ -285,65 +282,89 @@ func parse(fset *token.FileSet, filename string, src []byte, stdin bool) (*ast.F
fsrc := append(append([]byte("package p; func _() {"), src...), '\n', '}') fsrc := append(append([]byte("package p; func _() {"), src...), '\n', '}')
file, err = parser.ParseFile(fset, filename, fsrc, parserMode) file, err = parser.ParseFile(fset, filename, fsrc, parserMode)
if err == nil { if err == nil {
adjust := func(orig, src []byte) []byte { sourceAdj = func(src []byte, indent int) []byte {
// Cap adjusted indent to zero.
if indent < 0 {
indent = 0
}
// Remove the wrapping. // Remove the wrapping.
// Gofmt has turned the ; into a \n\n. // Gofmt has turned the ; into a \n\n.
src = src[len("package p\n\nfunc _() {"):] // There will be two non-blank lines with indent, hence 2*indent.
src = src[:len(src)-len("\n}\n")] src = src[2*indent+len("package p\n\nfunc _() {"):]
// Gofmt has also indented the function body one level. src = src[:len(src)-(indent+len("\n}\n"))]
// Remove that indent. return bytes.TrimSpace(src)
src = bytes.Replace(src, []byte("\n\t"), []byte("\n"), -1)
return matchSpace(orig, src)
} }
return file, adjust, nil // Gofmt has also indented the function body one level.
// Adjust that with indentAdj.
indentAdj = -1
} }
// Failed, and out of options. // Succeeded, or out of options.
return nil, nil, err return
} }
func cutSpace(b []byte) (before, middle, after []byte) { func format(fset *token.FileSet, file *ast.File, sourceAdj func(src []byte, indent int) []byte, indentAdj int, src []byte) ([]byte, error) {
i := 0 if sourceAdj == nil {
for i < len(b) && (b[i] == ' ' || b[i] == '\t' || b[i] == '\n') { // Complete source file.
i++ var buf bytes.Buffer
err := (&printer.Config{Mode: printerMode, Tabwidth: tabWidth}).Fprint(&buf, fset, file)
if err != nil {
return nil, err
} }
j := len(b) return buf.Bytes(), nil
for j > 0 && (b[j-1] == ' ' || b[j-1] == '\t' || b[j-1] == '\n') {
j--
} }
if i <= j {
return b[:i], b[i:j], b[j:] // Partial source file.
// Determine and prepend leading space.
i, j := 0, 0
for j < len(src) && isSpace(src[j]) {
if src[j] == '\n' {
i = j + 1 // byte offset of last line in leading space
} }
return nil, nil, b[j:] j++
} }
var res []byte
res = append(res, src[:i]...)
// matchSpace reformats src to use the same space context as orig. // Determine and prepend indentation of first code line.
// 1) If orig begins with blank lines, matchSpace inserts them at the beginning of src. // Spaces are ignored unless there are no tabs,
// 2) matchSpace copies the indentation of the first non-blank line in orig // in which case spaces count as one tab.
// to every non-blank line in src. indent := 0
// 3) matchSpace copies the trailing space from orig and uses it in place hasSpace := false
// of src's trailing space. for _, b := range src[i:j] {
func matchSpace(orig []byte, src []byte) []byte { switch b {
before, _, after := cutSpace(orig) case ' ':
i := bytes.LastIndex(before, []byte{'\n'}) hasSpace = true
before, indent := before[:i+1], before[i+1:] case '\t':
indent++
_, src, _ = cutSpace(src)
var b bytes.Buffer
b.Write(before)
for len(src) > 0 {
line := src
if i := bytes.IndexByte(line, '\n'); i >= 0 {
line, src = line[:i+1], line[i+1:]
} else {
src = nil
} }
if len(line) > 0 && line[0] != '\n' { // not blank
b.Write(indent)
} }
b.Write(line) if indent == 0 && hasSpace {
indent = 1
} }
b.Write(after) for i := 0; i < indent; i++ {
return b.Bytes() res = append(res, '\t')
}
// Format the source.
// Write it without any leading and trailing space.
cfg := &printer.Config{Mode: printerMode, Tabwidth: tabWidth}
cfg.Indent = indent + indentAdj
var buf bytes.Buffer
err := cfg.Fprint(&buf, fset, file)
if err != nil {
return nil, err
}
res = append(res, sourceAdj(buf.Bytes(), cfg.Indent)...)
// Determine and append trailing space.
i = len(src)
for i > 0 && isSpace(src[i-1]) {
i--
}
return append(res, src[i:]...), nil
}
func isSpace(b byte) bool {
return b == ' ' || b == '\t' || b == '\n' || b == '\r'
} }
...@@ -32,7 +32,7 @@ var ( ...@@ -32,7 +32,7 @@ var (
) )
func gofmt(fset *token.FileSet, filename string, src *bytes.Buffer) error { func gofmt(fset *token.FileSet, filename string, src *bytes.Buffer) error {
f, _, err := parse(fset, filename, src.Bytes(), false) f, _, _, err := parse(fset, filename, src.Bytes(), false)
if err != nil { if err != nil {
return err return err
} }
...@@ -60,7 +60,7 @@ func testFile(t *testing.T, b1, b2 *bytes.Buffer, filename string) { ...@@ -60,7 +60,7 @@ func testFile(t *testing.T, b1, b2 *bytes.Buffer, filename string) {
// exclude files w/ syntax errors (typically test cases) // exclude files w/ syntax errors (typically test cases)
fset := token.NewFileSet() fset := token.NewFileSet()
if _, _, err = parse(fset, filename, b1.Bytes(), false); err != nil { if _, _, _, err = parse(fset, filename, b1.Bytes(), false); err != nil {
if *verbose { if *verbose {
fmt.Fprintf(os.Stderr, "ignoring %s\n", err) fmt.Fprintf(os.Stderr, "ignoring %s\n", err)
} }
......
//gofmt -stdin
if err != nil {
source := strings.NewReader(`line 1.
line 2.
`)
return source
}
f := func(hat, tail string) {
fmt.Println(hat+`
foo
`+tail,
"more",
"and more")
}
//gofmt -stdin
if err != nil {
source := strings.NewReader(`line 1.
line 2.
`)
return source
}
f:=func( hat, tail string){
fmt. Println ( hat+ `
foo
`+ tail ,
"more" ,
"and more" )
}
//gofmt -stdin
if err != nil {
source := strings.NewReader(`line 1.
line 2.
`)
return source
}
f := func(hat, tail string) {
fmt.Println(hat+`
foo
`+tail,
"more",
"and more")
}
//gofmt -stdin
if err != nil {
source := strings.NewReader(`line 1.
line 2.
`)
return source
}
f:=func( hat, tail string){
fmt. Println ( hat+ `
foo
`+ tail ,
"more" ,
"and more" )
}
...@@ -18,6 +18,8 @@ import ( ...@@ -18,6 +18,8 @@ import (
var config = printer.Config{Mode: printer.UseSpaces | printer.TabIndent, Tabwidth: 8} var config = printer.Config{Mode: printer.UseSpaces | printer.TabIndent, Tabwidth: 8}
const parserMode = parser.ParseComments
// Node formats node in canonical gofmt style and writes the result to dst. // Node formats node in canonical gofmt style and writes the result to dst.
// //
// The node type must be *ast.File, *printer.CommentedNode, []ast.Decl, // The node type must be *ast.File, *printer.CommentedNode, []ast.Decl,
...@@ -52,7 +54,7 @@ func Node(dst io.Writer, fset *token.FileSet, node interface{}) error { ...@@ -52,7 +54,7 @@ func Node(dst io.Writer, fset *token.FileSet, node interface{}) error {
if err != nil { if err != nil {
return err return err
} }
file, err = parser.ParseFile(fset, "", buf.Bytes(), parser.ParseComments) file, err = parser.ParseFile(fset, "", buf.Bytes(), parserMode)
if err != nil { if err != nil {
// We should never get here. If we do, provide good diagnostic. // We should never get here. If we do, provide good diagnostic.
return fmt.Errorf("format.Node internal error (%s)", err) return fmt.Errorf("format.Node internal error (%s)", err)
...@@ -80,33 +82,125 @@ func Node(dst io.Writer, fset *token.FileSet, node interface{}) error { ...@@ -80,33 +82,125 @@ func Node(dst io.Writer, fset *token.FileSet, node interface{}) error {
// //
func Source(src []byte) ([]byte, error) { func Source(src []byte) ([]byte, error) {
fset := token.NewFileSet() fset := token.NewFileSet()
node, err := parse(fset, src) file, sourceAdj, indentAdj, err := parse(fset, "", src, true)
if err != nil { if err != nil {
return nil, err return nil, err
} }
var buf bytes.Buffer return format(fset, file, sourceAdj, indentAdj, src)
if file, ok := node.(*ast.File); ok { }
func hasUnsortedImports(file *ast.File) bool {
for _, d := range file.Decls {
d, ok := d.(*ast.GenDecl)
if !ok || d.Tok != token.IMPORT {
// Not an import declaration, so we're done.
// Imports are always first.
return false
}
if d.Lparen.IsValid() {
// For now assume all grouped imports are unsorted.
// TODO(gri) Should check if they are sorted already.
return true
}
// Ungrouped imports are sorted by default.
}
return false
}
// parse parses src, which was read from filename,
// as a Go source file or statement list.
func parse(fset *token.FileSet, filename string, src []byte, fragmentOk bool) (
file *ast.File,
sourceAdj func(src []byte, indent int) []byte,
indentAdj int,
err error,
) {
// Try as whole source file.
file, err = parser.ParseFile(fset, filename, src, parserMode)
// If there's no error, return. If the error is that the source file didn't begin with a
// package line and source fragments are ok, fall through to
// try as a source fragment. Stop and return on any other error.
if err == nil || !fragmentOk || !strings.Contains(err.Error(), "expected 'package'") {
return
}
// If this is a declaration list, make it a source file
// by inserting a package clause.
// Insert using a ;, not a newline, so that the line numbers
// in psrc match the ones in src.
psrc := append([]byte("package p;"), src...)
file, err = parser.ParseFile(fset, filename, psrc, parserMode)
if err == nil {
sourceAdj = func(src []byte, indent int) []byte {
// Remove the package clause.
// Gofmt has turned the ; into a \n.
src = src[indent+len("package p\n"):]
return bytes.TrimSpace(src)
}
return
}
// If the error is that the source file didn't begin with a
// declaration, fall through to try as a statement list.
// Stop and return on any other error.
if !strings.Contains(err.Error(), "expected declaration") {
return
}
// If this is a statement list, make it a source file
// by inserting a package clause and turning the list
// into a function body. This handles expressions too.
// Insert using a ;, not a newline, so that the line numbers
// in fsrc match the ones in src.
fsrc := append(append([]byte("package p; func _() {"), src...), '\n', '}')
file, err = parser.ParseFile(fset, filename, fsrc, parserMode)
if err == nil {
sourceAdj = func(src []byte, indent int) []byte {
// Cap adjusted indent to zero.
if indent < 0 {
indent = 0
}
// Remove the wrapping.
// Gofmt has turned the ; into a \n\n.
// There will be two non-blank lines with indent, hence 2*indent.
src = src[2*indent+len("package p\n\nfunc _() {"):]
src = src[:len(src)-(indent+len("\n}\n"))]
return bytes.TrimSpace(src)
}
// Gofmt has also indented the function body one level.
// Adjust that with indentAdj.
indentAdj = -1
}
// Succeeded, or out of options.
return
}
func format(fset *token.FileSet, file *ast.File, sourceAdj func(src []byte, indent int) []byte, indentAdj int, src []byte) ([]byte, error) {
if sourceAdj == nil {
// Complete source file. // Complete source file.
ast.SortImports(fset, file) ast.SortImports(fset, file)
var buf bytes.Buffer
err := config.Fprint(&buf, fset, file) err := config.Fprint(&buf, fset, file)
if err != nil { if err != nil {
return nil, err return nil, err
} }
return buf.Bytes(), nil
}
} else {
// Partial source file. // Partial source file.
// Determine and prepend leading space. // Determine and prepend leading space.
i, j := 0, 0 i, j := 0, 0
for j < len(src) && isSpace(src[j]) { for j < len(src) && isSpace(src[j]) {
if src[j] == '\n' { if src[j] == '\n' {
i = j + 1 // index of last line in leading space i = j + 1 // byte offset of last line in leading space
} }
j++ j++
} }
buf.Write(src[:i]) var res []byte
res = append(res, src[:i]...)
// Determine indentation of first code line. // Determine and prepend indentation of first code line.
// Spaces are ignored unless there are no tabs, // Spaces are ignored unless there are no tabs,
// in which case spaces count as one tab. // in which case spaces count as one tab.
indent := 0 indent := 0
...@@ -122,78 +216,29 @@ func Source(src []byte) ([]byte, error) { ...@@ -122,78 +216,29 @@ func Source(src []byte) ([]byte, error) {
if indent == 0 && hasSpace { if indent == 0 && hasSpace {
indent = 1 indent = 1
} }
for i := 0; i < indent; i++ {
res = append(res, '\t')
}
// Format the source. // Format the source.
// Write it without any leading and trailing space.
cfg := config cfg := config
cfg.Indent = indent cfg.Indent = indent + indentAdj
err := cfg.Fprint(&buf, fset, node) var buf bytes.Buffer
err := cfg.Fprint(&buf, fset, file)
if err != nil { if err != nil {
return nil, err return nil, err
} }
res = append(res, sourceAdj(buf.Bytes(), cfg.Indent)...)
// Determine and append trailing space. // Determine and append trailing space.
i = len(src) i = len(src)
for i > 0 && isSpace(src[i-1]) { for i > 0 && isSpace(src[i-1]) {
i-- i--
} }
buf.Write(src[i:]) return append(res, src[i:]...), nil
}
return buf.Bytes(), nil
}
func hasUnsortedImports(file *ast.File) bool {
for _, d := range file.Decls {
d, ok := d.(*ast.GenDecl)
if !ok || d.Tok != token.IMPORT {
// Not an import declaration, so we're done.
// Imports are always first.
return false
}
if d.Lparen.IsValid() {
// For now assume all grouped imports are unsorted.
// TODO(gri) Should check if they are sorted already.
return true
}
// Ungrouped imports are sorted by default.
}
return false
} }
func isSpace(b byte) bool { func isSpace(b byte) bool {
return b == ' ' || b == '\t' || b == '\n' || b == '\r' return b == ' ' || b == '\t' || b == '\n' || b == '\r'
} }
func parse(fset *token.FileSet, src []byte) (interface{}, error) {
// Try as a complete source file.
file, err := parser.ParseFile(fset, "", src, parser.ParseComments)
if err == nil {
return file, nil
}
// If the source is missing a package clause, try as a source fragment; otherwise fail.
if !strings.Contains(err.Error(), "expected 'package'") {
return nil, err
}
// Try as a declaration list by prepending a package clause in front of src.
// Use ';' not '\n' to keep line numbers intact.
psrc := append([]byte("package p;"), src...)
file, err = parser.ParseFile(fset, "", psrc, parser.ParseComments)
if err == nil {
return file.Decls, nil
}
// If the source is missing a declaration, try as a statement list; otherwise fail.
if !strings.Contains(err.Error(), "expected declaration") {
return nil, err
}
// Try as statement list by wrapping a function around src.
fsrc := append(append([]byte("package p; func _() {"), src...), '}')
file, err = parser.ParseFile(fset, "", fsrc, parser.ParseComments)
if err == nil {
return file.Decls[0].(*ast.FuncDecl).Body.List, nil
}
// Failed, and out of options.
return nil, err
}
...@@ -87,7 +87,11 @@ var tests = []string{ ...@@ -87,7 +87,11 @@ var tests = []string{
"\tx := 0\n\tgo f()\n\n\n", "\tx := 0\n\tgo f()\n\n\n",
"\n\t\t\n\n\tx := 0\n\tgo f()\n\n\n", "\n\t\t\n\n\tx := 0\n\tgo f()\n\n\n",
"\n\t\t\n\n\t\t\tx := 0\n\t\t\tgo f()\n\n\n", "\n\t\t\n\n\t\t\tx := 0\n\t\t\tgo f()\n\n\n",
"\n\t\t\n\n\t\t\tx := 0\n\t\t\tconst s = `\nfoo\n`\n\n\n", // no indentation inside raw strings "\n\t\t\n\n\t\t\tx := 0\n\t\t\tconst s = `\nfoo\n`\n\n\n", // no indentation added inside raw strings
"\n\t\t\n\n\t\t\tx := 0\n\t\t\tconst s = `\n\t\tfoo\n`\n\n\n", // no indentation removed inside raw strings
// comments
"i := 5 /* Comment */", // Issue 5551.
// erroneous programs // erroneous programs
"ERROR1 + 2 +", "ERROR1 + 2 +",
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment