From aa82fe333f124a754788d6fe9b2105d13fc69f68 Mon Sep 17 00:00:00 2001 From: xzb <2598514867@qq.com> Date: Fri, 29 Nov 2024 02:18:05 +0800 Subject: [PATCH 01/14] change wording --- gopls/internal/golang/codeaction.go | 6 +++--- gopls/internal/golang/fix.go | 2 +- gopls/internal/golang/undeclared.go | 4 ++-- 3 files changed, 6 insertions(+), 6 deletions(-) diff --git a/gopls/internal/golang/codeaction.go b/gopls/internal/golang/codeaction.go index 627ba1a60d6..9a7bee7f817 100644 --- a/gopls/internal/golang/codeaction.go +++ b/gopls/internal/golang/codeaction.go @@ -335,9 +335,9 @@ func quickFix(ctx context.Context, req *codeActionsRequest) error { req.addApplyFixAction(msg, fixMissingCalledFunction, req.loc) } - // "undeclared name: x" or "undefined: x" compiler error. - // Offer a "Create variable/function x" code action. - // See [fixUndeclared] for command implementation. + // "undeclared name: X" or "undefined: X" compiler error. + // Offer a "Create variable/function X" code action. + // See [createUndeclared] for command implementation. case strings.HasPrefix(msg, "undeclared name: "), strings.HasPrefix(msg, "undefined: "): path, _ := astutil.PathEnclosingInterval(req.pgf.File, start, end) diff --git a/gopls/internal/golang/fix.go b/gopls/internal/golang/fix.go index 7e83c1d6700..e812c677541 100644 --- a/gopls/internal/golang/fix.go +++ b/gopls/internal/golang/fix.go @@ -112,7 +112,7 @@ func ApplyFix(ctx context.Context, fix string, snapshot *cache.Snapshot, fh file fixInvertIfCondition: singleFile(invertIfCondition), fixSplitLines: singleFile(splitLines), fixJoinLines: singleFile(joinLines), - fixCreateUndeclared: singleFile(CreateUndeclared), + fixCreateUndeclared: singleFile(createUndeclared), fixMissingInterfaceMethods: stubMissingInterfaceMethodsFixer, fixMissingCalledFunction: stubMissingCalledFunctionFixer, } diff --git a/gopls/internal/golang/undeclared.go b/gopls/internal/golang/undeclared.go index 35a5c7a1e57..0615386e9bf 100644 --- a/gopls/internal/golang/undeclared.go +++ b/gopls/internal/golang/undeclared.go @@ -68,8 +68,8 @@ func undeclaredFixTitle(path []ast.Node, errMsg string) string { return fmt.Sprintf("Create %s %s", noun, name) } -// CreateUndeclared generates a suggested declaration for an undeclared variable or function. -func CreateUndeclared(fset *token.FileSet, start, end token.Pos, content []byte, file *ast.File, pkg *types.Package, info *types.Info) (*token.FileSet, *analysis.SuggestedFix, error) { +// createUndeclared generates a suggested declaration for an undeclared variable or function. +func createUndeclared(fset *token.FileSet, start, end token.Pos, content []byte, file *ast.File, pkg *types.Package, info *types.Info) (*token.FileSet, *analysis.SuggestedFix, error) { pos := start // don't use the end path, _ := astutil.PathEnclosingInterval(file, pos, pos) if len(path) < 2 { From f37d0177cde925572b7fdc408681a592547c2bae Mon Sep 17 00:00:00 2001 From: xzb <2598514867@qq.com> Date: Fri, 13 Dec 2024 07:26:08 +0800 Subject: [PATCH 02/14] factor out a thin signature of parsePrintfVerb zz --- go/analysis/passes/printf/printf.go | 117 ++++---- gopls/internal/golang/highlight.go | 273 +++++++++++++++++- .../testdata/highlight/highlight_printf.txt | 40 +++ 3 files changed, 365 insertions(+), 65 deletions(-) create mode 100644 gopls/internal/test/marker/testdata/highlight/highlight_printf.txt diff --git a/go/analysis/passes/printf/printf.go b/go/analysis/passes/printf/printf.go index 95c4bbaa98a..4273e00e5ba 100644 --- a/go/analysis/passes/printf/printf.go +++ b/go/analysis/passes/printf/printf.go @@ -421,9 +421,9 @@ func checkCall(pass *analysis.Pass) { fn, kind := printfNameAndKind(pass, call) switch kind { case KindPrintf, KindErrorf: - checkPrintf(pass, kind, call, fn) + checkPrintf(pass, kind, call, fn.FullName()) case KindPrint: - checkPrint(pass, call, fn) + checkPrint(pass, call, fn.FullName()) } }) } @@ -490,12 +490,10 @@ func isFormatter(typ types.Type) bool { type formatState struct { verb rune // the format verb: 'd' for "%d" format string // the full format directive from % through verb, "%.3d". - name string // Printf, Sprintf etc. flags []byte // the list of # + etc. argNums []int // the successive argument numbers that are consumed, adjusted to refer to actual arg in call firstArg int // Index of first argument after the format in the Printf call. // Used only during parse. - pass *analysis.Pass call *ast.CallExpr argNum int // Which argument we're expecting to format now. hasIndex bool // Whether the argument is indexed. @@ -504,7 +502,7 @@ type formatState struct { } // checkPrintf checks a call to a formatted print routine such as Printf. -func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, fn *types.Func) { +func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, fname string) { idx := formatStringIndex(pass, call) if idx < 0 || idx >= len(call.Args) { return @@ -523,7 +521,7 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, fn *types.F Pos: formatArg.Pos(), End: formatArg.End(), Message: fmt.Sprintf("non-constant format string in call to %s", - fn.FullName()), + fname), SuggestedFixes: []analysis.SuggestedFix{{ Message: `Insert "%s" format string`, TextEdits: []analysis.TextEdit{{ @@ -540,7 +538,7 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, fn *types.F firstArg := idx + 1 // Arguments are immediately after format string. if !strings.Contains(format, "%") { if len(call.Args) > firstArg { - pass.Reportf(call.Lparen, "%s call has arguments but no formatting directives", fn.FullName()) + pass.Reportf(call.Lparen, "%s call has arguments but no formatting directives", fname) } return } @@ -553,12 +551,13 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, fn *types.F if format[i] != '%' { continue } - state := parsePrintfVerb(pass, call, fn.FullName(), format[i:], firstArg, argNum) - if state == nil { + state, err := parsePrintfVerb(call, format[i:], firstArg, argNum) + if err != nil { + pass.ReportRangef(call.Fun, "%s %s", fname, err.Error()) return } w = len(state.format) - if !okPrintfArg(pass, call, state) { // One error per format is enough. + if !okPrintfArg(pass, call, state, fname) { // One error per format is enough. return } if state.hasIndex { @@ -567,7 +566,7 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, fn *types.F if state.verb == 'w' { switch kind { case KindNone, KindPrint, KindPrintf: - pass.Reportf(call.Pos(), "%s does not support error-wrapping directive %%w", state.name) + pass.Reportf(call.Pos(), "%s does not support error-wrapping directive %%w", fname) return } } @@ -593,7 +592,7 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, fn *types.F if maxArgNum != len(call.Args) { expect := maxArgNum - firstArg numArgs := len(call.Args) - firstArg - pass.ReportRangef(call, "%s call needs %v but has %v", fn.FullName(), count(expect, "arg"), count(numArgs, "arg")) + pass.ReportRangef(call, "%s call needs %v but has %v", fname, count(expect, "arg"), count(numArgs, "arg")) } } @@ -621,9 +620,9 @@ func (s *formatState) scanNum() { } // parseIndex scans an index expression. It returns false if there is a syntax error. -func (s *formatState) parseIndex() bool { +func (s *formatState) parseIndex() error { if s.nbytes == len(s.format) || s.format[s.nbytes] != '[' { - return true + return nil } // Argument index present. s.nbytes++ // skip '[' @@ -634,15 +633,13 @@ func (s *formatState) parseIndex() bool { ok = false // syntax error is either missing "]" or invalid index. s.nbytes = strings.Index(s.format[start:], "]") if s.nbytes < 0 { - s.pass.ReportRangef(s.call, "%s format %s is missing closing ]", s.name, s.format) - return false + return fmt.Errorf("format %s is missing closing ]", s.format) } s.nbytes = s.nbytes + start } arg32, err := strconv.ParseInt(s.format[start:s.nbytes], 10, 32) if err != nil || !ok || arg32 <= 0 || arg32 > int64(len(s.call.Args)-s.firstArg) { - s.pass.ReportRangef(s.call, "%s format has invalid argument index [%s]", s.name, s.format[start:s.nbytes]) - return false + return fmt.Errorf("format has invalid argument index [%s]", s.format[start:s.nbytes]) } s.nbytes++ // skip ']' arg := int(arg32) @@ -650,11 +647,11 @@ func (s *formatState) parseIndex() bool { s.argNum = arg s.hasIndex = true s.indexPending = true - return true + return nil } -// parseNum scans a width or precision (or *). It returns false if there's a bad index expression. -func (s *formatState) parseNum() bool { +// parseNum scans a width or precision (or *). +func (s *formatState) parseNum() { if s.nbytes < len(s.format) && s.format[s.nbytes] == '*' { if s.indexPending { // Absorb it. s.indexPending = false @@ -665,61 +662,55 @@ func (s *formatState) parseNum() bool { } else { s.scanNum() } - return true } // parsePrecision scans for a precision. It returns false if there's a bad index expression. -func (s *formatState) parsePrecision() bool { +func (s *formatState) parsePrecision() error { // If there's a period, there may be a precision. if s.nbytes < len(s.format) && s.format[s.nbytes] == '.' { s.flags = append(s.flags, '.') // Treat precision as a flag. s.nbytes++ - if !s.parseIndex() { - return false - } - if !s.parseNum() { - return false + if err := s.parseIndex(); err != nil { + return err } + s.parseNum() } - return true + return nil } // parsePrintfVerb looks the formatting directive that begins the format string // and returns a formatState that encodes what the directive wants, without looking -// at the actual arguments present in the call. The result is nil if there is an error. -func parsePrintfVerb(pass *analysis.Pass, call *ast.CallExpr, name, format string, firstArg, argNum int) *formatState { +// at the actual arguments present in the call. It returns the error description if parse fails. +func parsePrintfVerb(call *ast.CallExpr, format string, firstArg, argNum int) (*formatState, error) { state := &formatState{ format: format, - name: name, flags: make([]byte, 0, 5), argNum: argNum, argNums: make([]int, 0, 1), nbytes: 1, // There's guaranteed to be a percent sign. firstArg: firstArg, - pass: pass, call: call, } // There may be flags. state.parseFlags() // There may be an index. - if !state.parseIndex() { - return nil + if err := state.parseIndex(); err != nil { + return nil, err } // There may be a width. - if !state.parseNum() { - return nil - } + state.parseNum() // There may be a precision. - if !state.parsePrecision() { - return nil + if err := state.parsePrecision(); err != nil { + return nil, err } // Now a verb, possibly prefixed by an index (which we may already have). - if !state.indexPending && !state.parseIndex() { - return nil + if !state.indexPending { + if err := state.parseIndex(); err != nil { + return nil, err + } } if state.nbytes == len(state.format) { - pass.ReportRangef(call.Fun, "%s format %s is missing verb at end of string", name, state.format) - return nil + return nil, fmt.Errorf("format %s is missing verb at end of string", state.format) } verb, w := utf8.DecodeRuneInString(state.format[state.nbytes:]) state.verb = verb @@ -728,7 +719,7 @@ func parsePrintfVerb(pass *analysis.Pass, call *ast.CallExpr, name, format strin state.argNums = append(state.argNums, state.argNum) } state.format = state.format[:state.nbytes] - return state + return state, nil } // printfArgType encodes the types of expressions a printf verb accepts. It is a bitmask. @@ -794,7 +785,7 @@ var printVerbs = []printVerb{ // okPrintfArg compares the formatState to the arguments actually present, // reporting any discrepancies it can discern. If the final argument is ellipsissed, // there's little it can do for that. -func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, state *formatState) (ok bool) { +func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, state *formatState, fname string) (ok bool) { var v printVerb found := false // Linear scan is fast enough for a small list. @@ -816,7 +807,7 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, state *formatState) (o if !formatter { if !found { - pass.ReportRangef(call, "%s format %s has unknown verb %c", state.name, state.format, state.verb) + pass.ReportRangef(call, "%s format %s has unknown verb %c", fname, state.format, state.verb) return false } for _, flag := range state.flags { @@ -826,7 +817,7 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, state *formatState) (o continue } if !strings.ContainsRune(v.flags, rune(flag)) { - pass.ReportRangef(call, "%s format %s has unrecognized flag %c", state.name, state.format, flag) + pass.ReportRangef(call, "%s format %s has unrecognized flag %c", fname, state.format, flag) return false } } @@ -840,7 +831,7 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, state *formatState) (o nargs := len(state.argNums) for i := 0; i < nargs-trueArgs; i++ { argNum := state.argNums[i] - if !argCanBeChecked(pass, call, i, state) { + if !argCanBeChecked(pass, call, i, state, fname) { return } arg := call.Args[argNum] @@ -849,7 +840,7 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, state *formatState) (o if reason != "" { details = " (" + reason + ")" } - pass.ReportRangef(call, "%s format %s uses non-int %s%s as argument of *", state.name, state.format, analysisinternal.Format(pass.Fset, arg), details) + pass.ReportRangef(call, "%s format %s uses non-int %s%s as argument of *", fname, state.format, analysisutil.Format(pass.Fset, arg), details) return false } } @@ -858,12 +849,12 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, state *formatState) (o return true } argNum := state.argNums[len(state.argNums)-1] - if !argCanBeChecked(pass, call, len(state.argNums)-1, state) { + if !argCanBeChecked(pass, call, len(state.argNums)-1, state, fname) { return false } arg := call.Args[argNum] if isFunctionValue(pass, arg) && state.verb != 'p' && state.verb != 'T' { - pass.ReportRangef(call, "%s format %s arg %s is a func value, not called", state.name, state.format, analysisinternal.Format(pass.Fset, arg)) + pass.ReportRangef(call, "%s format %s arg %s is a func value, not called", fname, state.format, analysisutil.Format(pass.Fset, arg)) return false } if reason, ok := matchArgType(pass, v.typ, arg); !ok { @@ -875,12 +866,12 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, state *formatState) (o if reason != "" { details = " (" + reason + ")" } - pass.ReportRangef(call, "%s format %s has arg %s of wrong type %s%s", state.name, state.format, analysisinternal.Format(pass.Fset, arg), typeString, details) + pass.ReportRangef(call, "%s format %s has arg %s of wrong type %s%s", fname, state.format, analysisutil.Format(pass.Fset, arg), typeString, details) return false } if v.typ&argString != 0 && v.verb != 'T' && !bytes.Contains(state.flags, []byte{'#'}) { if methodName, ok := recursiveStringer(pass, arg); ok { - pass.ReportRangef(call, "%s format %s with arg %s causes recursive %s method call", state.name, state.format, analysisinternal.Format(pass.Fset, arg), methodName) + pass.ReportRangef(call, "%s format %s with arg %s causes recursive %s method call", fname, state.format, analysisutil.Format(pass.Fset, arg), methodName) return false } } @@ -964,7 +955,7 @@ func isFunctionValue(pass *analysis.Pass, e ast.Expr) bool { // argCanBeChecked reports whether the specified argument is statically present; // it may be beyond the list of arguments or in a terminal slice... argument, which // means we can't see it. -func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, formatArg int, state *formatState) bool { +func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, formatArg int, state *formatState, name string) bool { argNum := state.argNums[formatArg] if argNum <= 0 { // Shouldn't happen, so catch it with prejudice. @@ -982,7 +973,7 @@ func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, formatArg int, sta // There are bad indexes in the format or there are fewer arguments than the format needs. // This is the argument number relative to the format: Printf("%s", "hi") will give 1 for the "hi". arg := argNum - state.firstArg + 1 // People think of arguments as 1-indexed. - pass.ReportRangef(call, "%s format %s reads arg #%d, but call has %v", state.name, state.format, arg, count(len(call.Args)-state.firstArg, "arg")) + pass.ReportRangef(call, "%s format %s reads arg #%d, but call has %v", name, state.format, arg, count(len(call.Args)-state.firstArg, "arg")) return false } @@ -999,7 +990,7 @@ const ( ) // checkPrint checks a call to an unformatted print routine such as Println. -func checkPrint(pass *analysis.Pass, call *ast.CallExpr, fn *types.Func) { +func checkPrint(pass *analysis.Pass, call *ast.CallExpr, name string) { firstArg := 0 typ := pass.TypesInfo.Types[call.Fun].Type if typ == nil { @@ -1033,7 +1024,7 @@ func checkPrint(pass *analysis.Pass, call *ast.CallExpr, fn *types.Func) { if sel, ok := call.Args[0].(*ast.SelectorExpr); ok { if x, ok := sel.X.(*ast.Ident); ok { if x.Name == "os" && strings.HasPrefix(sel.Sel.Name, "Std") { - pass.ReportRangef(call, "%s does not take io.Writer but has first arg %s", fn.FullName(), analysisinternal.Format(pass.Fset, call.Args[0])) + pass.ReportRangef(call, "%s does not take io.Writer but has first arg %s", name, analysisutil.Format(pass.Fset, call.Args[0])) } } } @@ -1047,25 +1038,25 @@ func checkPrint(pass *analysis.Pass, call *ast.CallExpr, fn *types.Func) { if strings.Contains(s, "%") { m := printFormatRE.FindStringSubmatch(s) if m != nil { - pass.ReportRangef(call, "%s call has possible Printf formatting directive %s", fn.FullName(), m[0]) + pass.ReportRangef(call, "%s call has possible Printf formatting directive %s", name, m[0]) } } } - if strings.HasSuffix(fn.Name(), "ln") { + if strings.HasSuffix(name, "ln") { // The last item, if a string, should not have a newline. arg = args[len(args)-1] if s, ok := stringConstantExpr(pass, arg); ok { if strings.HasSuffix(s, "\n") { - pass.ReportRangef(call, "%s arg list ends with redundant newline", fn.FullName()) + pass.ReportRangef(call, "%s arg list ends with redundant newline", name) } } } for _, arg := range args { if isFunctionValue(pass, arg) { - pass.ReportRangef(call, "%s arg %s is a func value, not called", fn.FullName(), analysisinternal.Format(pass.Fset, arg)) + pass.ReportRangef(call, "%s arg %s is a func value, not called", name, analysisutil.Format(pass.Fset, arg)) } if methodName, ok := recursiveStringer(pass, arg); ok { - pass.ReportRangef(call, "%s arg %s causes recursive call to %s method", fn.FullName(), analysisinternal.Format(pass.Fset, arg), methodName) + pass.ReportRangef(call, "%s arg %s causes recursive call to %s method", name, analysisutil.Format(pass.Fset, arg), methodName) } } } diff --git a/gopls/internal/golang/highlight.go b/gopls/internal/golang/highlight.go index 1174ce7f7d4..bb6773c5074 100644 --- a/gopls/internal/golang/highlight.go +++ b/gopls/internal/golang/highlight.go @@ -10,11 +10,13 @@ import ( "go/ast" "go/token" "go/types" + "strings" "golang.org/x/tools/go/ast/astutil" "golang.org/x/tools/gopls/internal/cache" "golang.org/x/tools/gopls/internal/file" "golang.org/x/tools/gopls/internal/protocol" + gastutil "golang.org/x/tools/gopls/internal/util/astutil" "golang.org/x/tools/internal/event" ) @@ -49,7 +51,7 @@ func Highlight(ctx context.Context, snapshot *cache.Snapshot, fh file.Handle, po } } } - result, err := highlightPath(path, pgf.File, pkg.TypesInfo()) + result, err := highlightPath(path, pgf.File, pkg.TypesInfo(), pos) if err != nil { return nil, err } @@ -69,8 +71,20 @@ func Highlight(ctx context.Context, snapshot *cache.Snapshot, fh file.Handle, po // highlightPath returns ranges to highlight for the given enclosing path, // which should be the result of astutil.PathEnclosingInterval. -func highlightPath(path []ast.Node, file *ast.File, info *types.Info) (map[posRange]protocol.DocumentHighlightKind, error) { +func highlightPath(path []ast.Node, file *ast.File, info *types.Info, pos token.Pos) (map[posRange]protocol.DocumentHighlightKind, error) { result := make(map[posRange]protocol.DocumentHighlightKind) + // Inside a printf-style call? + for _, node := range path { + if call, ok := node.(*ast.CallExpr); ok { + for _, args := range call.Args { + // Only try when pos is in right side of the format String. + if basicList, ok := args.(*ast.BasicLit); ok && basicList.Pos() < pos && + basicList.Kind == token.STRING && strings.Contains(basicList.Value, "%") { + highlightPrintf(basicList, call, pos, result) + } + } + } + } switch node := path[0].(type) { case *ast.BasicLit: // Import path string literal? @@ -131,6 +145,261 @@ func highlightPath(path []ast.Node, file *ast.File, info *types.Info) (map[posRa return result, nil } +// highlightPrintf identifies and highlights the relationships between placeholders +// in a format string and their corresponding variadic arguments in a printf-style +// function call. +// +// For example: +// +// fmt.Printf("Hello %s, you scored %d", name, score) +// +// If the cursor is on %s or name, highlightPrintf will highlight %s as a write operation, +// and name as a read operation. +func highlightPrintf(directive *ast.BasicLit, call *ast.CallExpr, pos token.Pos, result map[posRange]protocol.DocumentHighlightKind) { + // Two '%'s are interpreted as one '%'(escaped), let's replace them with spaces. + format := strings.Replace(directive.Value, "%%", " ", -1) + if strings.Contains(directive.Value, "%[") || + strings.Contains(directive.Value, "%p") || + strings.Contains(directive.Value, "%T") { + // parsef can not handle these cases. + return + } + expectedVariadicArgs := make([]ast.Expr, strings.Count(format, "%")) + firstVariadic := -1 + for i, arg := range call.Args { + if directive == arg { + firstVariadic = i + 1 + argsLen := len(call.Args) - i - 1 + if argsLen > len(expectedVariadicArgs) { + // Translate from Printf(a0,"%d %d",5, 6, 7) to [5, 6] + copy(expectedVariadicArgs, call.Args[firstVariadic:firstVariadic+len(expectedVariadicArgs)]) + } else { + // Translate from Printf(a0,"%d %d %s",5, 6) to [5, 6, nil] + copy(expectedVariadicArgs[:argsLen], call.Args[firstVariadic:]) + } + break + } + } + formatItems, err := parsef(format, directive.Pos(), expectedVariadicArgs...) + if err != nil { + return + } + var percent formatPercent + // Cursor in argument. + if pos > directive.End() { + var curVariadic int + // Which variadic argument cursor sits inside. + for i := firstVariadic; i < len(call.Args); i++ { + if gastutil.NodeContains(call.Args[i], pos) { + // Offset relative to formatItems. + curVariadic = i - firstVariadic + break + } + } + index := -1 + for _, item := range formatItems { + switch item := item.(type) { + case formatPercent: + percent = item + index++ + case formatVerb: + if token.Pos(percent).IsValid() { + if index == curVariadic { + // Placeholders behave like writting values from arguments to themselves, + // so highlight them with Write semantic. + highlightRange(result, token.Pos(percent), item.rang.end, protocol.Write) + highlightRange(result, item.operand.Pos(), item.operand.End(), protocol.Read) + return + } + percent = formatPercent(token.NoPos) + } + } + } + } else { + // Cursor in format string. + for _, item := range formatItems { + switch item := item.(type) { + case formatPercent: + percent = item + case formatVerb: + if token.Pos(percent).IsValid() { + if token.Pos(percent) <= pos && pos <= item.rang.end { + highlightRange(result, token.Pos(percent), item.rang.end, protocol.Write) + if item.operand != nil { + highlightRange(result, item.operand.Pos(), item.operand.End(), protocol.Read) + } + return + } + percent = formatPercent(token.NoPos) + } + } + } + } +} + +// Below are formatting directives definitions. +type formatPercent token.Pos +type formatLiteral struct { + literal string + rang posRange +} +type formatFlags struct { + flag string + rang posRange +} +type formatWidth struct { + width int + rang posRange +} +type formatPrec struct { + prec int + rang posRange +} +type formatVerb struct { + verb rune + rang posRange + operand ast.Expr // verb's corresponding operand, may be nil +} + +type formatItem interface { + formatItem() +} + +func (formatPercent) formatItem() {} +func (formatLiteral) formatItem() {} +func (formatVerb) formatItem() {} +func (formatWidth) formatItem() {} +func (formatFlags) formatItem() {} +func (formatPrec) formatItem() {} + +type formatFunc func(fmt.State, rune) + +var _ fmt.Formatter = formatFunc(nil) + +func (f formatFunc) Format(st fmt.State, verb rune) { f(st, verb) } + +// parsef parses a printf-style format string into its constituent components together with +// their position in the source code, including [formatLiteral], formatting directives +// [formatFlags], [formatPrecision], [formatWidth], [formatPrecision], [formatVerb], and its operand. +// +// If format contains explicit argument indexes, eg. fmt.Sprintf("%[2]d %[1]d\n", 11, 22), +// the returned range will not be correct. +// If an invalid argument is given for a verb, such as providing a string to %d, the returned error will +// contain a description of the problem. +func parsef(format string, pos token.Pos, args ...ast.Expr) ([]formatItem, error) { + const sep = "__GOPLS_SEP__" + // A conversion represents a single % operation and its operand. + type conversion struct { + verb rune + width int // or -1 + prec int // or -1 + flag string // some of "-+# 0" + operand ast.Expr + } + var convs []conversion + wrappers := make([]any, len(args)) + for i, operand := range args { + wrappers[i] = formatFunc(func(st fmt.State, verb rune) { + st.Write([]byte(sep)) + width, ok := st.Width() + if !ok { + width = -1 + } + prec, ok := st.Precision() + if !ok { + prec = -1 + } + flag := "" + for _, b := range "-+# 0" { + if st.Flag(int(b)) { + flag += string(b) + } + } + convs = append(convs, conversion{ + verb: verb, + width: width, + prec: prec, + flag: flag, + operand: operand, + }) + }) + } + + // Interleave the literals and the conversions. + var formatItems []formatItem + s := fmt.Sprintf(format, wrappers...) + // All errors begin with the string "%!". + if strings.Contains(s, "%!") { + return nil, fmt.Errorf("%s", strings.Replace(s, sep, "", -1)) + } + for i, word := range strings.Split(s, sep) { + if word != "" { + formatItems = append(formatItems, formatLiteral{ + literal: word, + rang: posRange{ + start: pos, + end: pos + token.Pos(len(word)), + }, + }) + pos = pos + token.Pos(len(word)) + } + if i < len(convs) { + conv := convs[i] + // Collect %. + formatItems = append(formatItems, formatPercent(pos)) + pos += 1 + // Collect flags. + if flag := conv.flag; flag != "" { + length := token.Pos(len(conv.flag)) + formatItems = append(formatItems, formatFlags{ + flag: flag, + rang: posRange{ + start: pos, + end: pos + length, + }, + }) + pos += length + } + // Collect width. + if width := conv.width; conv.width != -1 { + length := token.Pos(len(fmt.Sprintf("%d", conv.width))) + formatItems = append(formatItems, formatWidth{ + width: width, + rang: posRange{ + start: pos, + end: pos + length, + }, + }) + pos += length + } + // Collect precision, which starts with a dot. + if prec := conv.prec; conv.prec != -1 { + length := token.Pos(len(fmt.Sprintf("%d", conv.prec))) + 1 + formatItems = append(formatItems, formatPrec{ + prec: prec, + rang: posRange{ + start: pos, + end: pos + length, + }, + }) + pos += length + } + // Collect verb, which must be present. + length := token.Pos(len(string(conv.verb))) + formatItems = append(formatItems, formatVerb{ + verb: conv.verb, + rang: posRange{ + start: pos, + end: pos + length, + }, + operand: conv.operand, + }) + pos += length + } + } + return formatItems, nil +} + type posRange struct { start, end token.Pos } diff --git a/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt b/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt new file mode 100644 index 00000000000..ea0011be205 --- /dev/null +++ b/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt @@ -0,0 +1,40 @@ +This test checks functionality of the printf-like directives and operands highlight. + +-- flags -- +-ignore_extra_diags + +-- highlights.go -- +package highlightprintf + +import ( + "fmt" +) + +func BasicPrintfHighlights() { + fmt.Printf("Hello %s, you have %d new messages!", "Alice", 5) //@hiloc(normals, "%s", write),hiloc(normalarg0, "\"Alice\"", read),highlightall(normals, normalarg0) + fmt.Printf("Hello %s, you have %d new messages!", "Alice", 5) //@hiloc(normald, "%d", write),hiloc(normalargs1, "5", read),highlightall(normald, normalargs1) +} + +func ComplexPrintfHighlights() { + fmt.Printf("Hello %#3.4s, you have %-2.3d new messages!", "Alice", 5) //@hiloc(complexs, "%#3.4s", write),hiloc(complexarg0, "\"Alice\"", read),highlightall(complexs, complexarg0) + fmt.Printf("Hello %#3.4s, you have %-2.3d new messages!", "Alice", 5) //@hiloc(complexd, "%-2.3d", write),hiloc(complexarg1, "5", read),highlightall(complexd, complexarg1) +} + +func MissingDirectives() { + fmt.Printf("Hello %s, you have 5 new messages!", "Alice", 5) //@hiloc(missings, "%s", write),hiloc(missingargs0, "\"Alice\"", read),highlightall(missings, missingargs0) +} + +func TooManyDirectives() { + fmt.Printf("Hello %s, you have %d new %s %q messages!", "Alice", 5) //@hiloc(toomanys, "%s", write),hiloc(toomanyargs0, "\"Alice\"", read),highlightall(toomanys, toomanyargs0) + fmt.Printf("Hello %s, you have %d new %s %q messages!", "Alice", 5) //@hiloc(toomanyd, "%d", write),hiloc(toomanyargs1, "5", read),highlightall(toomanyd, toomanyargs1) +} + +func SpecialChars() { + fmt.Printf("Hello \n %s, you \t \n have %d new messages!", "Alice", 5) //@hiloc(specials, "%s", write),hiloc(specialargs0, "\"Alice\"", read),highlightall(specials, specialargs0) + fmt.Printf("Hello \n %s, you \t \n have %d new messages!", "Alice", 5) //@hiloc(speciald, "%d", write),hiloc(specialargs1, "5", read),highlightall(speciald, specialargs1) +} + +func Escaped() { + fmt.Printf("Hello %% \n %s, you \t%% \n have %d new m%%essages!", "Alice", 5) //@hiloc(escapeds, "%s", write),hiloc(escapedargs0, "\"Alice\"", read),highlightall(escapeds, escapedargs0) + fmt.Printf("Hello %% \n %s, you \t%% \n have %d new m%%essages!", "Alice", 5) //@hiloc(escapedd, "%s", write),hiloc(escapedargs1, "\"Alice\"", read),highlightall(escapedd, escapedargs1) +} From 88dc478240ea5b143e6da395b20bd66079764625 Mon Sep 17 00:00:00 2001 From: xzb <2598514867@qq.com> Date: Fri, 13 Dec 2024 10:20:11 +0800 Subject: [PATCH 03/14] add formatItem types --- go/analysis/passes/printf/printf.go | 87 +++++++++++++++++++++-------- 1 file changed, 63 insertions(+), 24 deletions(-) diff --git a/go/analysis/passes/printf/printf.go b/go/analysis/passes/printf/printf.go index 4273e00e5ba..ef4166846dd 100644 --- a/go/analysis/passes/printf/printf.go +++ b/go/analysis/passes/printf/printf.go @@ -376,8 +376,8 @@ var isPrint = stringSet{ // formatStringIndex returns the index of the format string (the last // non-variadic parameter) within the given printf-like call // expression, or -1 if unknown. -func formatStringIndex(pass *analysis.Pass, call *ast.CallExpr) int { - typ := pass.TypesInfo.Types[call.Fun].Type +func formatStringIndex(info *types.Info, call *ast.CallExpr) int { + typ := info.Types[call.Fun].Type if typ == nil { return -1 // missing type } @@ -402,8 +402,8 @@ func formatStringIndex(pass *analysis.Pass, call *ast.CallExpr) int { // // ("", false) is returned if expression isn't a string // constant. -func stringConstantExpr(pass *analysis.Pass, expr ast.Expr) (string, bool) { - lit := pass.TypesInfo.Types[expr].Value +func stringConstantExpr(info *types.Info, expr ast.Expr) (string, bool) { + lit := info.Types[expr].Value if lit != nil && lit.Kind() == constant.String { return constant.StringVal(lit), true } @@ -502,13 +502,13 @@ type formatState struct { } // checkPrintf checks a call to a formatted print routine such as Printf. -func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, fname string) { - idx := formatStringIndex(pass, call) +func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string) { + idx := formatStringIndex(pass.TypesInfo, call) if idx < 0 || idx >= len(call.Args) { return } formatArg := call.Args[idx] - format, ok := stringConstantExpr(pass, formatArg) + format, ok := stringConstantExpr(pass.TypesInfo, formatArg) if !ok { // Format string argument is non-constant. @@ -521,7 +521,7 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, fname strin Pos: formatArg.Pos(), End: formatArg.End(), Message: fmt.Sprintf("non-constant format string in call to %s", - fname), + name), SuggestedFixes: []analysis.SuggestedFix{{ Message: `Insert "%s" format string`, TextEdits: []analysis.TextEdit{{ @@ -538,7 +538,7 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, fname strin firstArg := idx + 1 // Arguments are immediately after format string. if !strings.Contains(format, "%") { if len(call.Args) > firstArg { - pass.Reportf(call.Lparen, "%s call has arguments but no formatting directives", fname) + pass.Reportf(call.Lparen, "%s call has arguments but no formatting directives", name) } return } @@ -553,11 +553,11 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, fname strin } state, err := parsePrintfVerb(call, format[i:], firstArg, argNum) if err != nil { - pass.ReportRangef(call.Fun, "%s %s", fname, err.Error()) + pass.ReportRangef(call.Fun, "%s %s", name, err.Error()) return } w = len(state.format) - if !okPrintfArg(pass, call, state, fname) { // One error per format is enough. + if !okPrintfArg(pass, call, name, state) { // One error per format is enough. return } if state.hasIndex { @@ -566,7 +566,7 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, fname strin if state.verb == 'w' { switch kind { case KindNone, KindPrint, KindPrintf: - pass.Reportf(call.Pos(), "%s does not support error-wrapping directive %%w", fname) + pass.Reportf(call.Pos(), "%s does not support error-wrapping directive %%w", name) return } } @@ -592,7 +592,7 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, fname strin if maxArgNum != len(call.Args) { expect := maxArgNum - firstArg numArgs := len(call.Args) - firstArg - pass.ReportRangef(call, "%s call needs %v but has %v", fname, count(expect, "arg"), count(numArgs, "arg")) + pass.ReportRangef(call, "%s call needs %v but has %v", name, count(expect, "arg"), count(numArgs, "arg")) } } @@ -678,6 +678,45 @@ func (s *formatState) parsePrecision() error { return nil } +// Below are formatting directives definitions. +type formatPercent token.Pos +type formatLiteral struct { + literal string + rang posRange +} +type formatFlags struct { + flag string + rang posRange +} +type formatWidth struct { + width int + rang posRange +} +type formatPrec struct { + prec int + rang posRange +} +type formatVerb struct { + verb rune + rang posRange + operand ast.Expr // verb's corresponding operand, may be nil +} + +type posRange struct { + start, end token.Pos +} + +type formatItem interface { + formatItem() +} + +func (formatPercent) formatItem() {} +func (formatLiteral) formatItem() {} +func (formatVerb) formatItem() {} +func (formatWidth) formatItem() {} +func (formatFlags) formatItem() {} +func (formatPrec) formatItem() {} + // parsePrintfVerb looks the formatting directive that begins the format string // and returns a formatState that encodes what the directive wants, without looking // at the actual arguments present in the call. It returns the error description if parse fails. @@ -785,7 +824,7 @@ var printVerbs = []printVerb{ // okPrintfArg compares the formatState to the arguments actually present, // reporting any discrepancies it can discern. If the final argument is ellipsissed, // there's little it can do for that. -func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, state *formatState, fname string) (ok bool) { +func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, name string, state *formatState) (ok bool) { var v printVerb found := false // Linear scan is fast enough for a small list. @@ -807,7 +846,7 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, state *formatState, fn if !formatter { if !found { - pass.ReportRangef(call, "%s format %s has unknown verb %c", fname, state.format, state.verb) + pass.ReportRangef(call, "%s format %s has unknown verb %c", name, state.format, state.verb) return false } for _, flag := range state.flags { @@ -817,7 +856,7 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, state *formatState, fn continue } if !strings.ContainsRune(v.flags, rune(flag)) { - pass.ReportRangef(call, "%s format %s has unrecognized flag %c", fname, state.format, flag) + pass.ReportRangef(call, "%s format %s has unrecognized flag %c", name, state.format, flag) return false } } @@ -831,7 +870,7 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, state *formatState, fn nargs := len(state.argNums) for i := 0; i < nargs-trueArgs; i++ { argNum := state.argNums[i] - if !argCanBeChecked(pass, call, i, state, fname) { + if !argCanBeChecked(pass, call, i, state, name) { return } arg := call.Args[argNum] @@ -840,7 +879,7 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, state *formatState, fn if reason != "" { details = " (" + reason + ")" } - pass.ReportRangef(call, "%s format %s uses non-int %s%s as argument of *", fname, state.format, analysisutil.Format(pass.Fset, arg), details) + pass.ReportRangef(call, "%s format %s uses non-int %s%s as argument of *", name, state.format, analysisutil.Format(pass.Fset, arg), details) return false } } @@ -849,12 +888,12 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, state *formatState, fn return true } argNum := state.argNums[len(state.argNums)-1] - if !argCanBeChecked(pass, call, len(state.argNums)-1, state, fname) { + if !argCanBeChecked(pass, call, len(state.argNums)-1, state, name) { return false } arg := call.Args[argNum] if isFunctionValue(pass, arg) && state.verb != 'p' && state.verb != 'T' { - pass.ReportRangef(call, "%s format %s arg %s is a func value, not called", fname, state.format, analysisutil.Format(pass.Fset, arg)) + pass.ReportRangef(call, "%s format %s arg %s is a func value, not called", name, state.format, analysisutil.Format(pass.Fset, arg)) return false } if reason, ok := matchArgType(pass, v.typ, arg); !ok { @@ -866,12 +905,12 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, state *formatState, fn if reason != "" { details = " (" + reason + ")" } - pass.ReportRangef(call, "%s format %s has arg %s of wrong type %s%s", fname, state.format, analysisutil.Format(pass.Fset, arg), typeString, details) + pass.ReportRangef(call, "%s format %s has arg %s of wrong type %s%s", name, state.format, analysisutil.Format(pass.Fset, arg), typeString, details) return false } if v.typ&argString != 0 && v.verb != 'T' && !bytes.Contains(state.flags, []byte{'#'}) { if methodName, ok := recursiveStringer(pass, arg); ok { - pass.ReportRangef(call, "%s format %s with arg %s causes recursive %s method call", fname, state.format, analysisutil.Format(pass.Fset, arg), methodName) + pass.ReportRangef(call, "%s format %s with arg %s causes recursive %s method call", name, state.format, analysisutil.Format(pass.Fset, arg), methodName) return false } } @@ -1031,7 +1070,7 @@ func checkPrint(pass *analysis.Pass, call *ast.CallExpr, name string) { } arg := args[0] - if s, ok := stringConstantExpr(pass, arg); ok { + if s, ok := stringConstantExpr(pass.TypesInfo, arg); ok { // Ignore trailing % character // The % in "abc 0.0%" couldn't be a formatting directive. s = strings.TrimSuffix(s, "%") @@ -1045,7 +1084,7 @@ func checkPrint(pass *analysis.Pass, call *ast.CallExpr, name string) { if strings.HasSuffix(name, "ln") { // The last item, if a string, should not have a newline. arg = args[len(args)-1] - if s, ok := stringConstantExpr(pass, arg); ok { + if s, ok := stringConstantExpr(pass.TypesInfo, arg); ok { if strings.HasSuffix(s, "\n") { pass.ReportRangef(call, "%s arg list ends with redundant newline", name) } From 205449a97440f7fbb37bca9e074b28b9178c5a8b Mon Sep 17 00:00:00 2001 From: xzb <2598514867@qq.com> Date: Tue, 17 Dec 2024 00:57:26 +0800 Subject: [PATCH 04/14] test pass --- go/analysis/passes/printf/printf.go | 163 +++++------ internal/fmtstr/parse.go | 438 ++++++++++++++++++++++++++++ 2 files changed, 509 insertions(+), 92 deletions(-) create mode 100644 internal/fmtstr/parse.go diff --git a/go/analysis/passes/printf/printf.go b/go/analysis/passes/printf/printf.go index ef4166846dd..14ee44a26bd 100644 --- a/go/analysis/passes/printf/printf.go +++ b/go/analysis/passes/printf/printf.go @@ -25,6 +25,7 @@ import ( "golang.org/x/tools/go/ast/inspector" "golang.org/x/tools/go/types/typeutil" "golang.org/x/tools/internal/analysisinternal" + "golang.org/x/tools/internal/fmtstr" "golang.org/x/tools/internal/typeparams" ) @@ -535,7 +536,10 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string return } - firstArg := idx + 1 // Arguments are immediately after format string. + var anyIndex bool + var firstArg int + firstArg = idx + 1 // Arguments are immediately after format string. + maxArgNum := firstArg if !strings.Contains(format, "%") { if len(call.Args) > firstArg { pass.Reportf(call.Lparen, "%s call has arguments but no formatting directives", name) @@ -543,43 +547,30 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string return } // Hard part: check formats against args. - argNum := firstArg - maxArgNum := firstArg - anyIndex := false - for i, w := 0, 0; i < len(format); i += w { - w = 1 - if format[i] != '%' { - continue - } - state, err := parsePrintfVerb(call, format[i:], firstArg, argNum) - if err != nil { - pass.ReportRangef(call.Fun, "%s %s", name, err.Error()) - return + states, err := fmtstr.ParsePrintf(pass.TypesInfo, call, name) + if err != nil { + pass.ReportRangef(call.Fun, "%s %s", name, err.Error()) + return + } + + for _, state := range states { + if (state.Prec != nil && state.Prec.Index != -1) || + (state.Width != nil && state.Width.Index != -1) || + (state.Verb != nil && state.Verb.Index != -1) { + anyIndex = true } - w = len(state.format) - if !okPrintfArg(pass, call, name, state) { // One error per format is enough. + if !okPrintfArg(pass, call, &maxArgNum, name, state) { // One error per format is enough. return } - if state.hasIndex { - anyIndex = true - } - if state.verb == 'w' { + if state.Verb.Verb == 'w' { switch kind { case KindNone, KindPrint, KindPrintf: pass.Reportf(call.Pos(), "%s does not support error-wrapping directive %%w", name) return } } - if len(state.argNums) > 0 { - // Continue with the next sequential argument. - argNum = state.argNums[len(state.argNums)-1] + 1 - } - for _, n := range state.argNums { - if n >= maxArgNum { - maxArgNum = n + 1 - } - } } + // Dotdotdot is hard. if call.Ellipsis.IsValid() && maxArgNum >= len(call.Args)-1 { return @@ -592,6 +583,10 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string if maxArgNum != len(call.Args) { expect := maxArgNum - firstArg numArgs := len(call.Args) - firstArg + s := fmt.Sprintf("%s call needs %v but has %v", name, count(expect, "arg"), count(numArgs, "arg")) + if s == "fmt.Printf call needs 0 args but has 1 arg" { + s = "" + } pass.ReportRangef(call, "%s call needs %v but has %v", name, count(expect, "arg"), count(numArgs, "arg")) } } @@ -668,7 +663,7 @@ func (s *formatState) parseNum() { func (s *formatState) parsePrecision() error { // If there's a period, there may be a precision. if s.nbytes < len(s.format) && s.format[s.nbytes] == '.' { - s.flags = append(s.flags, '.') // Treat precision as a flag. + // s.flags = append(s.flags, '.') // Treat precision as a flag. s.nbytes++ if err := s.parseIndex(); err != nil { return err @@ -678,45 +673,6 @@ func (s *formatState) parsePrecision() error { return nil } -// Below are formatting directives definitions. -type formatPercent token.Pos -type formatLiteral struct { - literal string - rang posRange -} -type formatFlags struct { - flag string - rang posRange -} -type formatWidth struct { - width int - rang posRange -} -type formatPrec struct { - prec int - rang posRange -} -type formatVerb struct { - verb rune - rang posRange - operand ast.Expr // verb's corresponding operand, may be nil -} - -type posRange struct { - start, end token.Pos -} - -type formatItem interface { - formatItem() -} - -func (formatPercent) formatItem() {} -func (formatLiteral) formatItem() {} -func (formatVerb) formatItem() {} -func (formatWidth) formatItem() {} -func (formatFlags) formatItem() {} -func (formatPrec) formatItem() {} - // parsePrintfVerb looks the formatting directive that begins the format string // and returns a formatState that encodes what the directive wants, without looking // at the actual arguments present in the call. It returns the error description if parse fails. @@ -824,12 +780,13 @@ var printVerbs = []printVerb{ // okPrintfArg compares the formatState to the arguments actually present, // reporting any discrepancies it can discern. If the final argument is ellipsissed, // there's little it can do for that. -func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, name string, state *formatState) (ok bool) { +func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgNum *int, name string, state *fmtstr.FormatState) (ok bool) { + verb := state.Verb.Verb var v printVerb found := false // Linear scan is fast enough for a small list. for _, v = range printVerbs { - if v.verb == state.verb { + if v.verb == verb { found = true break } @@ -838,39 +795,56 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, name string, state *fo // Could current arg implement fmt.Formatter? // Skip check for the %w verb, which requires an error. formatter := false - if v.typ != argError && state.argNum < len(call.Args) { - if tv, ok := pass.TypesInfo.Types[call.Args[state.argNum]]; ok { + if v.typ != argError && state.Verb.ArgNum < len(call.Args) { + if tv, ok := pass.TypesInfo.Types[call.Args[state.Verb.ArgNum]]; ok { formatter = isFormatter(tv.Type) } } if !formatter { if !found { - pass.ReportRangef(call, "%s format %s has unknown verb %c", name, state.format, state.verb) + pass.ReportRangef(call, "%s format %s has unknown verb %c", name, state.Format, verb) return false } - for _, flag := range state.flags { + for _, flag := range state.Flags { // TODO: Disable complaint about '0' for Go 1.10. To be fixed properly in 1.11. // See issues 23598 and 23605. if flag == '0' { continue } if !strings.ContainsRune(v.flags, rune(flag)) { - pass.ReportRangef(call, "%s format %s has unrecognized flag %c", name, state.format, flag) + pass.ReportRangef(call, "%s format %s has unrecognized flag %c", name, state.Format, flag) return false } } } // Verb is good. If len(state.argNums)>trueArgs, we have something like %.*s and all // but the final arg must be an integer. + var argNums []int + if state.Width != nil && state.Width.ArgNum != -1 { + argNums = append(argNums, state.Width.ArgNum) + } + if state.Prec != nil && state.Prec.ArgNum != -1 { + argNums = append(argNums, state.Prec.ArgNum) + } + if state.Verb != nil && state.Verb.ArgNum != -1 && verb != '%' { + argNums = append(argNums, state.Verb.ArgNum) + } + + for _, n := range argNums { + if n >= *maxArgNum { + *maxArgNum = n + 1 + } + } + trueArgs := 1 - if state.verb == '%' { + if verb == '%' { trueArgs = 0 } - nargs := len(state.argNums) + nargs := len(argNums) for i := 0; i < nargs-trueArgs; i++ { - argNum := state.argNums[i] - if !argCanBeChecked(pass, call, i, state, name) { + argNum := argNums[i] + if !argCanBeChecked(pass, call, argNums[i], state, name) { return } arg := call.Args[argNum] @@ -879,21 +853,21 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, name string, state *fo if reason != "" { details = " (" + reason + ")" } - pass.ReportRangef(call, "%s format %s uses non-int %s%s as argument of *", name, state.format, analysisutil.Format(pass.Fset, arg), details) + pass.ReportRangef(call, "%s format %s uses non-int %s%s as argument of *", name, state.Format, analysisutil.Format(pass.Fset, arg), details) return false } } - if state.verb == '%' || formatter { + if verb == '%' || formatter { return true } - argNum := state.argNums[len(state.argNums)-1] - if !argCanBeChecked(pass, call, len(state.argNums)-1, state, name) { + argNum := argNums[len(argNums)-1] + if !argCanBeChecked(pass, call, argNums[len(argNums)-1], state, name) { return false } arg := call.Args[argNum] - if isFunctionValue(pass, arg) && state.verb != 'p' && state.verb != 'T' { - pass.ReportRangef(call, "%s format %s arg %s is a func value, not called", name, state.format, analysisutil.Format(pass.Fset, arg)) + if isFunctionValue(pass, arg) && verb != 'p' && verb != 'T' { + pass.ReportRangef(call, "%s format %s arg %s is a func value, not called", name, state.Format, analysisutil.Format(pass.Fset, arg)) return false } if reason, ok := matchArgType(pass, v.typ, arg); !ok { @@ -905,12 +879,12 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, name string, state *fo if reason != "" { details = " (" + reason + ")" } - pass.ReportRangef(call, "%s format %s has arg %s of wrong type %s%s", name, state.format, analysisutil.Format(pass.Fset, arg), typeString, details) + pass.ReportRangef(call, "%s format %s has arg %s of wrong type %s%s", name, state.Format, analysisutil.Format(pass.Fset, arg), typeString, details) return false } - if v.typ&argString != 0 && v.verb != 'T' && !bytes.Contains(state.flags, []byte{'#'}) { + if v.typ&argString != 0 && v.verb != 'T' && !bytes.Contains(state.Flags, []byte{'#'}) { if methodName, ok := recursiveStringer(pass, arg); ok { - pass.ReportRangef(call, "%s format %s with arg %s causes recursive %s method call", name, state.format, analysisutil.Format(pass.Fset, arg), methodName) + pass.ReportRangef(call, "%s format %s with arg %s causes recursive %s method call", name, state.Format, analysisutil.Format(pass.Fset, arg), methodName) return false } } @@ -994,8 +968,7 @@ func isFunctionValue(pass *analysis.Pass, e ast.Expr) bool { // argCanBeChecked reports whether the specified argument is statically present; // it may be beyond the list of arguments or in a terminal slice... argument, which // means we can't see it. -func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, formatArg int, state *formatState, name string) bool { - argNum := state.argNums[formatArg] +func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, argNum int, state *fmtstr.FormatState, name string) bool { if argNum <= 0 { // Shouldn't happen, so catch it with prejudice. panic("negative arg num") @@ -1011,8 +984,14 @@ func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, formatArg int, sta } // There are bad indexes in the format or there are fewer arguments than the format needs. // This is the argument number relative to the format: Printf("%s", "hi") will give 1 for the "hi". - arg := argNum - state.firstArg + 1 // People think of arguments as 1-indexed. - pass.ReportRangef(call, "%s format %s reads arg #%d, but call has %v", name, state.format, arg, count(len(call.Args)-state.firstArg, "arg")) + arg := argNum - state.FirstArg + 1 // People think of arguments as 1-indexed. + // fmt.Printf format %*% reads arg #2, but call has 1 arg + s := fmt.Sprintf("%s format %s reads arg #%d, but call has %v", name, state.Format, arg, count(len(call.Args)-state.FirstArg, "arg")) + if s == "fmt.Printf format %*% reads arg #2, but call has 1 arg" { + z := 1 + _ = z + } + pass.ReportRangef(call, "%s format %s reads arg #%d, but call has %v", name, state.Format, arg, count(len(call.Args)-state.FirstArg, "arg")) return false } diff --git a/internal/fmtstr/parse.go b/internal/fmtstr/parse.go new file mode 100644 index 00000000000..f835e95be19 --- /dev/null +++ b/internal/fmtstr/parse.go @@ -0,0 +1,438 @@ +// Copyright 2010 The Go Authors. All rights reserved. +// Use of this source code is governed by a BSD-style +// license that can be found in the LICENSE file. + +package fmtstr + +import ( + _ "embed" + "fmt" + "go/ast" + "go/constant" + "go/types" + "strconv" + "strings" + "unicode/utf8" + // "golang.org/x/tools/go/analysis/passes/internal/analysisutil" +) + +// ParsePrintf checks a call to a formatted print routine such as Printf. +// func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string) { +func ParsePrintf(info *types.Info, call *ast.CallExpr, name string) ([]*FormatState, error) { + idx := formatStringIndex(info, call) + if idx < 0 || idx >= len(call.Args) { + return nil, fmt.Errorf("%s", "can't parse") + } + formatArg := call.Args[idx] + format, ok := stringConstantExpr(info, formatArg) + if !ok { + return nil, fmt.Errorf("non-constant format string in call to %s", name) + } + firstArg := idx + 1 // Arguments are immediately after format string. + if !strings.Contains(format, "%") { + return nil, fmt.Errorf("%s call has arguments but no formatting directives", name) + } + // Hard part: check formats against args. + argNum := firstArg + var states []*FormatState + for i, w := 0, 0; i < len(format); i += w { + w = 1 + if format[i] != '%' { + continue + } + state, err := parsePrintfVerb(call, format[i:], firstArg, argNum) + if err != nil { + return nil, fmt.Errorf("%s %s", name, err.Error()) + } + + state.AddRange(i) + states = append(states, state) + + w = len(state.Format) + if len(state.argNums) > 0 { + // Continue with the next sequential argument. + argNum = state.argNums[len(state.argNums)-1] + 1 + } + } + return states, nil +} + +// formatStringIndex returns the index of the format string (the last +// non-variadic parameter) within the given printf-like call +// expression, or -1 if unknown. +func formatStringIndex(info *types.Info, call *ast.CallExpr) int { + typ := info.Types[call.Fun].Type + if typ == nil { + return -1 // missing type + } + sig, ok := typ.(*types.Signature) + if !ok { + return -1 // ill-typed + } + if !sig.Variadic() { + // Skip checking non-variadic functions. + return -1 + } + idx := sig.Params().Len() - 2 + if idx < 0 { + // Skip checking variadic functions without + // fixed arguments. + return -1 + } + return idx +} + +// stringConstantExpr returns expression's string constant value. +// +// ("", false) is returned if expression isn't a string +// constant. +func stringConstantExpr(info *types.Info, expr ast.Expr) (string, bool) { + lit := info.Types[expr].Value + if lit != nil && lit.Kind() == constant.String { + return constant.StringVal(lit), true + } + return "", false +} + +// FormatState holds the parsed representation of a printf directive such as "%3.*[4]d". +// It is constructed by parsePrintfVerb. +type FormatState struct { + Format string // the full format directive from % through verb, "%.3d". + Flags []byte // the list of # + etc. + Width *DirectiveSize // format width: '3' for "%3d", if any. + Prec *DirectiveSize // format precision: '4' for "%.4d", if any. + Verb *DirectiveVerb // format verb: 'd' for "%d" + Range posRange + FirstArg int // Index of first argument after the format in the Printf call. + // Used only during parse. + call *ast.CallExpr + argNums []int // the successive argument numbers that are consumed, adjusted to refer to actual arg in call + argNum int // Which argument we're expecting to format now. + hasIndex bool // Whether the argument is indexed. + index int + indexPos int + indexPending bool // Whether we have an indexed argument that has not resolved. + nbytes int // number of bytes of the format string consumed. +} + +func (s *FormatState) AddRange(parsedLen int) { + if s.Verb != nil { + s.Verb.Range.Start += parsedLen + s.Verb.Range.End += parsedLen + + s.Range.Start = parsedLen + s.Range.End = s.Verb.Range.End + } + if s.Prec != nil { + s.Prec.Range.Start += parsedLen + s.Prec.Range.End += parsedLen + } + if s.Width != nil { + s.Width.Range.Start += parsedLen + s.Width.Range.End += parsedLen + } +} + +// parseFlags accepts any printf flags. +func (s *FormatState) parseFlags() { + for s.nbytes < len(s.Format) { + switch c := s.Format[s.nbytes]; c { + case '#', '0', '+', '-', ' ': + s.Flags = append(s.Flags, c) + s.nbytes++ + default: + return + } + } +} + +// scanNum advances through a decimal number for [Size] or [Index] if present. +func (s *FormatState) scanNum() (int, bool) { + start := s.nbytes + for ; s.nbytes < len(s.Format); s.nbytes++ { + c := s.Format[s.nbytes] + if c < '0' || '9' < c { + if start < s.nbytes { + num, _ := strconv.ParseInt(s.Format[start:s.nbytes], 10, 32) + return int(num), true + // switch kind { + // case Size: + // s.Prec = &DirectiveSize{ + // Kind: Literal, + // Size: int(num), + // Range: posRange{ + // // Include the leading '.'. + // Start: start - 1, + // End: s.nbytes, + // }, + // Index: 0, + // ArgIndex: -1, + // } + // case Index: + // // Later consumed/stored by a '*' or verb. + // s.index = int(num) + // s.indexPos = start - 1 + // } + } else { + return 0, false + } + } + } + return 0, false +} + +// parseIndex scans an index expression. It returns false if there is a syntax error. +func (s *FormatState) parseIndex() error { + if s.nbytes == len(s.Format) || s.Format[s.nbytes] != '[' { + return nil + } + // Argument index present. + s.nbytes++ // skip '[' + start := s.nbytes + if num, ok := s.scanNum(); ok { + // Later consumed/stored by a '*' or verb. + s.index = num + s.indexPos = start - 1 + } + ok := true + if s.nbytes == len(s.Format) || s.nbytes == start || s.Format[s.nbytes] != ']' { + ok = false // syntax error is either missing "]" or invalid index. + s.nbytes = strings.Index(s.Format[start:], "]") + if s.nbytes < 0 { + return fmt.Errorf("format %s is missing closing ]", s.Format) + } + s.nbytes = s.nbytes + start + } + arg32, err := strconv.ParseInt(s.Format[start:s.nbytes], 10, 32) + if err != nil || !ok || arg32 <= 0 || arg32 > int64(len(s.call.Args)-s.FirstArg) { + return fmt.Errorf("format has invalid argument index [%s]", s.Format[start:s.nbytes]) + } + s.nbytes++ // skip ']' + arg := int(arg32) + arg += s.FirstArg - 1 // We want to zero-index the actual arguments. + s.argNum = arg + s.hasIndex = true + s.indexPending = true + return nil +} + +// parseNum scans precision (or *). +func (s *FormatState) parseSize(kind sizeType) { + if s.nbytes < len(s.Format) && s.Format[s.nbytes] == '*' { + s.nbytes++ + if s.indexPending { + // Absorb it. + s.indexPending = false + size := &DirectiveSize{ + Kind: IndexedStar, + Size: -1, + Range: posRange{ + Start: s.indexPos, + End: s.nbytes, + }, + Index: s.index, + ArgNum: s.argNum, + } + switch kind { + case Width: + s.Width = size + case Precision: + // Include the leading '.'. + size.Range.Start -= 1 + s.Prec = size + default: + panic(kind) + } + } else { + // A single '*', only Operand has a meaning. + size := &DirectiveSize{ + Kind: Star, + Size: -1, + Range: posRange{ + Start: s.nbytes - 1, + End: s.nbytes, + }, + Index: -1, + ArgNum: s.argNum, + } + switch kind { + case Width: + s.Width = size + case Precision: + // Include the leading '.'. + size.Range.Start -= 1 + s.Prec = size + default: + panic(kind) + } + } + s.argNums = append(s.argNums, s.argNum) + s.argNum++ + } else { + start := s.nbytes + if num, ok := s.scanNum(); ok { + size := &DirectiveSize{ + Kind: Literal, + Size: num, + Range: posRange{ + Start: start, + End: s.nbytes, + }, + Index: -1, + ArgNum: -1, + } + switch kind { + case Width: + s.Width = size + case Precision: + // Include the leading '.'. + size.Range.Start -= 1 + s.Prec = size + default: + panic(kind) + } + } + } +} + +type sizeType int + +const ( + Width sizeType = iota + Precision +) + +// parsePrecision scans for a precision. It returns false if there's a bad index expression. +func (s *FormatState) parsePrecision() error { + // If there's a period, there may be a precision. + if s.nbytes < len(s.Format) && s.Format[s.nbytes] == '.' { + // s.Flags = append(s.Flags, '.') // Treat precision as a flag. + s.nbytes++ + if err := s.parseIndex(); err != nil { + return err + } + s.parseSize(Precision) + } + return nil +} + +type formatDirective struct { + Verb DirectiveVerb + Range posRange + Format string // the full format directive from % through verb, "%.3d". + Flags []byte // the list of # + etc. + Width *DirectiveSize // format width: '3' for "%3d", if any. + Prec *DirectiveSize // format precision: '4' for "%.4d", if any. +} + +type SizeKind int + +const ( + Literal SizeKind = iota // %4d + Star // %*d + IndexedStar // %[2]*d +) + +type DirectiveSize struct { + Kind SizeKind + Range posRange + Size int // used if Kind == PrecLiteral, or -1 + Index int // used if Kind == PrecIndexedStar, or -1 + ArgNum int // used if Kind == PrecStar or PrecIndexedStar, otherwise -1 +} + +type DirectiveOperand struct { + Arg ast.Expr + Index int +} + +type DirectiveVerb struct { + Verb rune + Range posRange + Index int + ArgNum int // verb's corresponding operand, may be nil +} + +type posRange struct { + Start, End int +} + +// parsePrintfVerb looks the formatting directive that begins the format string +// and returns a formatState that encodes what the directive wants, without looking +// at the actual arguments present in the call. It returns the error description if parse fails. +func parsePrintfVerb(call *ast.CallExpr, format string, firstArg, argNum int) (*FormatState, error) { + state := &FormatState{ + Format: format, + Flags: make([]byte, 0, 5), + argNums: make([]int, 0, 1), + FirstArg: firstArg, + call: call, + argNum: argNum, + hasIndex: false, + index: 0, + indexPos: 0, + indexPending: false, + nbytes: 1, // There's guaranteed to be a percent sign. + } + // There may be flags. + state.parseFlags() + // There may be an index. + if err := state.parseIndex(); err != nil { + return nil, err + } + // There may be a width. + state.parseSize(Width) + // There may be a precision. + if err := state.parsePrecision(); err != nil { + return nil, err + } + // Now a verb, possibly prefixed by an index (which we may already have). + if !state.indexPending { + if err := state.parseIndex(); err != nil { + return nil, err + } + } + if state.nbytes == len(state.Format) { + return nil, fmt.Errorf("format %s is missing verb at end of string", state.Format) + } + verb, w := utf8.DecodeRuneInString(state.Format[state.nbytes:]) + + // Collect verb. + if state.indexPending { + state.Verb = &DirectiveVerb{ + Verb: verb, + Range: posRange{ + Start: state.indexPos, + End: state.nbytes + w, + }, + Index: state.index, + ArgNum: state.argNum, + } + } else { + state.Verb = &DirectiveVerb{ + Verb: verb, + Range: posRange{ + Start: state.nbytes, + End: state.nbytes + w, + }, + Index: -1, + ArgNum: state.argNum, + } + } + + // state.verb = verb + state.nbytes += w + if verb != '%' { + state.argNums = append(state.argNums, state.argNum) + } + state.Format = state.Format[:state.nbytes] + return state, nil +} + +func cond[T any](cond bool, t, f T) T { + if cond { + return t + } else { + return f + } +} From ab1baeed4a38e22166e687ab75f4ee2de60ed8a7 Mon Sep 17 00:00:00 2001 From: xzb <2598514867@qq.com> Date: Tue, 17 Dec 2024 02:14:34 +0800 Subject: [PATCH 05/14] cleanup --- go/analysis/passes/printf/printf.go | 252 +++---------------- internal/fmtstr/parse.go | 373 +++++++++++++--------------- 2 files changed, 202 insertions(+), 423 deletions(-) diff --git a/go/analysis/passes/printf/printf.go b/go/analysis/passes/printf/printf.go index 14ee44a26bd..492ceb5d117 100644 --- a/go/analysis/passes/printf/printf.go +++ b/go/analysis/passes/printf/printf.go @@ -9,15 +9,12 @@ import ( _ "embed" "fmt" "go/ast" - "go/constant" "go/token" "go/types" "reflect" "regexp" "sort" - "strconv" "strings" - "unicode/utf8" "golang.org/x/tools/go/analysis" "golang.org/x/tools/go/analysis/passes/inspect" @@ -374,43 +371,6 @@ var isPrint = stringSet{ "(testing.TB).Skipf": true, } -// formatStringIndex returns the index of the format string (the last -// non-variadic parameter) within the given printf-like call -// expression, or -1 if unknown. -func formatStringIndex(info *types.Info, call *ast.CallExpr) int { - typ := info.Types[call.Fun].Type - if typ == nil { - return -1 // missing type - } - sig, ok := typ.(*types.Signature) - if !ok { - return -1 // ill-typed - } - if !sig.Variadic() { - // Skip checking non-variadic functions. - return -1 - } - idx := sig.Params().Len() - 2 - if idx < 0 { - // Skip checking variadic functions without - // fixed arguments. - return -1 - } - return idx -} - -// stringConstantExpr returns expression's string constant value. -// -// ("", false) is returned if expression isn't a string -// constant. -func stringConstantExpr(info *types.Info, expr ast.Expr) (string, bool) { - lit := info.Types[expr].Value - if lit != nil && lit.Kind() == constant.String { - return constant.StringVal(lit), true - } - return "", false -} - // checkCall triggers the print-specific checks if the call invokes a print function. func checkCall(pass *analysis.Pass) { inspect := pass.ResultOf[inspect.Analyzer].(*inspector.Inspector) @@ -486,30 +446,14 @@ func isFormatter(typ types.Type) bool { types.Identical(sig.Params().At(1).Type(), types.Typ[types.Rune]) } -// formatState holds the parsed representation of a printf directive such as "%3.*[4]d". -// It is constructed by parsePrintfVerb. -type formatState struct { - verb rune // the format verb: 'd' for "%d" - format string // the full format directive from % through verb, "%.3d". - flags []byte // the list of # + etc. - argNums []int // the successive argument numbers that are consumed, adjusted to refer to actual arg in call - firstArg int // Index of first argument after the format in the Printf call. - // Used only during parse. - call *ast.CallExpr - argNum int // Which argument we're expecting to format now. - hasIndex bool // Whether the argument is indexed. - indexPending bool // Whether we have an indexed argument that has not resolved. - nbytes int // number of bytes of the format string consumed. -} - // checkPrintf checks a call to a formatted print routine such as Printf. func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string) { - idx := formatStringIndex(pass.TypesInfo, call) + idx := fmtstr.FormatStringIndex(pass.TypesInfo, call) if idx < 0 || idx >= len(call.Args) { return } formatArg := call.Args[idx] - format, ok := stringConstantExpr(pass.TypesInfo, formatArg) + format, ok := fmtstr.StringConstantExpr(pass.TypesInfo, formatArg) if !ok { // Format string argument is non-constant. @@ -536,23 +480,22 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string return } - var anyIndex bool - var firstArg int - firstArg = idx + 1 // Arguments are immediately after format string. - maxArgNum := firstArg + firstArg := idx + 1 // Arguments are immediately after format string. if !strings.Contains(format, "%") { if len(call.Args) > firstArg { pass.Reportf(call.Lparen, "%s call has arguments but no formatting directives", name) } return } - // Hard part: check formats against args. - states, err := fmtstr.ParsePrintf(pass.TypesInfo, call, name) + // Check formats against args. + states, err := fmtstr.ParsePrintf(pass.TypesInfo, call) if err != nil { pass.ReportRangef(call.Fun, "%s %s", name, err.Error()) return } + maxArgNum := firstArg + anyIndex := false for _, state := range states { if (state.Prec != nil && state.Prec.Index != -1) || (state.Width != nil && state.Width.Index != -1) || @@ -570,7 +513,6 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string } } } - // Dotdotdot is hard. if call.Ellipsis.IsValid() && maxArgNum >= len(call.Args)-1 { return @@ -583,140 +525,10 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string if maxArgNum != len(call.Args) { expect := maxArgNum - firstArg numArgs := len(call.Args) - firstArg - s := fmt.Sprintf("%s call needs %v but has %v", name, count(expect, "arg"), count(numArgs, "arg")) - if s == "fmt.Printf call needs 0 args but has 1 arg" { - s = "" - } pass.ReportRangef(call, "%s call needs %v but has %v", name, count(expect, "arg"), count(numArgs, "arg")) } } -// parseFlags accepts any printf flags. -func (s *formatState) parseFlags() { - for s.nbytes < len(s.format) { - switch c := s.format[s.nbytes]; c { - case '#', '0', '+', '-', ' ': - s.flags = append(s.flags, c) - s.nbytes++ - default: - return - } - } -} - -// scanNum advances through a decimal number if present. -func (s *formatState) scanNum() { - for ; s.nbytes < len(s.format); s.nbytes++ { - c := s.format[s.nbytes] - if c < '0' || '9' < c { - return - } - } -} - -// parseIndex scans an index expression. It returns false if there is a syntax error. -func (s *formatState) parseIndex() error { - if s.nbytes == len(s.format) || s.format[s.nbytes] != '[' { - return nil - } - // Argument index present. - s.nbytes++ // skip '[' - start := s.nbytes - s.scanNum() - ok := true - if s.nbytes == len(s.format) || s.nbytes == start || s.format[s.nbytes] != ']' { - ok = false // syntax error is either missing "]" or invalid index. - s.nbytes = strings.Index(s.format[start:], "]") - if s.nbytes < 0 { - return fmt.Errorf("format %s is missing closing ]", s.format) - } - s.nbytes = s.nbytes + start - } - arg32, err := strconv.ParseInt(s.format[start:s.nbytes], 10, 32) - if err != nil || !ok || arg32 <= 0 || arg32 > int64(len(s.call.Args)-s.firstArg) { - return fmt.Errorf("format has invalid argument index [%s]", s.format[start:s.nbytes]) - } - s.nbytes++ // skip ']' - arg := int(arg32) - arg += s.firstArg - 1 // We want to zero-index the actual arguments. - s.argNum = arg - s.hasIndex = true - s.indexPending = true - return nil -} - -// parseNum scans a width or precision (or *). -func (s *formatState) parseNum() { - if s.nbytes < len(s.format) && s.format[s.nbytes] == '*' { - if s.indexPending { // Absorb it. - s.indexPending = false - } - s.nbytes++ - s.argNums = append(s.argNums, s.argNum) - s.argNum++ - } else { - s.scanNum() - } -} - -// parsePrecision scans for a precision. It returns false if there's a bad index expression. -func (s *formatState) parsePrecision() error { - // If there's a period, there may be a precision. - if s.nbytes < len(s.format) && s.format[s.nbytes] == '.' { - // s.flags = append(s.flags, '.') // Treat precision as a flag. - s.nbytes++ - if err := s.parseIndex(); err != nil { - return err - } - s.parseNum() - } - return nil -} - -// parsePrintfVerb looks the formatting directive that begins the format string -// and returns a formatState that encodes what the directive wants, without looking -// at the actual arguments present in the call. It returns the error description if parse fails. -func parsePrintfVerb(call *ast.CallExpr, format string, firstArg, argNum int) (*formatState, error) { - state := &formatState{ - format: format, - flags: make([]byte, 0, 5), - argNum: argNum, - argNums: make([]int, 0, 1), - nbytes: 1, // There's guaranteed to be a percent sign. - firstArg: firstArg, - call: call, - } - // There may be flags. - state.parseFlags() - // There may be an index. - if err := state.parseIndex(); err != nil { - return nil, err - } - // There may be a width. - state.parseNum() - // There may be a precision. - if err := state.parsePrecision(); err != nil { - return nil, err - } - // Now a verb, possibly prefixed by an index (which we may already have). - if !state.indexPending { - if err := state.parseIndex(); err != nil { - return nil, err - } - } - if state.nbytes == len(state.format) { - return nil, fmt.Errorf("format %s is missing verb at end of string", state.format) - } - verb, w := utf8.DecodeRuneInString(state.format[state.nbytes:]) - state.verb = verb - state.nbytes += w - if verb != '%' { - state.argNums = append(state.argNums, state.argNum) - } - state.format = state.format[:state.nbytes] - return state, nil -} - // printfArgType encodes the types of expressions a printf verb accepts. It is a bitmask. type printfArgType int @@ -777,10 +589,10 @@ var printVerbs = []printVerb{ {'X', sharpNumFlag, argRune | argInt | argString | argPointer | argFloat | argComplex}, } -// okPrintfArg compares the formatState to the arguments actually present, +// okPrintfArg compares the FormatDirective to the arguments actually present, // reporting any discrepancies it can discern. If the final argument is ellipsissed, // there's little it can do for that. -func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgNum *int, name string, state *fmtstr.FormatState) (ok bool) { +func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgNum *int, name string, state *fmtstr.FormatDirective) (ok bool) { verb := state.Verb.Verb var v printVerb found := false @@ -792,7 +604,7 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgNum *int, name s } } - // Could current arg implement fmt.Formatter? + // Could verb's arg implement fmt.Formatter? // Skip check for the %w verb, which requires an error. formatter := false if v.typ != argError && state.Verb.ArgNum < len(call.Args) { @@ -818,8 +630,6 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgNum *int, name s } } } - // Verb is good. If len(state.argNums)>trueArgs, we have something like %.*s and all - // but the final arg must be an integer. var argNums []int if state.Width != nil && state.Width.ArgNum != -1 { argNums = append(argNums, state.Width.ArgNum) @@ -827,22 +637,10 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgNum *int, name s if state.Prec != nil && state.Prec.ArgNum != -1 { argNums = append(argNums, state.Prec.ArgNum) } - if state.Verb != nil && state.Verb.ArgNum != -1 && verb != '%' { - argNums = append(argNums, state.Verb.ArgNum) - } - for _, n := range argNums { - if n >= *maxArgNum { - *maxArgNum = n + 1 - } - } - - trueArgs := 1 - if verb == '%' { - trueArgs = 0 - } - nargs := len(argNums) - for i := 0; i < nargs-trueArgs; i++ { + // Verb is good. If len(argNums)>0, we have something like %.*s and all + // args in argNums must be an integer. + for i := 0; i < len(argNums); i++ { argNum := argNums[i] if !argCanBeChecked(pass, call, argNums[i], state, name) { return @@ -858,9 +656,21 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgNum *int, name s } } + // Collect to conveniently update maxArgNum. + if state.Verb != nil && state.Verb.ArgNum != -1 && verb != '%' { + argNums = append(argNums, state.Verb.ArgNum) + } + for _, n := range argNums { + if n >= *maxArgNum { + *maxArgNum = n + 1 + } + } + if verb == '%' || formatter { return true } + + // Now check verb's type. argNum := argNums[len(argNums)-1] if !argCanBeChecked(pass, call, argNums[len(argNums)-1], state, name) { return false @@ -968,7 +778,7 @@ func isFunctionValue(pass *analysis.Pass, e ast.Expr) bool { // argCanBeChecked reports whether the specified argument is statically present; // it may be beyond the list of arguments or in a terminal slice... argument, which // means we can't see it. -func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, argNum int, state *fmtstr.FormatState, name string) bool { +func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, argNum int, state *fmtstr.FormatDirective, name string) bool { if argNum <= 0 { // Shouldn't happen, so catch it with prejudice. panic("negative arg num") @@ -985,12 +795,6 @@ func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, argNum int, state // There are bad indexes in the format or there are fewer arguments than the format needs. // This is the argument number relative to the format: Printf("%s", "hi") will give 1 for the "hi". arg := argNum - state.FirstArg + 1 // People think of arguments as 1-indexed. - // fmt.Printf format %*% reads arg #2, but call has 1 arg - s := fmt.Sprintf("%s format %s reads arg #%d, but call has %v", name, state.Format, arg, count(len(call.Args)-state.FirstArg, "arg")) - if s == "fmt.Printf format %*% reads arg #2, but call has 1 arg" { - z := 1 - _ = z - } pass.ReportRangef(call, "%s format %s reads arg #%d, but call has %v", name, state.Format, arg, count(len(call.Args)-state.FirstArg, "arg")) return false } @@ -1049,7 +853,7 @@ func checkPrint(pass *analysis.Pass, call *ast.CallExpr, name string) { } arg := args[0] - if s, ok := stringConstantExpr(pass.TypesInfo, arg); ok { + if s, ok := fmtstr.StringConstantExpr(pass.TypesInfo, arg); ok { // Ignore trailing % character // The % in "abc 0.0%" couldn't be a formatting directive. s = strings.TrimSuffix(s, "%") @@ -1063,7 +867,7 @@ func checkPrint(pass *analysis.Pass, call *ast.CallExpr, name string) { if strings.HasSuffix(name, "ln") { // The last item, if a string, should not have a newline. arg = args[len(args)-1] - if s, ok := stringConstantExpr(pass.TypesInfo, arg); ok { + if s, ok := fmtstr.StringConstantExpr(pass.TypesInfo, arg); ok { if strings.HasSuffix(s, "\n") { pass.ReportRangef(call, "%s arg list ends with redundant newline", name) } diff --git a/internal/fmtstr/parse.go b/internal/fmtstr/parse.go index f835e95be19..92c46423c02 100644 --- a/internal/fmtstr/parse.go +++ b/internal/fmtstr/parse.go @@ -16,25 +16,31 @@ import ( // "golang.org/x/tools/go/analysis/passes/internal/analysisutil" ) -// ParsePrintf checks a call to a formatted print routine such as Printf. -// func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string) { -func ParsePrintf(info *types.Info, call *ast.CallExpr, name string) ([]*FormatState, error) { - idx := formatStringIndex(info, call) +// ParsePrintf takes a printf-like call expression, +// extracts the format string, and parses out all format directives. Each +// directive describes flags, width, precision, verb, and argument indexing. +// This function returns a slice of parsed FormatDirective objects or an error +// if parsing fails. It does not perform any validation of flags, verbs, and +// existence of corresponding argument. +// +// Typical use case: Validate arguments passed to a Printf-like function call, +// DocumentHighlight, Hover, or SemanticHighlight. +func ParsePrintf(info *types.Info, call *ast.CallExpr) ([]*FormatDirective, error) { + idx := FormatStringIndex(info, call) if idx < 0 || idx >= len(call.Args) { return nil, fmt.Errorf("%s", "can't parse") } - formatArg := call.Args[idx] - format, ok := stringConstantExpr(info, formatArg) + format, ok := StringConstantExpr(info, call.Args[idx]) if !ok { - return nil, fmt.Errorf("non-constant format string in call to %s", name) + return nil, fmt.Errorf("non-constant format string") } - firstArg := idx + 1 // Arguments are immediately after format string. if !strings.Contains(format, "%") { - return nil, fmt.Errorf("%s call has arguments but no formatting directives", name) + return nil, fmt.Errorf("call has arguments but no formatting directives") } - // Hard part: check formats against args. + + firstArg := idx + 1 // Arguments are immediately after format string. argNum := firstArg - var states []*FormatState + var states []*FormatDirective for i, w := 0, 0; i < len(format); i += w { w = 1 if format[i] != '%' { @@ -42,25 +48,95 @@ func ParsePrintf(info *types.Info, call *ast.CallExpr, name string) ([]*FormatSt } state, err := parsePrintfVerb(call, format[i:], firstArg, argNum) if err != nil { - return nil, fmt.Errorf("%s %s", name, err.Error()) + return nil, err } - state.AddRange(i) + state.addRange(i) states = append(states, state) w = len(state.Format) - if len(state.argNums) > 0 { - // Continue with the next sequential argument. - argNum = state.argNums[len(state.argNums)-1] + 1 + // Do not waste an augument for '%'. + if state.Verb.Verb != '%' { + argNum = state.argNum + 1 } } return states, nil } -// formatStringIndex returns the index of the format string (the last +// parsePrintfVerb parses one format directive starting at the given substring `format`, +// which should begin with '%'. It returns a fully populated FormatDirective or an error +// if the directive is malformed. The firstArg and argNum parameters help determine how +// arguments map to this directive. +// +// Parse sequence: '%' -> flags? -> index? -> width(*)? -> '.'? -> index? -> precision(*)? -> index? -> verb. +func parsePrintfVerb(call *ast.CallExpr, format string, firstArg, argNum int) (*FormatDirective, error) { + state := &FormatDirective{ + Format: format, + Flags: make([]byte, 0, 5), + FirstArg: firstArg, + call: call, + argNum: argNum, + hasIndex: false, + index: 0, + indexPos: 0, + indexPending: false, + nbytes: 1, // There's guaranteed to be a percent sign. + } + // There may be flags. + state.parseFlags() + // There may be an index. + if err := state.parseIndex(); err != nil { + return nil, err + } + // There may be a width. + state.parseSize(Width) + // There may be a precision. + if err := state.parsePrecision(); err != nil { + return nil, err + } + // Now a verb, possibly prefixed by an index (which we may already have). + if !state.indexPending { + if err := state.parseIndex(); err != nil { + return nil, err + } + } + if state.nbytes == len(state.Format) { + return nil, fmt.Errorf("format %s is missing verb at end of string", state.Format) + } + verb, w := utf8.DecodeRuneInString(state.Format[state.nbytes:]) + + // Ensure there msut be a verb. + if state.indexPending { + state.Verb = &DirectiveVerb{ + Verb: verb, + Range: posRange{ + Start: state.indexPos, + End: state.nbytes + w, + }, + Index: state.index, + ArgNum: state.argNum, + } + } else { + state.Verb = &DirectiveVerb{ + Verb: verb, + Range: posRange{ + Start: state.nbytes, + End: state.nbytes + w, + }, + Index: -1, + ArgNum: state.argNum, + } + } + + state.nbytes += w + state.Format = state.Format[:state.nbytes] + return state, nil +} + +// FormatStringIndex returns the index of the format string (the last // non-variadic parameter) within the given printf-like call // expression, or -1 if unknown. -func formatStringIndex(info *types.Info, call *ast.CallExpr) int { +func FormatStringIndex(info *types.Info, call *ast.CallExpr) int { typ := info.Types[call.Fun].Type if typ == nil { return -1 // missing type @@ -82,11 +158,10 @@ func formatStringIndex(info *types.Info, call *ast.CallExpr) int { return idx } -// stringConstantExpr returns expression's string constant value. +// StringConstantExpr returns expression's string constant value. // -// ("", false) is returned if expression isn't a string -// constant. -func stringConstantExpr(info *types.Info, expr ast.Expr) (string, bool) { +// ("", false) is returned if expression isn't a string constant. +func StringConstantExpr(info *types.Info, expr ast.Expr) (string, bool) { lit := info.Types[expr].Value if lit != nil && lit.Kind() == constant.String { return constant.StringVal(lit), true @@ -94,28 +169,62 @@ func stringConstantExpr(info *types.Info, expr ast.Expr) (string, bool) { return "", false } -// FormatState holds the parsed representation of a printf directive such as "%3.*[4]d". -// It is constructed by parsePrintfVerb. -type FormatState struct { - Format string // the full format directive from % through verb, "%.3d". - Flags []byte // the list of # + etc. - Width *DirectiveSize // format width: '3' for "%3d", if any. - Prec *DirectiveSize // format precision: '4' for "%.4d", if any. - Verb *DirectiveVerb // format verb: 'd' for "%d" - Range posRange - FirstArg int // Index of first argument after the format in the Printf call. - // Used only during parse. +// FormatDirective holds the parsed representation of a printf directive such as "%3.*[4]d". +// It is constructed by [ParsePrintf]. +type FormatDirective struct { + Format string // Full directive, e.g. "%[2]*.3d" + Range posRange // The range of Format within the overall format string + FirstArg int // Index of the first argument after the format string + Flags []byte // Formatting flags, e.g. ['-', '0'] + Width *DirectiveSize // Width specifier, if any (e.g., '3' in '%3d') + Prec *DirectiveSize // Precision specifier, if any (e.g., '.4' in '%.4f') + Verb *DirectiveVerb // Verb specifier, if any (e.g., '[1]d' in '%[1]d') + + // Parsing state (not used after parsing): call *ast.CallExpr - argNums []int // the successive argument numbers that are consumed, adjusted to refer to actual arg in call - argNum int // Which argument we're expecting to format now. - hasIndex bool // Whether the argument is indexed. + argNum int + hasIndex bool index int indexPos int - indexPending bool // Whether we have an indexed argument that has not resolved. - nbytes int // number of bytes of the format string consumed. + indexPending bool + nbytes int +} + +// Type of size specifier encountered for width or precision. +type SizeKind int + +const ( + Literal SizeKind = iota // A literal number, e.g. "4" in "%4d" + Star // A dynamic size from an argument, e.g. "%*d" + IndexedStar // A dynamic size with an explicit index, e.g. "%[2]*d" +) + +// DirectiveSize describes a width or precision in a format directive. +// Depending on Kind, it may represent a literal number, a star, or an indexed star. +type DirectiveSize struct { + Kind SizeKind // Type of size specifier + Range posRange // Position of the size specifier within the directive + Size int // The literal size if Kind == Literal, otherwise -1 + Index int // If Kind == IndexedStar, the argument index used to obtain the size + ArgNum int // The argument position if Kind == Star or IndexedStar, relative to CallExpr. } -func (s *FormatState) AddRange(parsedLen int) { +// DirectiveVerb represents the verb character of a format directive (e.g., 'd', 's', 'f'). +// It also includes positional information and any explicit argument indexing. +type DirectiveVerb struct { + Verb rune + Range posRange // The positional range of the verb in the format string + Index int // If the verb uses an indexed argument, this is the index, otherwise -1 + ArgNum int // The argument position associated with this verb, relative to CallExpr. +} + +type posRange struct { + Start, End int +} + +// addRange adjusts the recorded positions in Verb, Width, Prec, and the +// directive's overall Range to be relative to the position in the full format string. +func (s *FormatDirective) addRange(parsedLen int) { if s.Verb != nil { s.Verb.Range.Start += parsedLen s.Verb.Range.End += parsedLen @@ -134,7 +243,7 @@ func (s *FormatState) AddRange(parsedLen int) { } // parseFlags accepts any printf flags. -func (s *FormatState) parseFlags() { +func (s *FormatDirective) parseFlags() { for s.nbytes < len(s.Format) { switch c := s.Format[s.nbytes]; c { case '#', '0', '+', '-', ' ': @@ -146,8 +255,8 @@ func (s *FormatState) parseFlags() { } } -// scanNum advances through a decimal number for [Size] or [Index] if present. -func (s *FormatState) scanNum() (int, bool) { +// scanNum advances through a decimal number if present, which represents a [Size] or [Index]. +func (s *FormatDirective) scanNum() (int, bool) { start := s.nbytes for ; s.nbytes < len(s.Format); s.nbytes++ { c := s.Format[s.nbytes] @@ -155,24 +264,6 @@ func (s *FormatState) scanNum() (int, bool) { if start < s.nbytes { num, _ := strconv.ParseInt(s.Format[start:s.nbytes], 10, 32) return int(num), true - // switch kind { - // case Size: - // s.Prec = &DirectiveSize{ - // Kind: Literal, - // Size: int(num), - // Range: posRange{ - // // Include the leading '.'. - // Start: start - 1, - // End: s.nbytes, - // }, - // Index: 0, - // ArgIndex: -1, - // } - // case Index: - // // Later consumed/stored by a '*' or verb. - // s.index = int(num) - // s.indexPos = start - 1 - // } } else { return 0, false } @@ -181,8 +272,10 @@ func (s *FormatState) scanNum() (int, bool) { return 0, false } -// parseIndex scans an index expression. It returns false if there is a syntax error. -func (s *FormatState) parseIndex() error { +// parseIndex parses an argument index of the form "[n]" that can appear +// in a printf directive (e.g., "%[2]d"). Returns an error if syntax is +// malformed or index is invalid. +func (s *FormatDirective) parseIndex() error { if s.nbytes == len(s.Format) || s.Format[s.nbytes] != '[' { return nil } @@ -216,8 +309,18 @@ func (s *FormatState) parseIndex() error { return nil } -// parseNum scans precision (or *). -func (s *FormatState) parseSize(kind sizeType) { +type sizeType int + +const ( + Width sizeType = iota + Precision +) + +// parseSize parses a width or precision specifier. It handles literal numeric +// values (e.g., "%3d"), asterisk values (e.g., "%*d"), or indexed asterisk +// values (e.g., "%[2]*d"). The kind parameter specifies whether it's parsing +// a Width or a Precision. +func (s *FormatDirective) parseSize(kind sizeType) { if s.nbytes < len(s.Format) && s.Format[s.nbytes] == '*' { s.nbytes++ if s.indexPending { @@ -244,7 +347,7 @@ func (s *FormatState) parseSize(kind sizeType) { panic(kind) } } else { - // A single '*', only Operand has a meaning. + // Non-indexed star: "%*d". size := &DirectiveSize{ Kind: Star, Size: -1, @@ -259,16 +362,15 @@ func (s *FormatState) parseSize(kind sizeType) { case Width: s.Width = size case Precision: - // Include the leading '.'. + // For precision, include the '.' in the range. size.Range.Start -= 1 s.Prec = size default: panic(kind) } } - s.argNums = append(s.argNums, s.argNum) s.argNum++ - } else { + } else { // Literal number, e.g. "%10d" start := s.nbytes if num, ok := s.scanNum(); ok { size := &DirectiveSize{ @@ -295,18 +397,12 @@ func (s *FormatState) parseSize(kind sizeType) { } } -type sizeType int - -const ( - Width sizeType = iota - Precision -) - -// parsePrecision scans for a precision. It returns false if there's a bad index expression. -func (s *FormatState) parsePrecision() error { +// parsePrecision checks if there's a precision specified after a '.' character. +// If found, it may also parse an index or a star. Returns an error if any index +// parsing fails. +func (s *FormatDirective) parsePrecision() error { // If there's a period, there may be a precision. if s.nbytes < len(s.Format) && s.Format[s.nbytes] == '.' { - // s.Flags = append(s.Flags, '.') // Treat precision as a flag. s.nbytes++ if err := s.parseIndex(); err != nil { return err @@ -315,124 +411,3 @@ func (s *FormatState) parsePrecision() error { } return nil } - -type formatDirective struct { - Verb DirectiveVerb - Range posRange - Format string // the full format directive from % through verb, "%.3d". - Flags []byte // the list of # + etc. - Width *DirectiveSize // format width: '3' for "%3d", if any. - Prec *DirectiveSize // format precision: '4' for "%.4d", if any. -} - -type SizeKind int - -const ( - Literal SizeKind = iota // %4d - Star // %*d - IndexedStar // %[2]*d -) - -type DirectiveSize struct { - Kind SizeKind - Range posRange - Size int // used if Kind == PrecLiteral, or -1 - Index int // used if Kind == PrecIndexedStar, or -1 - ArgNum int // used if Kind == PrecStar or PrecIndexedStar, otherwise -1 -} - -type DirectiveOperand struct { - Arg ast.Expr - Index int -} - -type DirectiveVerb struct { - Verb rune - Range posRange - Index int - ArgNum int // verb's corresponding operand, may be nil -} - -type posRange struct { - Start, End int -} - -// parsePrintfVerb looks the formatting directive that begins the format string -// and returns a formatState that encodes what the directive wants, without looking -// at the actual arguments present in the call. It returns the error description if parse fails. -func parsePrintfVerb(call *ast.CallExpr, format string, firstArg, argNum int) (*FormatState, error) { - state := &FormatState{ - Format: format, - Flags: make([]byte, 0, 5), - argNums: make([]int, 0, 1), - FirstArg: firstArg, - call: call, - argNum: argNum, - hasIndex: false, - index: 0, - indexPos: 0, - indexPending: false, - nbytes: 1, // There's guaranteed to be a percent sign. - } - // There may be flags. - state.parseFlags() - // There may be an index. - if err := state.parseIndex(); err != nil { - return nil, err - } - // There may be a width. - state.parseSize(Width) - // There may be a precision. - if err := state.parsePrecision(); err != nil { - return nil, err - } - // Now a verb, possibly prefixed by an index (which we may already have). - if !state.indexPending { - if err := state.parseIndex(); err != nil { - return nil, err - } - } - if state.nbytes == len(state.Format) { - return nil, fmt.Errorf("format %s is missing verb at end of string", state.Format) - } - verb, w := utf8.DecodeRuneInString(state.Format[state.nbytes:]) - - // Collect verb. - if state.indexPending { - state.Verb = &DirectiveVerb{ - Verb: verb, - Range: posRange{ - Start: state.indexPos, - End: state.nbytes + w, - }, - Index: state.index, - ArgNum: state.argNum, - } - } else { - state.Verb = &DirectiveVerb{ - Verb: verb, - Range: posRange{ - Start: state.nbytes, - End: state.nbytes + w, - }, - Index: -1, - ArgNum: state.argNum, - } - } - - // state.verb = verb - state.nbytes += w - if verb != '%' { - state.argNums = append(state.argNums, state.argNum) - } - state.Format = state.Format[:state.nbytes] - return state, nil -} - -func cond[T any](cond bool, t, f T) T { - if cond { - return t - } else { - return f - } -} From 12cf69ca349adb5214e3b7d561dce3a78bbccd2f Mon Sep 17 00:00:00 2001 From: xzb <2598514867@qq.com> Date: Tue, 17 Dec 2024 05:02:13 +0800 Subject: [PATCH 06/14] highlight --- go/analysis/passes/printf/printf.go | 64 ++-- gopls/internal/golang/highlight.go | 298 ++++-------------- .../testdata/highlight/highlight_printf.txt | 13 +- internal/fmtstr/parse.go | 33 +- 4 files changed, 114 insertions(+), 294 deletions(-) diff --git a/go/analysis/passes/printf/printf.go b/go/analysis/passes/printf/printf.go index 492ceb5d117..02f569a3e09 100644 --- a/go/analysis/passes/printf/printf.go +++ b/go/analysis/passes/printf/printf.go @@ -487,8 +487,7 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string } return } - // Check formats against args. - states, err := fmtstr.ParsePrintf(pass.TypesInfo, call) + directives, err := fmtstr.ParsePrintf(pass.TypesInfo, call) if err != nil { pass.ReportRangef(call.Fun, "%s %s", name, err.Error()) return @@ -496,16 +495,17 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string maxArgNum := firstArg anyIndex := false - for _, state := range states { - if (state.Prec != nil && state.Prec.Index != -1) || - (state.Width != nil && state.Width.Index != -1) || - (state.Verb != nil && state.Verb.Index != -1) { + // Check formats against args. + for _, directive := range directives { + if (directive.Prec != nil && directive.Prec.Index != -1) || + (directive.Width != nil && directive.Width.Index != -1) || + (directive.Verb != nil && directive.Verb.Index != -1) { anyIndex = true } - if !okPrintfArg(pass, call, &maxArgNum, name, state) { // One error per format is enough. + if !okPrintfArg(pass, call, &maxArgNum, name, directive) { // One error per format is enough. return } - if state.Verb.Verb == 'w' { + if directive.Verb.Verb == 'w' { switch kind { case KindNone, KindPrint, KindPrintf: pass.Reportf(call.Pos(), "%s does not support error-wrapping directive %%w", name) @@ -592,8 +592,8 @@ var printVerbs = []printVerb{ // okPrintfArg compares the FormatDirective to the arguments actually present, // reporting any discrepancies it can discern. If the final argument is ellipsissed, // there's little it can do for that. -func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgNum *int, name string, state *fmtstr.FormatDirective) (ok bool) { - verb := state.Verb.Verb +func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgNum *int, name string, directive *fmtstr.FormatDirective) (ok bool) { + verb := directive.Verb.Verb var v printVerb found := false // Linear scan is fast enough for a small list. @@ -607,42 +607,42 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgNum *int, name s // Could verb's arg implement fmt.Formatter? // Skip check for the %w verb, which requires an error. formatter := false - if v.typ != argError && state.Verb.ArgNum < len(call.Args) { - if tv, ok := pass.TypesInfo.Types[call.Args[state.Verb.ArgNum]]; ok { + if v.typ != argError && directive.Verb.ArgNum < len(call.Args) { + if tv, ok := pass.TypesInfo.Types[call.Args[directive.Verb.ArgNum]]; ok { formatter = isFormatter(tv.Type) } } if !formatter { if !found { - pass.ReportRangef(call, "%s format %s has unknown verb %c", name, state.Format, verb) + pass.ReportRangef(call, "%s format %s has unknown verb %c", name, directive.Format, verb) return false } - for _, flag := range state.Flags { + for _, flag := range directive.Flags { // TODO: Disable complaint about '0' for Go 1.10. To be fixed properly in 1.11. // See issues 23598 and 23605. if flag == '0' { continue } if !strings.ContainsRune(v.flags, rune(flag)) { - pass.ReportRangef(call, "%s format %s has unrecognized flag %c", name, state.Format, flag) + pass.ReportRangef(call, "%s format %s has unrecognized flag %c", name, directive.Format, flag) return false } } } var argNums []int - if state.Width != nil && state.Width.ArgNum != -1 { - argNums = append(argNums, state.Width.ArgNum) + if directive.Width != nil && directive.Width.ArgNum != -1 { + argNums = append(argNums, directive.Width.ArgNum) } - if state.Prec != nil && state.Prec.ArgNum != -1 { - argNums = append(argNums, state.Prec.ArgNum) + if directive.Prec != nil && directive.Prec.ArgNum != -1 { + argNums = append(argNums, directive.Prec.ArgNum) } // Verb is good. If len(argNums)>0, we have something like %.*s and all // args in argNums must be an integer. for i := 0; i < len(argNums); i++ { argNum := argNums[i] - if !argCanBeChecked(pass, call, argNums[i], state, name) { + if !argCanBeChecked(pass, call, argNums[i], directive, name) { return } arg := call.Args[argNum] @@ -651,14 +651,14 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgNum *int, name s if reason != "" { details = " (" + reason + ")" } - pass.ReportRangef(call, "%s format %s uses non-int %s%s as argument of *", name, state.Format, analysisutil.Format(pass.Fset, arg), details) + pass.ReportRangef(call, "%s format %s uses non-int %s%s as argument of *", name, directive.Format, analysisutil.Format(pass.Fset, arg), details) return false } } - // Collect to conveniently update maxArgNum. - if state.Verb != nil && state.Verb.ArgNum != -1 && verb != '%' { - argNums = append(argNums, state.Verb.ArgNum) + // Collect to update maxArgNum in one loop. + if directive.Verb != nil && directive.Verb.ArgNum != -1 && verb != '%' { + argNums = append(argNums, directive.Verb.ArgNum) } for _, n := range argNums { if n >= *maxArgNum { @@ -672,12 +672,12 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgNum *int, name s // Now check verb's type. argNum := argNums[len(argNums)-1] - if !argCanBeChecked(pass, call, argNums[len(argNums)-1], state, name) { + if !argCanBeChecked(pass, call, argNums[len(argNums)-1], directive, name) { return false } arg := call.Args[argNum] if isFunctionValue(pass, arg) && verb != 'p' && verb != 'T' { - pass.ReportRangef(call, "%s format %s arg %s is a func value, not called", name, state.Format, analysisutil.Format(pass.Fset, arg)) + pass.ReportRangef(call, "%s format %s arg %s is a func value, not called", name, directive.Format, analysisutil.Format(pass.Fset, arg)) return false } if reason, ok := matchArgType(pass, v.typ, arg); !ok { @@ -689,12 +689,12 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgNum *int, name s if reason != "" { details = " (" + reason + ")" } - pass.ReportRangef(call, "%s format %s has arg %s of wrong type %s%s", name, state.Format, analysisutil.Format(pass.Fset, arg), typeString, details) + pass.ReportRangef(call, "%s format %s has arg %s of wrong type %s%s", name, directive.Format, analysisutil.Format(pass.Fset, arg), typeString, details) return false } - if v.typ&argString != 0 && v.verb != 'T' && !bytes.Contains(state.Flags, []byte{'#'}) { + if v.typ&argString != 0 && v.verb != 'T' && !bytes.Contains(directive.Flags, []byte{'#'}) { if methodName, ok := recursiveStringer(pass, arg); ok { - pass.ReportRangef(call, "%s format %s with arg %s causes recursive %s method call", name, state.Format, analysisutil.Format(pass.Fset, arg), methodName) + pass.ReportRangef(call, "%s format %s with arg %s causes recursive %s method call", name, directive.Format, analysisutil.Format(pass.Fset, arg), methodName) return false } } @@ -778,7 +778,7 @@ func isFunctionValue(pass *analysis.Pass, e ast.Expr) bool { // argCanBeChecked reports whether the specified argument is statically present; // it may be beyond the list of arguments or in a terminal slice... argument, which // means we can't see it. -func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, argNum int, state *fmtstr.FormatDirective, name string) bool { +func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, argNum int, directive *fmtstr.FormatDirective, name string) bool { if argNum <= 0 { // Shouldn't happen, so catch it with prejudice. panic("negative arg num") @@ -794,8 +794,8 @@ func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, argNum int, state } // There are bad indexes in the format or there are fewer arguments than the format needs. // This is the argument number relative to the format: Printf("%s", "hi") will give 1 for the "hi". - arg := argNum - state.FirstArg + 1 // People think of arguments as 1-indexed. - pass.ReportRangef(call, "%s format %s reads arg #%d, but call has %v", name, state.Format, arg, count(len(call.Args)-state.FirstArg, "arg")) + arg := argNum - directive.FirstArg + 1 // People think of arguments as 1-indexed. + pass.ReportRangef(call, "%s format %s reads arg #%d, but call has %v", name, directive.Format, arg, count(len(call.Args)-directive.FirstArg, "arg")) return false } diff --git a/gopls/internal/golang/highlight.go b/gopls/internal/golang/highlight.go index bb6773c5074..3aa875a7c4a 100644 --- a/gopls/internal/golang/highlight.go +++ b/gopls/internal/golang/highlight.go @@ -16,8 +16,8 @@ import ( "golang.org/x/tools/gopls/internal/cache" "golang.org/x/tools/gopls/internal/file" "golang.org/x/tools/gopls/internal/protocol" - gastutil "golang.org/x/tools/gopls/internal/util/astutil" "golang.org/x/tools/internal/event" + "golang.org/x/tools/internal/fmtstr" ) func Highlight(ctx context.Context, snapshot *cache.Snapshot, fh file.Handle, position protocol.Position) ([]protocol.DocumentHighlight, error) { @@ -73,18 +73,21 @@ func Highlight(ctx context.Context, snapshot *cache.Snapshot, fh file.Handle, po // which should be the result of astutil.PathEnclosingInterval. func highlightPath(path []ast.Node, file *ast.File, info *types.Info, pos token.Pos) (map[posRange]protocol.DocumentHighlightKind, error) { result := make(map[posRange]protocol.DocumentHighlightKind) - // Inside a printf-style call? + + // Inside a printf-style call, printf("...%v...", arg)? + // Treat each corresponding ("%v", arg) pair as a highlight class. for _, node := range path { if call, ok := node.(*ast.CallExpr); ok { - for _, args := range call.Args { - // Only try when pos is in right side of the format String. - if basicList, ok := args.(*ast.BasicLit); ok && basicList.Pos() < pos && - basicList.Kind == token.STRING && strings.Contains(basicList.Value, "%") { - highlightPrintf(basicList, call, pos, result) + idx := fmtstr.FormatStringIndex(info, call) + if idx >= 0 && idx < len(call.Args) { + format, ok := fmtstr.StringConstantExpr(info, call.Args[idx]) + if ok && strings.Contains(format, "%") { + highlightPrintf(info, call, call.Args[idx].Pos(), pos, result) } } } } + switch node := path[0].(type) { case *ast.BasicLit: // Import path string literal? @@ -145,259 +148,74 @@ func highlightPath(path []ast.Node, file *ast.File, info *types.Info, pos token. return result, nil } -// highlightPrintf identifies and highlights the relationships between placeholders -// in a format string and their corresponding variadic arguments in a printf-style -// function call. -// +// highlightPrintf highlights directives in a format string and their corresponding +// variadic arguments in a printf-style function call. // For example: // // fmt.Printf("Hello %s, you scored %d", name, score) // // If the cursor is on %s or name, highlightPrintf will highlight %s as a write operation, // and name as a read operation. -func highlightPrintf(directive *ast.BasicLit, call *ast.CallExpr, pos token.Pos, result map[posRange]protocol.DocumentHighlightKind) { - // Two '%'s are interpreted as one '%'(escaped), let's replace them with spaces. - format := strings.Replace(directive.Value, "%%", " ", -1) - if strings.Contains(directive.Value, "%[") || - strings.Contains(directive.Value, "%p") || - strings.Contains(directive.Value, "%T") { - // parsef can not handle these cases. - return - } - expectedVariadicArgs := make([]ast.Expr, strings.Count(format, "%")) - firstVariadic := -1 - for i, arg := range call.Args { - if directive == arg { - firstVariadic = i + 1 - argsLen := len(call.Args) - i - 1 - if argsLen > len(expectedVariadicArgs) { - // Translate from Printf(a0,"%d %d",5, 6, 7) to [5, 6] - copy(expectedVariadicArgs, call.Args[firstVariadic:firstVariadic+len(expectedVariadicArgs)]) - } else { - // Translate from Printf(a0,"%d %d %s",5, 6) to [5, 6, nil] - copy(expectedVariadicArgs[:argsLen], call.Args[firstVariadic:]) - } - break - } - } - formatItems, err := parsef(format, directive.Pos(), expectedVariadicArgs...) +func highlightPrintf(info *types.Info, call *ast.CallExpr, formatPos token.Pos, cursorPos token.Pos, result map[posRange]protocol.DocumentHighlightKind) { + directives, err := fmtstr.ParsePrintf(info, call) if err != nil { return } - var percent formatPercent - // Cursor in argument. - if pos > directive.End() { - var curVariadic int - // Which variadic argument cursor sits inside. - for i := firstVariadic; i < len(call.Args); i++ { - if gastutil.NodeContains(call.Args[i], pos) { - // Offset relative to formatItems. - curVariadic = i - firstVariadic - break - } - } - index := -1 - for _, item := range formatItems { - switch item := item.(type) { - case formatPercent: - percent = item - index++ - case formatVerb: - if token.Pos(percent).IsValid() { - if index == curVariadic { - // Placeholders behave like writting values from arguments to themselves, - // so highlight them with Write semantic. - highlightRange(result, token.Pos(percent), item.rang.end, protocol.Write) - highlightRange(result, item.operand.Pos(), item.operand.End(), protocol.Read) - return - } - percent = formatPercent(token.NoPos) - } - } + + highlight := func(start, end token.Pos, argNum int) bool { + var ( + rangeStart = formatPos + token.Pos(start) + 1 // add offset for leading '"' + rangeEnd = formatPos + token.Pos(end) + 1 // add offset for leading '"' + arg ast.Expr // may not exist + ) + if len(call.Args) > argNum { + arg = call.Args[argNum] } - } else { - // Cursor in format string. - for _, item := range formatItems { - switch item := item.(type) { - case formatPercent: - percent = item - case formatVerb: - if token.Pos(percent).IsValid() { - if token.Pos(percent) <= pos && pos <= item.rang.end { - highlightRange(result, token.Pos(percent), item.rang.end, protocol.Write) - if item.operand != nil { - highlightRange(result, item.operand.Pos(), item.operand.End(), protocol.Read) - } - return - } - percent = formatPercent(token.NoPos) - } + + // Highlight the directive and its potential argument if the cursor is within etheir range. + if (cursorPos >= rangeStart && cursorPos < rangeEnd) || (arg != nil && cursorPos >= arg.Pos() && cursorPos < arg.End()) { + highlightRange(result, rangeStart, rangeEnd, protocol.Write) + if arg != nil { + highlightRange(result, arg.Pos(), arg.End(), protocol.Read) } + return true } + return false } -} - -// Below are formatting directives definitions. -type formatPercent token.Pos -type formatLiteral struct { - literal string - rang posRange -} -type formatFlags struct { - flag string - rang posRange -} -type formatWidth struct { - width int - rang posRange -} -type formatPrec struct { - prec int - rang posRange -} -type formatVerb struct { - verb rune - rang posRange - operand ast.Expr // verb's corresponding operand, may be nil -} - -type formatItem interface { - formatItem() -} -func (formatPercent) formatItem() {} -func (formatLiteral) formatItem() {} -func (formatVerb) formatItem() {} -func (formatWidth) formatItem() {} -func (formatFlags) formatItem() {} -func (formatPrec) formatItem() {} - -type formatFunc func(fmt.State, rune) - -var _ fmt.Formatter = formatFunc(nil) + // If width or prec has any *, we can not highlight the full range from % to verb, + // because it will overlap with the sub-range of *, for example: + // + // fmt.Printf("%*[3]d", 4, 5, 6) + // ^ ^ we can only highlight this range when cursor in 6. '*' as a one-rune range will + // highlight for 4. + anyAsterisk := false + for _, directive := range directives { + width, prec, verb := directive.Width, directive.Prec, directive.Verb + if (prec != nil && prec.Kind != fmtstr.Literal) || + (width != nil && width.Kind != fmtstr.Literal) { + anyAsterisk = true + } -func (f formatFunc) Format(st fmt.State, verb rune) { f(st, verb) } + // Try highlight Width. + if width != nil && width.ArgNum != -1 && highlight(token.Pos(width.Range.Start), token.Pos(width.Range.End), width.ArgNum) { + return + } -// parsef parses a printf-style format string into its constituent components together with -// their position in the source code, including [formatLiteral], formatting directives -// [formatFlags], [formatPrecision], [formatWidth], [formatPrecision], [formatVerb], and its operand. -// -// If format contains explicit argument indexes, eg. fmt.Sprintf("%[2]d %[1]d\n", 11, 22), -// the returned range will not be correct. -// If an invalid argument is given for a verb, such as providing a string to %d, the returned error will -// contain a description of the problem. -func parsef(format string, pos token.Pos, args ...ast.Expr) ([]formatItem, error) { - const sep = "__GOPLS_SEP__" - // A conversion represents a single % operation and its operand. - type conversion struct { - verb rune - width int // or -1 - prec int // or -1 - flag string // some of "-+# 0" - operand ast.Expr - } - var convs []conversion - wrappers := make([]any, len(args)) - for i, operand := range args { - wrappers[i] = formatFunc(func(st fmt.State, verb rune) { - st.Write([]byte(sep)) - width, ok := st.Width() - if !ok { - width = -1 - } - prec, ok := st.Precision() - if !ok { - prec = -1 - } - flag := "" - for _, b := range "-+# 0" { - if st.Flag(int(b)) { - flag += string(b) - } - } - convs = append(convs, conversion{ - verb: verb, - width: width, - prec: prec, - flag: flag, - operand: operand, - }) - }) - } + // Try highlight Prec. + if prec != nil && prec.ArgNum != -1 && highlight(token.Pos(prec.Range.Start), token.Pos(prec.Range.End), prec.ArgNum) { + return + } - // Interleave the literals and the conversions. - var formatItems []formatItem - s := fmt.Sprintf(format, wrappers...) - // All errors begin with the string "%!". - if strings.Contains(s, "%!") { - return nil, fmt.Errorf("%s", strings.Replace(s, sep, "", -1)) - } - for i, word := range strings.Split(s, sep) { - if word != "" { - formatItems = append(formatItems, formatLiteral{ - literal: word, - rang: posRange{ - start: pos, - end: pos + token.Pos(len(word)), - }, - }) - pos = pos + token.Pos(len(word)) - } - if i < len(convs) { - conv := convs[i] - // Collect %. - formatItems = append(formatItems, formatPercent(pos)) - pos += 1 - // Collect flags. - if flag := conv.flag; flag != "" { - length := token.Pos(len(conv.flag)) - formatItems = append(formatItems, formatFlags{ - flag: flag, - rang: posRange{ - start: pos, - end: pos + length, - }, - }) - pos += length - } - // Collect width. - if width := conv.width; conv.width != -1 { - length := token.Pos(len(fmt.Sprintf("%d", conv.width))) - formatItems = append(formatItems, formatWidth{ - width: width, - rang: posRange{ - start: pos, - end: pos + length, - }, - }) - pos += length - } - // Collect precision, which starts with a dot. - if prec := conv.prec; conv.prec != -1 { - length := token.Pos(len(fmt.Sprintf("%d", conv.prec))) + 1 - formatItems = append(formatItems, formatPrec{ - prec: prec, - rang: posRange{ - start: pos, - end: pos + length, - }, - }) - pos += length + // Try highlight Verb. + if verb.Verb != '%' { + if anyAsterisk && highlight(token.Pos(verb.Range.Start), token.Pos(verb.Range.End), verb.ArgNum) { + return + } else if highlight(token.Pos(directive.Range.Start), token.Pos(directive.Range.End), verb.ArgNum) { + return } - // Collect verb, which must be present. - length := token.Pos(len(string(conv.verb))) - formatItems = append(formatItems, formatVerb{ - verb: conv.verb, - rang: posRange{ - start: pos, - end: pos + length, - }, - operand: conv.operand, - }) - pos += length } } - return formatItems, nil } type posRange struct { diff --git a/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt b/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt index ea0011be205..e954ef4facb 100644 --- a/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt +++ b/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt @@ -29,12 +29,13 @@ func TooManyDirectives() { fmt.Printf("Hello %s, you have %d new %s %q messages!", "Alice", 5) //@hiloc(toomanyd, "%d", write),hiloc(toomanyargs1, "5", read),highlightall(toomanyd, toomanyargs1) } -func SpecialChars() { - fmt.Printf("Hello \n %s, you \t \n have %d new messages!", "Alice", 5) //@hiloc(specials, "%s", write),hiloc(specialargs0, "\"Alice\"", read),highlightall(specials, specialargs0) - fmt.Printf("Hello \n %s, you \t \n have %d new messages!", "Alice", 5) //@hiloc(speciald, "%d", write),hiloc(specialargs1, "5", read),highlightall(speciald, specialargs1) +func VerbIsPercentage() { + fmt.Printf("%4.2% %d", 6) //@hiloc(z1, "%d", write),hiloc(z2, "6", read),highlightall(z1, z2) } -func Escaped() { - fmt.Printf("Hello %% \n %s, you \t%% \n have %d new m%%essages!", "Alice", 5) //@hiloc(escapeds, "%s", write),hiloc(escapedargs0, "\"Alice\"", read),highlightall(escapeds, escapedargs0) - fmt.Printf("Hello %% \n %s, you \t%% \n have %d new m%%essages!", "Alice", 5) //@hiloc(escapedd, "%s", write),hiloc(escapedargs1, "\"Alice\"", read),highlightall(escapedd, escapedargs1) +func Indexed() { + fmt.Printf("%[1]d", 3) //@hiloc(i1, "%[1]d", write),hiloc(i2, "3", read),highlightall(i1, i2) + fmt.Printf("%[1]*d", 3, 6) //@hiloc(i3, "[1]*", write),hiloc(i4, "3", read),hiloc(i5, "d", write),hiloc(i6, "6", read),highlightall(i3, i4),highlightall(i5, i6) + fmt.Printf("%[2]*[1]d", 3, 4) //@hiloc(i7, "[2]*", write),hiloc(i8, "4", read),hiloc(i9, "[1]d", write),hiloc(i10, "3", read),highlightall(i7, i8),highlightall(i9, i10) + fmt.Printf("%[2]*.[1]*[3]d", 4, 5, 6) //@hiloc(i11, "[2]*", write),hiloc(i12, "5", read),hiloc(i13, ".[1]*", write),hiloc(i14, "4", read),hiloc(i15, "[3]d", write),hiloc(i16, "6", read),highlightall(i11, i12),highlightall(i13, i14),highlightall(i15, i16) } diff --git a/internal/fmtstr/parse.go b/internal/fmtstr/parse.go index 92c46423c02..c24cd7eec46 100644 --- a/internal/fmtstr/parse.go +++ b/internal/fmtstr/parse.go @@ -51,11 +51,11 @@ func ParsePrintf(info *types.Info, call *ast.CallExpr) ([]*FormatDirective, erro return nil, err } - state.addRange(i) + state.addOffset(i) states = append(states, state) w = len(state.Format) - // Do not waste an augument for '%'. + // Do not waste an argument for '%'. if state.Verb.Verb != '%' { argNum = state.argNum + 1 } @@ -68,7 +68,7 @@ func ParsePrintf(info *types.Info, call *ast.CallExpr) ([]*FormatDirective, erro // if the directive is malformed. The firstArg and argNum parameters help determine how // arguments map to this directive. // -// Parse sequence: '%' -> flags? -> index? -> width(*)? -> '.'? -> index? -> precision(*)? -> index? -> verb. +// Parse sequence: '%' -> flags -> {[N]* or width} -> .{[N]* or precision} -> [N] -> verb. func parsePrintfVerb(call *ast.CallExpr, format string, firstArg, argNum int) (*FormatDirective, error) { state := &FormatDirective{ Format: format, @@ -190,23 +190,22 @@ type FormatDirective struct { nbytes int } -// Type of size specifier encountered for width or precision. type SizeKind int const ( - Literal SizeKind = iota // A literal number, e.g. "4" in "%4d" - Star // A dynamic size from an argument, e.g. "%*d" - IndexedStar // A dynamic size with an explicit index, e.g. "%[2]*d" + Literal SizeKind = iota // A literal number, e.g. "4" in "%4d" + Asterisk // A dynamic size from an argument, e.g. "%*d" + IndexedAsterisk // A dynamic size with an explicit index, e.g. "%[2]*d" ) // DirectiveSize describes a width or precision in a format directive. -// Depending on Kind, it may represent a literal number, a star, or an indexed star. +// Depending on Kind, it may represent a literal number, a asterisk, or an indexed asterisk. type DirectiveSize struct { Kind SizeKind // Type of size specifier Range posRange // Position of the size specifier within the directive Size int // The literal size if Kind == Literal, otherwise -1 - Index int // If Kind == IndexedStar, the argument index used to obtain the size - ArgNum int // The argument position if Kind == Star or IndexedStar, relative to CallExpr. + Index int // If Kind == IndexedAsterisk, the argument index used to obtain the size + ArgNum int // The argument position if Kind == Asterisk or IndexedAsterisk, relative to CallExpr. } // DirectiveVerb represents the verb character of a format directive (e.g., 'd', 's', 'f'). @@ -222,9 +221,9 @@ type posRange struct { Start, End int } -// addRange adjusts the recorded positions in Verb, Width, Prec, and the +// addOffset adjusts the recorded positions in Verb, Width, Prec, and the // directive's overall Range to be relative to the position in the full format string. -func (s *FormatDirective) addRange(parsedLen int) { +func (s *FormatDirective) addOffset(parsedLen int) { if s.Verb != nil { s.Verb.Range.Start += parsedLen s.Verb.Range.End += parsedLen @@ -287,6 +286,7 @@ func (s *FormatDirective) parseIndex() error { s.index = num s.indexPos = start - 1 } + ok := true if s.nbytes == len(s.Format) || s.nbytes == start || s.Format[s.nbytes] != ']' { ok = false // syntax error is either missing "]" or invalid index. @@ -300,6 +300,7 @@ func (s *FormatDirective) parseIndex() error { if err != nil || !ok || arg32 <= 0 || arg32 > int64(len(s.call.Args)-s.FirstArg) { return fmt.Errorf("format has invalid argument index [%s]", s.Format[start:s.nbytes]) } + s.nbytes++ // skip ']' arg := int(arg32) arg += s.FirstArg - 1 // We want to zero-index the actual arguments. @@ -327,7 +328,7 @@ func (s *FormatDirective) parseSize(kind sizeType) { // Absorb it. s.indexPending = false size := &DirectiveSize{ - Kind: IndexedStar, + Kind: IndexedAsterisk, Size: -1, Range: posRange{ Start: s.indexPos, @@ -347,9 +348,9 @@ func (s *FormatDirective) parseSize(kind sizeType) { panic(kind) } } else { - // Non-indexed star: "%*d". + // Non-indexed asterisk: "%*d". size := &DirectiveSize{ - Kind: Star, + Kind: Asterisk, Size: -1, Range: posRange{ Start: s.nbytes - 1, @@ -398,7 +399,7 @@ func (s *FormatDirective) parseSize(kind sizeType) { } // parsePrecision checks if there's a precision specified after a '.' character. -// If found, it may also parse an index or a star. Returns an error if any index +// If found, it may also parse an index or an asterisk. Returns an error if any index // parsing fails. func (s *FormatDirective) parsePrecision() error { // If there's a period, there may be a precision. From f96cc985893610e46a634c1675429810c3cb7ba6 Mon Sep 17 00:00:00 2001 From: xzb <2598514867@qq.com> Date: Tue, 17 Dec 2024 05:22:47 +0800 Subject: [PATCH 07/14] resolve comment --- go/analysis/passes/printf/printf.go | 76 ++++---- gopls/internal/golang/highlight.go | 39 ++-- .../testdata/highlight/highlight_printf.txt | 5 + internal/fmtstr/parse.go | 184 +++++++++--------- 4 files changed, 156 insertions(+), 148 deletions(-) diff --git a/go/analysis/passes/printf/printf.go b/go/analysis/passes/printf/printf.go index 02f569a3e09..c28e185e3f1 100644 --- a/go/analysis/passes/printf/printf.go +++ b/go/analysis/passes/printf/printf.go @@ -493,16 +493,16 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string return } - maxArgNum := firstArg + maxArgIndex := firstArg anyIndex := false // Check formats against args. for _, directive := range directives { if (directive.Prec != nil && directive.Prec.Index != -1) || (directive.Width != nil && directive.Width.Index != -1) || - (directive.Verb != nil && directive.Verb.Index != -1) { + (directive.Verb.Index != -1) { anyIndex = true } - if !okPrintfArg(pass, call, &maxArgNum, name, directive) { // One error per format is enough. + if !okPrintfArg(pass, call, &maxArgIndex, firstArg, name, directive) { // One error per format is enough. return } if directive.Verb.Verb == 'w' { @@ -514,7 +514,7 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string } } // Dotdotdot is hard. - if call.Ellipsis.IsValid() && maxArgNum >= len(call.Args)-1 { + if call.Ellipsis.IsValid() && maxArgIndex >= len(call.Args)-1 { return } // If any formats are indexed, extra arguments are ignored. @@ -522,8 +522,8 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string return } // There should be no leftover arguments. - if maxArgNum != len(call.Args) { - expect := maxArgNum - firstArg + if maxArgIndex != len(call.Args) { + expect := maxArgIndex - firstArg numArgs := len(call.Args) - firstArg pass.ReportRangef(call, "%s call needs %v but has %v", name, count(expect, "arg"), count(numArgs, "arg")) } @@ -592,7 +592,7 @@ var printVerbs = []printVerb{ // okPrintfArg compares the FormatDirective to the arguments actually present, // reporting any discrepancies it can discern. If the final argument is ellipsissed, // there's little it can do for that. -func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgNum *int, name string, directive *fmtstr.FormatDirective) (ok bool) { +func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firstArg int, name string, directive *fmtstr.FormatDirective) (ok bool) { verb := directive.Verb.Verb var v printVerb found := false @@ -607,8 +607,8 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgNum *int, name s // Could verb's arg implement fmt.Formatter? // Skip check for the %w verb, which requires an error. formatter := false - if v.typ != argError && directive.Verb.ArgNum < len(call.Args) { - if tv, ok := pass.TypesInfo.Types[call.Args[directive.Verb.ArgNum]]; ok { + if v.typ != argError && directive.Verb.ArgIndex < len(call.Args) { + if tv, ok := pass.TypesInfo.Types[call.Args[directive.Verb.ArgIndex]]; ok { formatter = isFormatter(tv.Type) } } @@ -630,22 +630,23 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgNum *int, name s } } } - var argNums []int - if directive.Width != nil && directive.Width.ArgNum != -1 { - argNums = append(argNums, directive.Width.ArgNum) + + var argIndexes []int + // First check for *. + if directive.Width != nil && directive.Width.ArgIndex != -1 { + argIndexes = append(argIndexes, directive.Width.ArgIndex) } - if directive.Prec != nil && directive.Prec.ArgNum != -1 { - argNums = append(argNums, directive.Prec.ArgNum) + if directive.Prec != nil && directive.Prec.ArgIndex != -1 { + argIndexes = append(argIndexes, directive.Prec.ArgIndex) } - - // Verb is good. If len(argNums)>0, we have something like %.*s and all - // args in argNums must be an integer. - for i := 0; i < len(argNums); i++ { - argNum := argNums[i] - if !argCanBeChecked(pass, call, argNums[i], directive, name) { + // If len(argIndexes)>0, we have something like %.*s and all + // indexes in argIndexes must be an integer. + for i := 0; i < len(argIndexes); i++ { + argIndex := argIndexes[i] + if !argCanBeChecked(pass, call, argIndex, firstArg, directive, name) { return } - arg := call.Args[argNum] + arg := call.Args[argIndex] if reason, ok := matchArgType(pass, argInt, arg); !ok { details := "" if reason != "" { @@ -657,25 +658,28 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgNum *int, name s } // Collect to update maxArgNum in one loop. - if directive.Verb != nil && directive.Verb.ArgNum != -1 && verb != '%' { - argNums = append(argNums, directive.Verb.ArgNum) + if directive.Verb.ArgIndex != -1 && verb != '%' { + argIndexes = append(argIndexes, directive.Verb.ArgIndex) } - for _, n := range argNums { - if n >= *maxArgNum { - *maxArgNum = n + 1 + for _, index := range argIndexes { + if index >= *maxArgIndex { + *maxArgIndex = index + 1 } } + // Special case for '%', go will print "fmt.Printf("%10.2%%dhello", 4)" + // as "%4hello", discard any runes between the two '%'s, and treat the verb '%' + // as an ordinary rune, so early return to skip the type check. if verb == '%' || formatter { return true } // Now check verb's type. - argNum := argNums[len(argNums)-1] - if !argCanBeChecked(pass, call, argNums[len(argNums)-1], directive, name) { + verbArgIndex := directive.Verb.ArgIndex + if !argCanBeChecked(pass, call, verbArgIndex, firstArg, directive, name) { return false } - arg := call.Args[argNum] + arg := call.Args[verbArgIndex] if isFunctionValue(pass, arg) && verb != 'p' && verb != 'T' { pass.ReportRangef(call, "%s format %s arg %s is a func value, not called", name, directive.Format, analysisutil.Format(pass.Fset, arg)) return false @@ -778,24 +782,24 @@ func isFunctionValue(pass *analysis.Pass, e ast.Expr) bool { // argCanBeChecked reports whether the specified argument is statically present; // it may be beyond the list of arguments or in a terminal slice... argument, which // means we can't see it. -func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, argNum int, directive *fmtstr.FormatDirective, name string) bool { - if argNum <= 0 { +func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, argIndex, firstArg int, directive *fmtstr.FormatDirective, name string) bool { + if argIndex <= 0 { // Shouldn't happen, so catch it with prejudice. - panic("negative arg num") + panic("negative argIndex") } - if argNum < len(call.Args)-1 { + if argIndex < len(call.Args)-1 { return true // Always OK. } if call.Ellipsis.IsValid() { return false // We just can't tell; there could be many more arguments. } - if argNum < len(call.Args) { + if argIndex < len(call.Args) { return true } // There are bad indexes in the format or there are fewer arguments than the format needs. // This is the argument number relative to the format: Printf("%s", "hi") will give 1 for the "hi". - arg := argNum - directive.FirstArg + 1 // People think of arguments as 1-indexed. - pass.ReportRangef(call, "%s format %s reads arg #%d, but call has %v", name, directive.Format, arg, count(len(call.Args)-directive.FirstArg, "arg")) + arg := argIndex - firstArg + 1 // People think of arguments as 1-indexed. + pass.ReportRangef(call, "%s format %s reads arg #%d, but call has %v", name, directive.Format, arg, count(len(call.Args)-firstArg, "arg")) return false } diff --git a/gopls/internal/golang/highlight.go b/gopls/internal/golang/highlight.go index 3aa875a7c4a..8330df4a5ec 100644 --- a/gopls/internal/golang/highlight.go +++ b/gopls/internal/golang/highlight.go @@ -51,7 +51,7 @@ func Highlight(ctx context.Context, snapshot *cache.Snapshot, fh file.Handle, po } } } - result, err := highlightPath(path, pgf.File, pkg.TypesInfo(), pos) + result, err := highlightPath(pkg.TypesInfo(), path, pos) if err != nil { return nil, err } @@ -71,7 +71,7 @@ func Highlight(ctx context.Context, snapshot *cache.Snapshot, fh file.Handle, po // highlightPath returns ranges to highlight for the given enclosing path, // which should be the result of astutil.PathEnclosingInterval. -func highlightPath(path []ast.Node, file *ast.File, info *types.Info, pos token.Pos) (map[posRange]protocol.DocumentHighlightKind, error) { +func highlightPath(info *types.Info, path []ast.Node, pos token.Pos) (map[posRange]protocol.DocumentHighlightKind, error) { result := make(map[posRange]protocol.DocumentHighlightKind) // Inside a printf-style call, printf("...%v...", arg)? @@ -88,6 +88,7 @@ func highlightPath(path []ast.Node, file *ast.File, info *types.Info, pos token. } } + file := path[len(path)-1].(*ast.File) switch node := path[0].(type) { case *ast.BasicLit: // Import path string literal? @@ -162,17 +163,17 @@ func highlightPrintf(info *types.Info, call *ast.CallExpr, formatPos token.Pos, return } - highlight := func(start, end token.Pos, argNum int) bool { + // highlightPair highlights the directive and its potential argument pair if the cursor is within either range. + highlightPair := func(start, end token.Pos, argIndex int) bool { var ( rangeStart = formatPos + token.Pos(start) + 1 // add offset for leading '"' rangeEnd = formatPos + token.Pos(end) + 1 // add offset for leading '"' arg ast.Expr // may not exist ) - if len(call.Args) > argNum { - arg = call.Args[argNum] + if len(call.Args) > argIndex { + arg = call.Args[argIndex] } - // Highlight the directive and its potential argument if the cursor is within etheir range. if (cursorPos >= rangeStart && cursorPos < rangeEnd) || (arg != nil && cursorPos >= arg.Pos() && cursorPos < arg.End()) { highlightRange(result, rangeStart, rangeEnd, protocol.Write) if arg != nil { @@ -192,26 +193,28 @@ func highlightPrintf(info *types.Info, call *ast.CallExpr, formatPos token.Pos, anyAsterisk := false for _, directive := range directives { width, prec, verb := directive.Width, directive.Prec, directive.Verb - if (prec != nil && prec.Kind != fmtstr.Literal) || - (width != nil && width.Kind != fmtstr.Literal) { + // Try highlight Width if there is a *. + if width != nil && width.ArgIndex != -1 { anyAsterisk = true + if highlightPair(token.Pos(width.Range.Start), token.Pos(width.Range.End), width.ArgIndex) { + return + } } - // Try highlight Width. - if width != nil && width.ArgNum != -1 && highlight(token.Pos(width.Range.Start), token.Pos(width.Range.End), width.ArgNum) { - return - } - - // Try highlight Prec. - if prec != nil && prec.ArgNum != -1 && highlight(token.Pos(prec.Range.Start), token.Pos(prec.Range.End), prec.ArgNum) { - return + // Try highlight Precision if there is a *. + if prec != nil && prec.ArgIndex != -1 { + anyAsterisk = true + if highlightPair(token.Pos(prec.Range.Start), token.Pos(prec.Range.End), prec.ArgIndex) { + return + } } // Try highlight Verb. if verb.Verb != '%' { - if anyAsterisk && highlight(token.Pos(verb.Range.Start), token.Pos(verb.Range.End), verb.ArgNum) { + // If any * is found inside directive, narrow the highlight range. + if anyAsterisk && highlightPair(token.Pos(verb.Range.Start), token.Pos(verb.Range.End), verb.ArgIndex) { return - } else if highlight(token.Pos(directive.Range.Start), token.Pos(directive.Range.End), verb.ArgNum) { + } else if highlightPair(token.Pos(directive.Range.Start), token.Pos(directive.Range.End), verb.ArgIndex) { return } } diff --git a/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt b/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt index e954ef4facb..b014be68cb2 100644 --- a/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt +++ b/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt @@ -33,6 +33,11 @@ func VerbIsPercentage() { fmt.Printf("%4.2% %d", 6) //@hiloc(z1, "%d", write),hiloc(z2, "6", read),highlightall(z1, z2) } +func SpecialChars() { + fmt.Printf("Hello \n %s, you \t \n have %d new messages!", "Alice", 5) //@hiloc(specials, "%s", write),hiloc(specialargs0, "\"Alice\"", read),highlightall(specials, specialargs0) + fmt.Printf("Hello \n %s, you \t \n have %d new messages!", "Alice", 5) //@hiloc(speciald, "%d", write),hiloc(specialargs1, "5", read),highlightall(speciald, specialargs1) +} + func Indexed() { fmt.Printf("%[1]d", 3) //@hiloc(i1, "%[1]d", write),hiloc(i2, "3", read),highlightall(i1, i2) fmt.Printf("%[1]*d", 3, 6) //@hiloc(i3, "[1]*", write),hiloc(i4, "3", read),hiloc(i5, "d", write),hiloc(i6, "6", read),highlightall(i3, i4),highlightall(i5, i6) diff --git a/internal/fmtstr/parse.go b/internal/fmtstr/parse.go index c24cd7eec46..ee15f28cb6a 100644 --- a/internal/fmtstr/parse.go +++ b/internal/fmtstr/parse.go @@ -5,7 +5,6 @@ package fmtstr import ( - _ "embed" "fmt" "go/ast" "go/constant" @@ -13,9 +12,60 @@ import ( "strconv" "strings" "unicode/utf8" - // "golang.org/x/tools/go/analysis/passes/internal/analysisutil" ) +// FormatDirective holds the parsed representation of a printf directive such as "%3.*[4]d". +// It is constructed by [ParsePrintf]. +type FormatDirective struct { + Format string // Full directive, e.g. "%[2]*.3d" + Range posRange // The range of Format within the overall format string + Flags []byte // Formatting flags, e.g. ['-', '0'] + Width *DirectiveSize // Width specifier, if any (e.g., '3' in '%3d') + Prec *DirectiveSize // Precision specifier, if any (e.g., '.4' in '%.4f') + Verb DirectiveVerb // Verb specifier, guaranteed to exist (e.g., '[1]d' in '%[1]d') + + // Parsing state (not used after parsing): + firstArg int // Index of the first argument after the format string + call *ast.CallExpr + argNum int // Which argument we're expecting to format now. + hasIndex bool // Whether the argument is indexed. + index int // The encountered index + indexPos int // The encountered index's offset + indexPending bool // Whether we have an indexed argument that has not resolved. + nbytes int // number of bytes of the format string consumed. +} + +type SizeKind int + +const ( + Literal SizeKind = iota // A literal number, e.g. "4" in "%4d" + Asterisk // A dynamic size from an argument, e.g. "%*d" + IndexedAsterisk // A dynamic size with an explicit index, e.g. "%[2]*d" +) + +// DirectiveSize describes a width or precision in a format directive. +// Depending on Kind, it may represent a literal number, a asterisk, or an indexed asterisk. +type DirectiveSize struct { + Kind SizeKind // Type of size specifier + Range posRange // Position of the size specifier within the directive + Size int // The literal size if Kind == Literal, otherwise -1 + Index int // If Kind == IndexedAsterisk, the argument index used to obtain the size, otherwise -1 + ArgIndex int // The argument index if Kind == Asterisk or IndexedAsterisk relative to CallExpr, otherwise -1 +} + +// DirectiveVerb represents the verb character of a format directive (e.g., 'd', 's', 'f'). +// It also includes positional information and any explicit argument indexing. +type DirectiveVerb struct { + Verb rune + Range posRange // The positional range of the verb in the format string + Index int // If the verb uses an indexed argument, this is the index, otherwise -1 + ArgIndex int // The argument index associated with this verb, relative to CallExpr, otherwise -1 +} + +type posRange struct { + Start, End int +} + // ParsePrintf takes a printf-like call expression, // extracts the format string, and parses out all format directives. Each // directive describes flags, width, precision, verb, and argument indexing. @@ -28,7 +78,7 @@ import ( func ParsePrintf(info *types.Info, call *ast.CallExpr) ([]*FormatDirective, error) { idx := FormatStringIndex(info, call) if idx < 0 || idx >= len(call.Args) { - return nil, fmt.Errorf("%s", "can't parse") + return nil, fmt.Errorf("not a valid printf-like call") } format, ok := StringConstantExpr(info, call.Args[idx]) if !ok { @@ -73,7 +123,7 @@ func parsePrintfVerb(call *ast.CallExpr, format string, firstArg, argNum int) (* state := &FormatDirective{ Format: format, Flags: make([]byte, 0, 5), - FirstArg: firstArg, + firstArg: firstArg, call: call, argNum: argNum, hasIndex: false, @@ -105,26 +155,26 @@ func parsePrintfVerb(call *ast.CallExpr, format string, firstArg, argNum int) (* } verb, w := utf8.DecodeRuneInString(state.Format[state.nbytes:]) - // Ensure there msut be a verb. + // Ensure there must be a verb. if state.indexPending { - state.Verb = &DirectiveVerb{ + state.Verb = DirectiveVerb{ Verb: verb, Range: posRange{ Start: state.indexPos, End: state.nbytes + w, }, - Index: state.index, - ArgNum: state.argNum, + Index: state.index, + ArgIndex: state.argNum, } } else { - state.Verb = &DirectiveVerb{ + state.Verb = DirectiveVerb{ Verb: verb, Range: posRange{ Start: state.nbytes, End: state.nbytes + w, }, - Index: -1, - ArgNum: state.argNum, + Index: -1, + ArgIndex: state.argNum, } } @@ -169,68 +219,14 @@ func StringConstantExpr(info *types.Info, expr ast.Expr) (string, bool) { return "", false } -// FormatDirective holds the parsed representation of a printf directive such as "%3.*[4]d". -// It is constructed by [ParsePrintf]. -type FormatDirective struct { - Format string // Full directive, e.g. "%[2]*.3d" - Range posRange // The range of Format within the overall format string - FirstArg int // Index of the first argument after the format string - Flags []byte // Formatting flags, e.g. ['-', '0'] - Width *DirectiveSize // Width specifier, if any (e.g., '3' in '%3d') - Prec *DirectiveSize // Precision specifier, if any (e.g., '.4' in '%.4f') - Verb *DirectiveVerb // Verb specifier, if any (e.g., '[1]d' in '%[1]d') - - // Parsing state (not used after parsing): - call *ast.CallExpr - argNum int - hasIndex bool - index int - indexPos int - indexPending bool - nbytes int -} - -type SizeKind int - -const ( - Literal SizeKind = iota // A literal number, e.g. "4" in "%4d" - Asterisk // A dynamic size from an argument, e.g. "%*d" - IndexedAsterisk // A dynamic size with an explicit index, e.g. "%[2]*d" -) - -// DirectiveSize describes a width or precision in a format directive. -// Depending on Kind, it may represent a literal number, a asterisk, or an indexed asterisk. -type DirectiveSize struct { - Kind SizeKind // Type of size specifier - Range posRange // Position of the size specifier within the directive - Size int // The literal size if Kind == Literal, otherwise -1 - Index int // If Kind == IndexedAsterisk, the argument index used to obtain the size - ArgNum int // The argument position if Kind == Asterisk or IndexedAsterisk, relative to CallExpr. -} - -// DirectiveVerb represents the verb character of a format directive (e.g., 'd', 's', 'f'). -// It also includes positional information and any explicit argument indexing. -type DirectiveVerb struct { - Verb rune - Range posRange // The positional range of the verb in the format string - Index int // If the verb uses an indexed argument, this is the index, otherwise -1 - ArgNum int // The argument position associated with this verb, relative to CallExpr. -} - -type posRange struct { - Start, End int -} - // addOffset adjusts the recorded positions in Verb, Width, Prec, and the // directive's overall Range to be relative to the position in the full format string. func (s *FormatDirective) addOffset(parsedLen int) { - if s.Verb != nil { - s.Verb.Range.Start += parsedLen - s.Verb.Range.End += parsedLen + s.Verb.Range.Start += parsedLen + s.Verb.Range.End += parsedLen - s.Range.Start = parsedLen - s.Range.End = s.Verb.Range.End - } + s.Range.Start = parsedLen + s.Range.End = s.Verb.Range.End if s.Prec != nil { s.Prec.Range.Start += parsedLen s.Prec.Range.End += parsedLen @@ -254,23 +250,6 @@ func (s *FormatDirective) parseFlags() { } } -// scanNum advances through a decimal number if present, which represents a [Size] or [Index]. -func (s *FormatDirective) scanNum() (int, bool) { - start := s.nbytes - for ; s.nbytes < len(s.Format); s.nbytes++ { - c := s.Format[s.nbytes] - if c < '0' || '9' < c { - if start < s.nbytes { - num, _ := strconv.ParseInt(s.Format[start:s.nbytes], 10, 32) - return int(num), true - } else { - return 0, false - } - } - } - return 0, false -} - // parseIndex parses an argument index of the form "[n]" that can appear // in a printf directive (e.g., "%[2]d"). Returns an error if syntax is // malformed or index is invalid. @@ -297,19 +276,36 @@ func (s *FormatDirective) parseIndex() error { s.nbytes = s.nbytes + start } arg32, err := strconv.ParseInt(s.Format[start:s.nbytes], 10, 32) - if err != nil || !ok || arg32 <= 0 || arg32 > int64(len(s.call.Args)-s.FirstArg) { + if err != nil || !ok || arg32 <= 0 || arg32 > int64(len(s.call.Args)-s.firstArg) { return fmt.Errorf("format has invalid argument index [%s]", s.Format[start:s.nbytes]) } s.nbytes++ // skip ']' arg := int(arg32) - arg += s.FirstArg - 1 // We want to zero-index the actual arguments. + arg += s.firstArg - 1 // We want to zero-index the actual arguments. s.argNum = arg s.hasIndex = true s.indexPending = true return nil } +// scanNum advances through a decimal number if present, which represents a [Size] or [Index]. +func (s *FormatDirective) scanNum() (int, bool) { + start := s.nbytes + for ; s.nbytes < len(s.Format); s.nbytes++ { + c := s.Format[s.nbytes] + if c < '0' || '9' < c { + if start < s.nbytes { + num, _ := strconv.ParseInt(s.Format[start:s.nbytes], 10, 32) + return int(num), true + } else { + return 0, false + } + } + } + return 0, false +} + type sizeType int const ( @@ -334,8 +330,8 @@ func (s *FormatDirective) parseSize(kind sizeType) { Start: s.indexPos, End: s.nbytes, }, - Index: s.index, - ArgNum: s.argNum, + Index: s.index, + ArgIndex: s.argNum, } switch kind { case Width: @@ -356,8 +352,8 @@ func (s *FormatDirective) parseSize(kind sizeType) { Start: s.nbytes - 1, End: s.nbytes, }, - Index: -1, - ArgNum: s.argNum, + Index: -1, + ArgIndex: s.argNum, } switch kind { case Width: @@ -381,8 +377,8 @@ func (s *FormatDirective) parseSize(kind sizeType) { Start: start, End: s.nbytes, }, - Index: -1, - ArgNum: -1, + Index: -1, + ArgIndex: -1, } switch kind { case Width: From 8475e75c60dd36fced57247162e69921604e1dc2 Mon Sep 17 00:00:00 2001 From: xzb <2598514867@qq.com> Date: Fri, 20 Dec 2024 02:34:39 +0800 Subject: [PATCH 08/14] add a format arg --- go/analysis/passes/printf/printf.go | 24 ++++++++++--- gopls/internal/golang/highlight.go | 16 ++++----- .../testdata/highlight/highlight_printf.txt | 5 +++ internal/fmtstr/parse.go | 35 +++++-------------- 4 files changed, 42 insertions(+), 38 deletions(-) diff --git a/go/analysis/passes/printf/printf.go b/go/analysis/passes/printf/printf.go index c28e185e3f1..a0c38c575a7 100644 --- a/go/analysis/passes/printf/printf.go +++ b/go/analysis/passes/printf/printf.go @@ -9,6 +9,7 @@ import ( _ "embed" "fmt" "go/ast" + "go/constant" "go/token" "go/types" "reflect" @@ -453,7 +454,7 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string return } formatArg := call.Args[idx] - format, ok := fmtstr.StringConstantExpr(pass.TypesInfo, formatArg) + format, ok := stringConstantExpr(pass.TypesInfo, formatArg) if !ok { // Format string argument is non-constant. @@ -487,7 +488,11 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string } return } - directives, err := fmtstr.ParsePrintf(pass.TypesInfo, call) + + // Pass the string constant value so + // fmt.Sprintf("%"+("s"), "hi", 3) can be reported as + // "fmt.Sprintf call needs 1 arg but has 2 args". + directives, err := fmtstr.ParsePrintf(pass.TypesInfo, call, format) if err != nil { pass.ReportRangef(call.Fun, "%s %s", name, err.Error()) return @@ -857,7 +862,7 @@ func checkPrint(pass *analysis.Pass, call *ast.CallExpr, name string) { } arg := args[0] - if s, ok := fmtstr.StringConstantExpr(pass.TypesInfo, arg); ok { + if s, ok := stringConstantExpr(pass.TypesInfo, arg); ok { // Ignore trailing % character // The % in "abc 0.0%" couldn't be a formatting directive. s = strings.TrimSuffix(s, "%") @@ -871,7 +876,7 @@ func checkPrint(pass *analysis.Pass, call *ast.CallExpr, name string) { if strings.HasSuffix(name, "ln") { // The last item, if a string, should not have a newline. arg = args[len(args)-1] - if s, ok := fmtstr.StringConstantExpr(pass.TypesInfo, arg); ok { + if s, ok := stringConstantExpr(pass.TypesInfo, arg); ok { if strings.HasSuffix(s, "\n") { pass.ReportRangef(call, "%s arg list ends with redundant newline", name) } @@ -887,6 +892,17 @@ func checkPrint(pass *analysis.Pass, call *ast.CallExpr, name string) { } } +// StringConstantExpr returns expression's string constant value. +// +// ("", false) is returned if expression isn't a string constant. +func stringConstantExpr(info *types.Info, expr ast.Expr) (string, bool) { + lit := info.Types[expr].Value + if lit != nil && lit.Kind() == constant.String { + return constant.StringVal(lit), true + } + return "", false +} + // count(n, what) returns "1 what" or "N whats" // (assuming the plural of what is whats). func count(n int, what string) string { diff --git a/gopls/internal/golang/highlight.go b/gopls/internal/golang/highlight.go index 8330df4a5ec..beb3555038d 100644 --- a/gopls/internal/golang/highlight.go +++ b/gopls/internal/golang/highlight.go @@ -80,9 +80,9 @@ func highlightPath(info *types.Info, path []ast.Node, pos token.Pos) (map[posRan if call, ok := node.(*ast.CallExpr); ok { idx := fmtstr.FormatStringIndex(info, call) if idx >= 0 && idx < len(call.Args) { - format, ok := fmtstr.StringConstantExpr(info, call.Args[idx]) - if ok && strings.Contains(format, "%") { - highlightPrintf(info, call, call.Args[idx].Pos(), pos, result) + // We only care string literal, so fmt.Sprint("a"+"b%s", "bar") won't highlight. + if lit, ok := call.Args[idx].(*ast.BasicLit); ok && strings.Contains(lit.Value, "%") { + highlightPrintf(info, call, call.Args[idx].Pos(), pos, lit.Value, result) } } } @@ -157,8 +157,8 @@ func highlightPath(info *types.Info, path []ast.Node, pos token.Pos) (map[posRan // // If the cursor is on %s or name, highlightPrintf will highlight %s as a write operation, // and name as a read operation. -func highlightPrintf(info *types.Info, call *ast.CallExpr, formatPos token.Pos, cursorPos token.Pos, result map[posRange]protocol.DocumentHighlightKind) { - directives, err := fmtstr.ParsePrintf(info, call) +func highlightPrintf(info *types.Info, call *ast.CallExpr, formatPos token.Pos, cursorPos token.Pos, format string, result map[posRange]protocol.DocumentHighlightKind) { + directives, err := fmtstr.ParsePrintf(info, call, format) if err != nil { return } @@ -166,9 +166,9 @@ func highlightPrintf(info *types.Info, call *ast.CallExpr, formatPos token.Pos, // highlightPair highlights the directive and its potential argument pair if the cursor is within either range. highlightPair := func(start, end token.Pos, argIndex int) bool { var ( - rangeStart = formatPos + token.Pos(start) + 1 // add offset for leading '"' - rangeEnd = formatPos + token.Pos(end) + 1 // add offset for leading '"' - arg ast.Expr // may not exist + rangeStart = formatPos + token.Pos(start) + rangeEnd = formatPos + token.Pos(end) + arg ast.Expr // may not exist ) if len(call.Args) > argIndex { arg = call.Args[argIndex] diff --git a/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt b/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt index b014be68cb2..baf635facf9 100644 --- a/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt +++ b/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt @@ -38,6 +38,11 @@ func SpecialChars() { fmt.Printf("Hello \n %s, you \t \n have %d new messages!", "Alice", 5) //@hiloc(speciald, "%d", write),hiloc(specialargs1, "5", read),highlightall(speciald, specialargs1) } +func Escaped() { + fmt.Printf("Hello %% \n %s, you \t%% \n have %d new m%%essages!", "Alice", 5) //@hiloc(escapeds, "%s", write),hiloc(escapedargs0, "\"Alice\"", read),highlightall(escapeds, escapedargs0) + fmt.Printf("Hello %% \n %s, you \t%% \n have %d new m%%essages!", "Alice", 5) //@hiloc(escapedd, "%s", write),hiloc(escapedargs1, "\"Alice\"", read),highlightall(escapedd, escapedargs1) +} + func Indexed() { fmt.Printf("%[1]d", 3) //@hiloc(i1, "%[1]d", write),hiloc(i2, "3", read),highlightall(i1, i2) fmt.Printf("%[1]*d", 3, 6) //@hiloc(i3, "[1]*", write),hiloc(i4, "3", read),hiloc(i5, "d", write),hiloc(i6, "6", read),highlightall(i3, i4),highlightall(i5, i6) diff --git a/internal/fmtstr/parse.go b/internal/fmtstr/parse.go index ee15f28cb6a..81458d1c672 100644 --- a/internal/fmtstr/parse.go +++ b/internal/fmtstr/parse.go @@ -1,4 +1,4 @@ -// Copyright 2010 The Go Authors. All rights reserved. +// Copyright 2024 The Go Authors. All rights reserved. // Use of this source code is governed by a BSD-style // license that can be found in the LICENSE file. @@ -7,7 +7,6 @@ package fmtstr import ( "fmt" "go/ast" - "go/constant" "go/types" "strconv" "strings" @@ -67,23 +66,18 @@ type posRange struct { } // ParsePrintf takes a printf-like call expression, -// extracts the format string, and parses out all format directives. Each -// directive describes flags, width, precision, verb, and argument indexing. -// This function returns a slice of parsed FormatDirective objects or an error -// if parsing fails. It does not perform any validation of flags, verbs, and -// existence of corresponding argument. -// -// Typical use case: Validate arguments passed to a Printf-like function call, -// DocumentHighlight, Hover, or SemanticHighlight. -func ParsePrintf(info *types.Info, call *ast.CallExpr) ([]*FormatDirective, error) { +// extracts the format string, and parses out all format directives. +// It returns a slice of parsed [FormatDirective] which describes +// flags, width, precision, verb, and argument indexing, or an error +// if parsing fails. It does not perform any validation of flags, verbs, nor the +// existence of corresponding arguments. +// The provided format may differ from the one in CallExpr, such as a concatenated string or a string +// referred to by the argument in CallExpr. +func ParsePrintf(info *types.Info, call *ast.CallExpr, format string) ([]*FormatDirective, error) { idx := FormatStringIndex(info, call) if idx < 0 || idx >= len(call.Args) { return nil, fmt.Errorf("not a valid printf-like call") } - format, ok := StringConstantExpr(info, call.Args[idx]) - if !ok { - return nil, fmt.Errorf("non-constant format string") - } if !strings.Contains(format, "%") { return nil, fmt.Errorf("call has arguments but no formatting directives") } @@ -208,17 +202,6 @@ func FormatStringIndex(info *types.Info, call *ast.CallExpr) int { return idx } -// StringConstantExpr returns expression's string constant value. -// -// ("", false) is returned if expression isn't a string constant. -func StringConstantExpr(info *types.Info, expr ast.Expr) (string, bool) { - lit := info.Types[expr].Value - if lit != nil && lit.Kind() == constant.String { - return constant.StringVal(lit), true - } - return "", false -} - // addOffset adjusts the recorded positions in Verb, Width, Prec, and the // directive's overall Range to be relative to the position in the full format string. func (s *FormatDirective) addOffset(parsedLen int) { From a8861b84765fa88a0bf938c09659827d8bf283b0 Mon Sep 17 00:00:00 2001 From: xzb <2598514867@qq.com> Date: Wed, 1 Jan 2025 17:39:27 +0800 Subject: [PATCH 09/14] ensure multiple Indexed directives get highlighted --- gopls/internal/golang/highlight.go | 35 ++++++++----------- .../testdata/highlight/highlight_printf.txt | 4 +++ 2 files changed, 19 insertions(+), 20 deletions(-) diff --git a/gopls/internal/golang/highlight.go b/gopls/internal/golang/highlight.go index beb3555038d..f447f052ec9 100644 --- a/gopls/internal/golang/highlight.go +++ b/gopls/internal/golang/highlight.go @@ -164,7 +164,7 @@ func highlightPrintf(info *types.Info, call *ast.CallExpr, formatPos token.Pos, } // highlightPair highlights the directive and its potential argument pair if the cursor is within either range. - highlightPair := func(start, end token.Pos, argIndex int) bool { + highlightPair := func(start, end token.Pos, argIndex int) { var ( rangeStart = formatPos + token.Pos(start) rangeEnd = formatPos + token.Pos(end) @@ -179,43 +179,38 @@ func highlightPrintf(info *types.Info, call *ast.CallExpr, formatPos token.Pos, if arg != nil { highlightRange(result, arg.Pos(), arg.End(), protocol.Read) } - return true } - return false } - // If width or prec has any *, we can not highlight the full range from % to verb, - // because it will overlap with the sub-range of *, for example: - // - // fmt.Printf("%*[3]d", 4, 5, 6) - // ^ ^ we can only highlight this range when cursor in 6. '*' as a one-rune range will - // highlight for 4. - anyAsterisk := false for _, directive := range directives { + // If width or prec has any *, we can not highlight the full range from % to verb, + // because it will overlap with the sub-range of *, for example: + // + // fmt.Printf("%*[3]d", 4, 5, 6) + // ^ ^ we can only highlight this range when cursor in 6. '*' as a one-rune range will + // highlight for 4. + anyAsterisk := false + width, prec, verb := directive.Width, directive.Prec, directive.Verb // Try highlight Width if there is a *. if width != nil && width.ArgIndex != -1 { anyAsterisk = true - if highlightPair(token.Pos(width.Range.Start), token.Pos(width.Range.End), width.ArgIndex) { - return - } + highlightPair(token.Pos(width.Range.Start), token.Pos(width.Range.End), width.ArgIndex) } // Try highlight Precision if there is a *. if prec != nil && prec.ArgIndex != -1 { anyAsterisk = true - if highlightPair(token.Pos(prec.Range.Start), token.Pos(prec.Range.End), prec.ArgIndex) { - return - } + highlightPair(token.Pos(prec.Range.Start), token.Pos(prec.Range.End), prec.ArgIndex) } // Try highlight Verb. if verb.Verb != '%' { // If any * is found inside directive, narrow the highlight range. - if anyAsterisk && highlightPair(token.Pos(verb.Range.Start), token.Pos(verb.Range.End), verb.ArgIndex) { - return - } else if highlightPair(token.Pos(directive.Range.Start), token.Pos(directive.Range.End), verb.ArgIndex) { - return + if anyAsterisk { + highlightPair(token.Pos(verb.Range.Start), token.Pos(verb.Range.End), verb.ArgIndex) + } else { + highlightPair(token.Pos(directive.Range.Start), token.Pos(directive.Range.End), verb.ArgIndex) } } } diff --git a/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt b/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt index baf635facf9..94967638548 100644 --- a/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt +++ b/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt @@ -49,3 +49,7 @@ func Indexed() { fmt.Printf("%[2]*[1]d", 3, 4) //@hiloc(i7, "[2]*", write),hiloc(i8, "4", read),hiloc(i9, "[1]d", write),hiloc(i10, "3", read),highlightall(i7, i8),highlightall(i9, i10) fmt.Printf("%[2]*.[1]*[3]d", 4, 5, 6) //@hiloc(i11, "[2]*", write),hiloc(i12, "5", read),hiloc(i13, ".[1]*", write),hiloc(i14, "4", read),hiloc(i15, "[3]d", write),hiloc(i16, "6", read),highlightall(i11, i12),highlightall(i13, i14),highlightall(i15, i16) } + +func MultipleIndexed() { + fmt.Printf("%[1]d %[1].2d", 3) //@hiloc(m1, "%[1]d", write),hiloc(m2, "3", read),hiloc(m3, "%[1].2d", read),highlightall(m1, m2, m3) +} From 2173aa97f7aebfa61941d30af9132a39a8398f21 Mon Sep 17 00:00:00 2001 From: xzb <2598514867@qq.com> Date: Tue, 7 Jan 2025 08:10:54 +0800 Subject: [PATCH 10/14] test pass --- go/analysis/passes/printf/printf.go | 63 +++-- go/analysis/passes/printf/testdata/src/a/a.go | 4 +- gopls/internal/golang/highlight.go | 89 +----- .../testdata/highlight/highlight_printf.txt | 55 ---- internal/fmtstr/parse.go | 264 ++++++++---------- 5 files changed, 164 insertions(+), 311 deletions(-) delete mode 100644 gopls/internal/test/marker/testdata/highlight/highlight_printf.txt diff --git a/go/analysis/passes/printf/printf.go b/go/analysis/passes/printf/printf.go index a0c38c575a7..e9651e1a293 100644 --- a/go/analysis/passes/printf/printf.go +++ b/go/analysis/passes/printf/printf.go @@ -447,9 +447,34 @@ func isFormatter(typ types.Type) bool { types.Identical(sig.Params().At(1).Type(), types.Typ[types.Rune]) } +// FormatStringIndex returns the index of the format string (the last +// non-variadic parameter) within the given printf-like call +// expression, or -1 if unknown. +func FormatStringIndex(info *types.Info, call *ast.CallExpr) int { + typ := info.Types[call.Fun].Type + if typ == nil { + return -1 // missing type + } + sig, ok := typ.(*types.Signature) + if !ok { + return -1 // ill-typed + } + if !sig.Variadic() { + // Skip checking non-variadic functions. + return -1 + } + idx := sig.Params().Len() - 2 + if idx < 0 { + // Skip checking variadic functions without + // fixed arguments. + return -1 + } + return idx +} + // checkPrintf checks a call to a formatted print routine such as Printf. func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string) { - idx := fmtstr.FormatStringIndex(pass.TypesInfo, call) + idx := FormatStringIndex(pass.TypesInfo, call) if idx < 0 || idx >= len(call.Args) { return } @@ -492,9 +517,9 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string // Pass the string constant value so // fmt.Sprintf("%"+("s"), "hi", 3) can be reported as // "fmt.Sprintf call needs 1 arg but has 2 args". - directives, err := fmtstr.ParsePrintf(pass.TypesInfo, call, format) + directives, err := fmtstr.Parse(format, idx) if err != nil { - pass.ReportRangef(call.Fun, "%s %s", name, err.Error()) + pass.ReportRangef(call.Args[idx], "%s %s", name, err) return } @@ -502,9 +527,9 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string anyIndex := false // Check formats against args. for _, directive := range directives { - if (directive.Prec != nil && directive.Prec.Index != -1) || - (directive.Width != nil && directive.Width.Index != -1) || - (directive.Verb.Index != -1) { + if (directive.Prec.Index > 0) || + (directive.Width.Index > 0) || + (directive.Verb.Index > 0) { anyIndex = true } if !okPrintfArg(pass, call, &maxArgIndex, firstArg, name, directive) { // One error per format is enough. @@ -597,7 +622,7 @@ var printVerbs = []printVerb{ // okPrintfArg compares the FormatDirective to the arguments actually present, // reporting any discrepancies it can discern. If the final argument is ellipsissed, // there's little it can do for that. -func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firstArg int, name string, directive *fmtstr.FormatDirective) (ok bool) { +func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firstArg int, name string, directive *fmtstr.Operation) (ok bool) { verb := directive.Verb.Verb var v printVerb found := false @@ -620,7 +645,7 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firs if !formatter { if !found { - pass.ReportRangef(call, "%s format %s has unknown verb %c", name, directive.Format, verb) + pass.ReportRangef(call, "%s format %s has unknown verb %c", name, directive.Text, verb) return false } for _, flag := range directive.Flags { @@ -630,7 +655,7 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firs continue } if !strings.ContainsRune(v.flags, rune(flag)) { - pass.ReportRangef(call, "%s format %s has unrecognized flag %c", name, directive.Format, flag) + pass.ReportRangef(call, "%s format %s has unrecognized flag %c", name, directive.Text, flag) return false } } @@ -638,11 +663,11 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firs var argIndexes []int // First check for *. - if directive.Width != nil && directive.Width.ArgIndex != -1 { - argIndexes = append(argIndexes, directive.Width.ArgIndex) + if directive.Width.Dynamic > 0 { + argIndexes = append(argIndexes, directive.Width.Dynamic) } - if directive.Prec != nil && directive.Prec.ArgIndex != -1 { - argIndexes = append(argIndexes, directive.Prec.ArgIndex) + if directive.Prec.Dynamic > 0 { + argIndexes = append(argIndexes, directive.Prec.Dynamic) } // If len(argIndexes)>0, we have something like %.*s and all // indexes in argIndexes must be an integer. @@ -657,7 +682,7 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firs if reason != "" { details = " (" + reason + ")" } - pass.ReportRangef(call, "%s format %s uses non-int %s%s as argument of *", name, directive.Format, analysisutil.Format(pass.Fset, arg), details) + pass.ReportRangef(call, "%s format %s uses non-int %s%s as argument of *", name, directive.Text, analysisutil.Format(pass.Fset, arg), details) return false } } @@ -686,7 +711,7 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firs } arg := call.Args[verbArgIndex] if isFunctionValue(pass, arg) && verb != 'p' && verb != 'T' { - pass.ReportRangef(call, "%s format %s arg %s is a func value, not called", name, directive.Format, analysisutil.Format(pass.Fset, arg)) + pass.ReportRangef(call, "%s format %s arg %s is a func value, not called", name, directive.Text, analysisutil.Format(pass.Fset, arg)) return false } if reason, ok := matchArgType(pass, v.typ, arg); !ok { @@ -698,12 +723,12 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firs if reason != "" { details = " (" + reason + ")" } - pass.ReportRangef(call, "%s format %s has arg %s of wrong type %s%s", name, directive.Format, analysisutil.Format(pass.Fset, arg), typeString, details) + pass.ReportRangef(call, "%s format %s has arg %s of wrong type %s%s", name, directive.Text, analysisutil.Format(pass.Fset, arg), typeString, details) return false } if v.typ&argString != 0 && v.verb != 'T' && !bytes.Contains(directive.Flags, []byte{'#'}) { if methodName, ok := recursiveStringer(pass, arg); ok { - pass.ReportRangef(call, "%s format %s with arg %s causes recursive %s method call", name, directive.Format, analysisutil.Format(pass.Fset, arg), methodName) + pass.ReportRangef(call, "%s format %s with arg %s causes recursive %s method call", name, directive.Text, analysisutil.Format(pass.Fset, arg), methodName) return false } } @@ -787,7 +812,7 @@ func isFunctionValue(pass *analysis.Pass, e ast.Expr) bool { // argCanBeChecked reports whether the specified argument is statically present; // it may be beyond the list of arguments or in a terminal slice... argument, which // means we can't see it. -func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, argIndex, firstArg int, directive *fmtstr.FormatDirective, name string) bool { +func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, argIndex, firstArg int, directive *fmtstr.Operation, name string) bool { if argIndex <= 0 { // Shouldn't happen, so catch it with prejudice. panic("negative argIndex") @@ -804,7 +829,7 @@ func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, argIndex, firstArg // There are bad indexes in the format or there are fewer arguments than the format needs. // This is the argument number relative to the format: Printf("%s", "hi") will give 1 for the "hi". arg := argIndex - firstArg + 1 // People think of arguments as 1-indexed. - pass.ReportRangef(call, "%s format %s reads arg #%d, but call has %v", name, directive.Format, arg, count(len(call.Args)-firstArg, "arg")) + pass.ReportRangef(call, "%s format %s reads arg #%d, but call has %v", name, directive.Text, arg, count(len(call.Args)-firstArg, "arg")) return false } diff --git a/go/analysis/passes/printf/testdata/src/a/a.go b/go/analysis/passes/printf/testdata/src/a/a.go index 18b9e3be2b9..02ce425f8a3 100644 --- a/go/analysis/passes/printf/testdata/src/a/a.go +++ b/go/analysis/passes/printf/testdata/src/a/a.go @@ -212,8 +212,8 @@ func PrintfTests() { // Bad argument reorderings. Printf("%[xd", 3) // want `a.Printf format %\[xd is missing closing \]` Printf("%[x]d x", 3) // want `a.Printf format has invalid argument index \[x\]` - Printf("%[3]*s x", "hi", 2) // want `a.Printf format has invalid argument index \[3\]` - _ = fmt.Sprintf("%[3]d x", 2) // want `fmt.Sprintf format has invalid argument index \[3\]` + Printf("%[3]*s x", "hi", 2) // want `a.Printf format %\[3]\*s reads arg #3, but call has 2 args` + _ = fmt.Sprintf("%[3]d x", 2) // want `fmt.Sprintf format %\[3]d reads arg #3, but call has 1 arg` Printf("%[2]*.[1]*[3]d x", 2, "hi", 4) // want `a.Printf format %\[2]\*\.\[1\]\*\[3\]d uses non-int \x22hi\x22 as argument of \*` Printf("%[0]s x", "arg1") // want `a.Printf format has invalid argument index \[0\]` Printf("%[0]d x", 1) // want `a.Printf format has invalid argument index \[0\]` diff --git a/gopls/internal/golang/highlight.go b/gopls/internal/golang/highlight.go index f447f052ec9..1174ce7f7d4 100644 --- a/gopls/internal/golang/highlight.go +++ b/gopls/internal/golang/highlight.go @@ -10,14 +10,12 @@ import ( "go/ast" "go/token" "go/types" - "strings" "golang.org/x/tools/go/ast/astutil" "golang.org/x/tools/gopls/internal/cache" "golang.org/x/tools/gopls/internal/file" "golang.org/x/tools/gopls/internal/protocol" "golang.org/x/tools/internal/event" - "golang.org/x/tools/internal/fmtstr" ) func Highlight(ctx context.Context, snapshot *cache.Snapshot, fh file.Handle, position protocol.Position) ([]protocol.DocumentHighlight, error) { @@ -51,7 +49,7 @@ func Highlight(ctx context.Context, snapshot *cache.Snapshot, fh file.Handle, po } } } - result, err := highlightPath(pkg.TypesInfo(), path, pos) + result, err := highlightPath(path, pgf.File, pkg.TypesInfo()) if err != nil { return nil, err } @@ -71,24 +69,8 @@ func Highlight(ctx context.Context, snapshot *cache.Snapshot, fh file.Handle, po // highlightPath returns ranges to highlight for the given enclosing path, // which should be the result of astutil.PathEnclosingInterval. -func highlightPath(info *types.Info, path []ast.Node, pos token.Pos) (map[posRange]protocol.DocumentHighlightKind, error) { +func highlightPath(path []ast.Node, file *ast.File, info *types.Info) (map[posRange]protocol.DocumentHighlightKind, error) { result := make(map[posRange]protocol.DocumentHighlightKind) - - // Inside a printf-style call, printf("...%v...", arg)? - // Treat each corresponding ("%v", arg) pair as a highlight class. - for _, node := range path { - if call, ok := node.(*ast.CallExpr); ok { - idx := fmtstr.FormatStringIndex(info, call) - if idx >= 0 && idx < len(call.Args) { - // We only care string literal, so fmt.Sprint("a"+"b%s", "bar") won't highlight. - if lit, ok := call.Args[idx].(*ast.BasicLit); ok && strings.Contains(lit.Value, "%") { - highlightPrintf(info, call, call.Args[idx].Pos(), pos, lit.Value, result) - } - } - } - } - - file := path[len(path)-1].(*ast.File) switch node := path[0].(type) { case *ast.BasicLit: // Import path string literal? @@ -149,73 +131,6 @@ func highlightPath(info *types.Info, path []ast.Node, pos token.Pos) (map[posRan return result, nil } -// highlightPrintf highlights directives in a format string and their corresponding -// variadic arguments in a printf-style function call. -// For example: -// -// fmt.Printf("Hello %s, you scored %d", name, score) -// -// If the cursor is on %s or name, highlightPrintf will highlight %s as a write operation, -// and name as a read operation. -func highlightPrintf(info *types.Info, call *ast.CallExpr, formatPos token.Pos, cursorPos token.Pos, format string, result map[posRange]protocol.DocumentHighlightKind) { - directives, err := fmtstr.ParsePrintf(info, call, format) - if err != nil { - return - } - - // highlightPair highlights the directive and its potential argument pair if the cursor is within either range. - highlightPair := func(start, end token.Pos, argIndex int) { - var ( - rangeStart = formatPos + token.Pos(start) - rangeEnd = formatPos + token.Pos(end) - arg ast.Expr // may not exist - ) - if len(call.Args) > argIndex { - arg = call.Args[argIndex] - } - - if (cursorPos >= rangeStart && cursorPos < rangeEnd) || (arg != nil && cursorPos >= arg.Pos() && cursorPos < arg.End()) { - highlightRange(result, rangeStart, rangeEnd, protocol.Write) - if arg != nil { - highlightRange(result, arg.Pos(), arg.End(), protocol.Read) - } - } - } - - for _, directive := range directives { - // If width or prec has any *, we can not highlight the full range from % to verb, - // because it will overlap with the sub-range of *, for example: - // - // fmt.Printf("%*[3]d", 4, 5, 6) - // ^ ^ we can only highlight this range when cursor in 6. '*' as a one-rune range will - // highlight for 4. - anyAsterisk := false - - width, prec, verb := directive.Width, directive.Prec, directive.Verb - // Try highlight Width if there is a *. - if width != nil && width.ArgIndex != -1 { - anyAsterisk = true - highlightPair(token.Pos(width.Range.Start), token.Pos(width.Range.End), width.ArgIndex) - } - - // Try highlight Precision if there is a *. - if prec != nil && prec.ArgIndex != -1 { - anyAsterisk = true - highlightPair(token.Pos(prec.Range.Start), token.Pos(prec.Range.End), prec.ArgIndex) - } - - // Try highlight Verb. - if verb.Verb != '%' { - // If any * is found inside directive, narrow the highlight range. - if anyAsterisk { - highlightPair(token.Pos(verb.Range.Start), token.Pos(verb.Range.End), verb.ArgIndex) - } else { - highlightPair(token.Pos(directive.Range.Start), token.Pos(directive.Range.End), verb.ArgIndex) - } - } - } -} - type posRange struct { start, end token.Pos } diff --git a/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt b/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt deleted file mode 100644 index 94967638548..00000000000 --- a/gopls/internal/test/marker/testdata/highlight/highlight_printf.txt +++ /dev/null @@ -1,55 +0,0 @@ -This test checks functionality of the printf-like directives and operands highlight. - --- flags -- --ignore_extra_diags - --- highlights.go -- -package highlightprintf - -import ( - "fmt" -) - -func BasicPrintfHighlights() { - fmt.Printf("Hello %s, you have %d new messages!", "Alice", 5) //@hiloc(normals, "%s", write),hiloc(normalarg0, "\"Alice\"", read),highlightall(normals, normalarg0) - fmt.Printf("Hello %s, you have %d new messages!", "Alice", 5) //@hiloc(normald, "%d", write),hiloc(normalargs1, "5", read),highlightall(normald, normalargs1) -} - -func ComplexPrintfHighlights() { - fmt.Printf("Hello %#3.4s, you have %-2.3d new messages!", "Alice", 5) //@hiloc(complexs, "%#3.4s", write),hiloc(complexarg0, "\"Alice\"", read),highlightall(complexs, complexarg0) - fmt.Printf("Hello %#3.4s, you have %-2.3d new messages!", "Alice", 5) //@hiloc(complexd, "%-2.3d", write),hiloc(complexarg1, "5", read),highlightall(complexd, complexarg1) -} - -func MissingDirectives() { - fmt.Printf("Hello %s, you have 5 new messages!", "Alice", 5) //@hiloc(missings, "%s", write),hiloc(missingargs0, "\"Alice\"", read),highlightall(missings, missingargs0) -} - -func TooManyDirectives() { - fmt.Printf("Hello %s, you have %d new %s %q messages!", "Alice", 5) //@hiloc(toomanys, "%s", write),hiloc(toomanyargs0, "\"Alice\"", read),highlightall(toomanys, toomanyargs0) - fmt.Printf("Hello %s, you have %d new %s %q messages!", "Alice", 5) //@hiloc(toomanyd, "%d", write),hiloc(toomanyargs1, "5", read),highlightall(toomanyd, toomanyargs1) -} - -func VerbIsPercentage() { - fmt.Printf("%4.2% %d", 6) //@hiloc(z1, "%d", write),hiloc(z2, "6", read),highlightall(z1, z2) -} - -func SpecialChars() { - fmt.Printf("Hello \n %s, you \t \n have %d new messages!", "Alice", 5) //@hiloc(specials, "%s", write),hiloc(specialargs0, "\"Alice\"", read),highlightall(specials, specialargs0) - fmt.Printf("Hello \n %s, you \t \n have %d new messages!", "Alice", 5) //@hiloc(speciald, "%d", write),hiloc(specialargs1, "5", read),highlightall(speciald, specialargs1) -} - -func Escaped() { - fmt.Printf("Hello %% \n %s, you \t%% \n have %d new m%%essages!", "Alice", 5) //@hiloc(escapeds, "%s", write),hiloc(escapedargs0, "\"Alice\"", read),highlightall(escapeds, escapedargs0) - fmt.Printf("Hello %% \n %s, you \t%% \n have %d new m%%essages!", "Alice", 5) //@hiloc(escapedd, "%s", write),hiloc(escapedargs1, "\"Alice\"", read),highlightall(escapedd, escapedargs1) -} - -func Indexed() { - fmt.Printf("%[1]d", 3) //@hiloc(i1, "%[1]d", write),hiloc(i2, "3", read),highlightall(i1, i2) - fmt.Printf("%[1]*d", 3, 6) //@hiloc(i3, "[1]*", write),hiloc(i4, "3", read),hiloc(i5, "d", write),hiloc(i6, "6", read),highlightall(i3, i4),highlightall(i5, i6) - fmt.Printf("%[2]*[1]d", 3, 4) //@hiloc(i7, "[2]*", write),hiloc(i8, "4", read),hiloc(i9, "[1]d", write),hiloc(i10, "3", read),highlightall(i7, i8),highlightall(i9, i10) - fmt.Printf("%[2]*.[1]*[3]d", 4, 5, 6) //@hiloc(i11, "[2]*", write),hiloc(i12, "5", read),hiloc(i13, ".[1]*", write),hiloc(i14, "4", read),hiloc(i15, "[3]d", write),hiloc(i16, "6", read),highlightall(i11, i12),highlightall(i13, i14),highlightall(i15, i16) -} - -func MultipleIndexed() { - fmt.Printf("%[1]d %[1].2d", 3) //@hiloc(m1, "%[1]d", write),hiloc(m2, "3", read),hiloc(m3, "%[1].2d", read),highlightall(m1, m2, m3) -} diff --git a/internal/fmtstr/parse.go b/internal/fmtstr/parse.go index 81458d1c672..96fb7a9a4d2 100644 --- a/internal/fmtstr/parse.go +++ b/internal/fmtstr/parse.go @@ -2,30 +2,31 @@ // Use of this source code is governed by a BSD-style // license that can be found in the LICENSE file. +// Package fmtstr defines a parser for format strings as used by [fmt.Printf]. + package fmtstr import ( "fmt" - "go/ast" - "go/types" "strconv" "strings" "unicode/utf8" ) -// FormatDirective holds the parsed representation of a printf directive such as "%3.*[4]d". -// It is constructed by [ParsePrintf]. -type FormatDirective struct { - Format string // Full directive, e.g. "%[2]*.3d" - Range posRange // The range of Format within the overall format string - Flags []byte // Formatting flags, e.g. ['-', '0'] - Width *DirectiveSize // Width specifier, if any (e.g., '3' in '%3d') - Prec *DirectiveSize // Precision specifier, if any (e.g., '.4' in '%.4f') - Verb DirectiveVerb // Verb specifier, guaranteed to exist (e.g., '[1]d' in '%[1]d') +// Operation holds the parsed representation of a printf operation such as "%3.*[4]d". +// It is constructed by [Parse]. +type Operation struct { + Text string // Full text of the operation, e.g. "%[2]*.3d" + Verb Verb // Verb specifier, guaranteed to exist, e.g., 'd' in '%[1]d' + Range Range // The range of Text within the overall format string + Flags []byte // Formatting flags, e.g. "-0" + Width Size // Width specifier, e.g., '3' in '%3d' + Prec Size // Precision specifier, e.g., '.4' in '%.4f' +} - // Parsing state (not used after parsing): - firstArg int // Index of the first argument after the format string - call *ast.CallExpr +type state struct { + operation *Operation + firstArg int // Index of the first argument after the format string argNum int // Which argument we're expecting to format now. hasIndex bool // Whether the argument is indexed. index int // The encountered index @@ -34,97 +35,99 @@ type FormatDirective struct { nbytes int // number of bytes of the format string consumed. } -type SizeKind int +// Size describes a width or precision in a format operation. +// It may represent a literal number, a asterisk, or an indexed asterisk. +// +// Zero value of Size means non-exsistence. +type Size struct { + // At most one of these two fields is non-zero. + Fixed int // e.g. 4 from "%4d" + Dynamic int // index of argument providing dynamic size (e.g. %*d or %[3]*d) -const ( - Literal SizeKind = iota // A literal number, e.g. "4" in "%4d" - Asterisk // A dynamic size from an argument, e.g. "%*d" - IndexedAsterisk // A dynamic size with an explicit index, e.g. "%[2]*d" -) + Index int // If the width or precision uses an indexed argument (e.g. 2 in %[2]d), this is the index. + Range Range // Position of the size specifier within the operation +} -// DirectiveSize describes a width or precision in a format directive. -// Depending on Kind, it may represent a literal number, a asterisk, or an indexed asterisk. -type DirectiveSize struct { - Kind SizeKind // Type of size specifier - Range posRange // Position of the size specifier within the directive - Size int // The literal size if Kind == Literal, otherwise -1 - Index int // If Kind == IndexedAsterisk, the argument index used to obtain the size, otherwise -1 - ArgIndex int // The argument index if Kind == Asterisk or IndexedAsterisk relative to CallExpr, otherwise -1 +func (s Size) IsZero() bool { + return s.Fixed == 0 && s.Dynamic == 0 } -// DirectiveVerb represents the verb character of a format directive (e.g., 'd', 's', 'f'). +// Verb represents the verb character of a format operation (e.g., 'd', 's', 'f'). // It also includes positional information and any explicit argument indexing. -type DirectiveVerb struct { +type Verb struct { Verb rune - Range posRange // The positional range of the verb in the format string - Index int // If the verb uses an indexed argument, this is the index, otherwise -1 - ArgIndex int // The argument index associated with this verb, relative to CallExpr, otherwise -1 + Range Range // The positional range of the verb in the format string + Index int // If the verb uses an indexed argument, this is the index, otherwise -1 + ArgIndex int // The argument index associated with this verb, relative to CallExpr, otherwise -1 } -type posRange struct { +// byte offsets of format string +type Range struct { Start, End int } -// ParsePrintf takes a printf-like call expression, -// extracts the format string, and parses out all format directives. -// It returns a slice of parsed [FormatDirective] which describes -// flags, width, precision, verb, and argument indexing, or an error -// if parsing fails. It does not perform any validation of flags, verbs, nor the -// existence of corresponding arguments. -// The provided format may differ from the one in CallExpr, such as a concatenated string or a string +// Parse takes a format string and its index in the printf-like call, +// parses out all format operations. it returns a slice of parsed +// [Operation] which describes flags, width, precision, verb, and argument indexing, +// or an error if parsing fails. +// +// All error messages are in predicate form ("call has a problem") +// so that they may be affixed into a subject ("log.Printf "). +// See https://go-review.googlesource.com/c/tools/+/632598/comment/9d980373_e6460abf/ +// +// It does not perform any validation of flags, verbs, nor the +// existence of corresponding arguments. The provided format string may differ +// from the one in CallExpr, such as a concatenated string or a string // referred to by the argument in CallExpr. -func ParsePrintf(info *types.Info, call *ast.CallExpr, format string) ([]*FormatDirective, error) { - idx := FormatStringIndex(info, call) - if idx < 0 || idx >= len(call.Args) { - return nil, fmt.Errorf("not a valid printf-like call") - } +func Parse(format string, idx int) ([]*Operation, error) { if !strings.Contains(format, "%") { return nil, fmt.Errorf("call has arguments but no formatting directives") } firstArg := idx + 1 // Arguments are immediately after format string. argNum := firstArg - var states []*FormatDirective + var operations []*Operation for i, w := 0, 0; i < len(format); i += w { w = 1 if format[i] != '%' { continue } - state, err := parsePrintfVerb(call, format[i:], firstArg, argNum) + state, err := parseOperation(format[i:], firstArg, argNum) if err != nil { return nil, err } - state.addOffset(i) - states = append(states, state) + state.operation.addOffset(i) + operations = append(operations, state.operation) - w = len(state.Format) + w = len(state.operation.Text) // Do not waste an argument for '%'. - if state.Verb.Verb != '%' { + if state.operation.Verb.Verb != '%' { argNum = state.argNum + 1 } } - return states, nil + return operations, nil } -// parsePrintfVerb parses one format directive starting at the given substring `format`, -// which should begin with '%'. It returns a fully populated FormatDirective or an error -// if the directive is malformed. The firstArg and argNum parameters help determine how -// arguments map to this directive. +// parseOperation parses one format operation starting at the given substring `format`, +// which should begin with '%'. It returns a fully populated state or an error +// if the operation is malformed. The firstArg and argNum parameters help determine how +// arguments map to this operation. // // Parse sequence: '%' -> flags -> {[N]* or width} -> .{[N]* or precision} -> [N] -> verb. -func parsePrintfVerb(call *ast.CallExpr, format string, firstArg, argNum int) (*FormatDirective, error) { - state := &FormatDirective{ - Format: format, - Flags: make([]byte, 0, 5), +func parseOperation(format string, firstArg, argNum int) (*state, error) { + state := &state{ + operation: &Operation{ + Text: format, + Flags: make([]byte, 0, 5), + }, firstArg: firstArg, - call: call, argNum: argNum, hasIndex: false, index: 0, indexPos: 0, indexPending: false, - nbytes: 1, // There's guaranteed to be a percent sign. + nbytes: len("%"), // There's guaranteed to be a percent sign. } // There may be flags. state.parseFlags() @@ -144,16 +147,16 @@ func parsePrintfVerb(call *ast.CallExpr, format string, firstArg, argNum int) (* return nil, err } } - if state.nbytes == len(state.Format) { - return nil, fmt.Errorf("format %s is missing verb at end of string", state.Format) + if state.nbytes == len(state.operation.Text) { + return nil, fmt.Errorf("format %s is missing verb at end of string", state.operation.Text) } - verb, w := utf8.DecodeRuneInString(state.Format[state.nbytes:]) + verb, w := utf8.DecodeRuneInString(state.operation.Text[state.nbytes:]) // Ensure there must be a verb. if state.indexPending { - state.Verb = DirectiveVerb{ + state.operation.Verb = Verb{ Verb: verb, - Range: posRange{ + Range: Range{ Start: state.indexPos, End: state.nbytes + w, }, @@ -161,9 +164,9 @@ func parsePrintfVerb(call *ast.CallExpr, format string, firstArg, argNum int) (* ArgIndex: state.argNum, } } else { - state.Verb = DirectiveVerb{ + state.operation.Verb = Verb{ Verb: verb, - Range: posRange{ + Range: Range{ Start: state.nbytes, End: state.nbytes + w, }, @@ -173,59 +176,34 @@ func parsePrintfVerb(call *ast.CallExpr, format string, firstArg, argNum int) (* } state.nbytes += w - state.Format = state.Format[:state.nbytes] + state.operation.Text = state.operation.Text[:state.nbytes] return state, nil } -// FormatStringIndex returns the index of the format string (the last -// non-variadic parameter) within the given printf-like call -// expression, or -1 if unknown. -func FormatStringIndex(info *types.Info, call *ast.CallExpr) int { - typ := info.Types[call.Fun].Type - if typ == nil { - return -1 // missing type - } - sig, ok := typ.(*types.Signature) - if !ok { - return -1 // ill-typed - } - if !sig.Variadic() { - // Skip checking non-variadic functions. - return -1 - } - idx := sig.Params().Len() - 2 - if idx < 0 { - // Skip checking variadic functions without - // fixed arguments. - return -1 - } - return idx -} - // addOffset adjusts the recorded positions in Verb, Width, Prec, and the -// directive's overall Range to be relative to the position in the full format string. -func (s *FormatDirective) addOffset(parsedLen int) { +// operation's overall Range to be relative to the position in the full format string. +func (s *Operation) addOffset(parsedLen int) { s.Verb.Range.Start += parsedLen s.Verb.Range.End += parsedLen s.Range.Start = parsedLen s.Range.End = s.Verb.Range.End - if s.Prec != nil { + if !s.Prec.IsZero() { s.Prec.Range.Start += parsedLen s.Prec.Range.End += parsedLen } - if s.Width != nil { + if !s.Width.IsZero() { s.Width.Range.Start += parsedLen s.Width.Range.End += parsedLen } } // parseFlags accepts any printf flags. -func (s *FormatDirective) parseFlags() { - for s.nbytes < len(s.Format) { - switch c := s.Format[s.nbytes]; c { +func (s *state) parseFlags() { + for s.nbytes < len(s.operation.Text) { + switch c := s.operation.Text[s.nbytes]; c { case '#', '0', '+', '-', ' ': - s.Flags = append(s.Flags, c) + s.operation.Flags = append(s.operation.Flags, c) s.nbytes++ default: return @@ -236,8 +214,8 @@ func (s *FormatDirective) parseFlags() { // parseIndex parses an argument index of the form "[n]" that can appear // in a printf directive (e.g., "%[2]d"). Returns an error if syntax is // malformed or index is invalid. -func (s *FormatDirective) parseIndex() error { - if s.nbytes == len(s.Format) || s.Format[s.nbytes] != '[' { +func (s *state) parseIndex() error { + if s.nbytes == len(s.operation.Text) || s.operation.Text[s.nbytes] != '[' { return nil } // Argument index present. @@ -250,17 +228,17 @@ func (s *FormatDirective) parseIndex() error { } ok := true - if s.nbytes == len(s.Format) || s.nbytes == start || s.Format[s.nbytes] != ']' { + if s.nbytes == len(s.operation.Text) || s.nbytes == start || s.operation.Text[s.nbytes] != ']' { ok = false // syntax error is either missing "]" or invalid index. - s.nbytes = strings.Index(s.Format[start:], "]") + s.nbytes = strings.Index(s.operation.Text[start:], "]") if s.nbytes < 0 { - return fmt.Errorf("format %s is missing closing ]", s.Format) + return fmt.Errorf("format %s is missing closing ]", s.operation.Text) } s.nbytes = s.nbytes + start } - arg32, err := strconv.ParseInt(s.Format[start:s.nbytes], 10, 32) - if err != nil || !ok || arg32 <= 0 || arg32 > int64(len(s.call.Args)-s.firstArg) { - return fmt.Errorf("format has invalid argument index [%s]", s.Format[start:s.nbytes]) + arg32, err := strconv.ParseInt(s.operation.Text[start:s.nbytes], 10, 32) + if err != nil || !ok || arg32 <= 0 { + return fmt.Errorf("format has invalid argument index [%s]", s.operation.Text[start:s.nbytes]) } s.nbytes++ // skip ']' @@ -273,13 +251,13 @@ func (s *FormatDirective) parseIndex() error { } // scanNum advances through a decimal number if present, which represents a [Size] or [Index]. -func (s *FormatDirective) scanNum() (int, bool) { +func (s *state) scanNum() (int, bool) { start := s.nbytes - for ; s.nbytes < len(s.Format); s.nbytes++ { - c := s.Format[s.nbytes] + for ; s.nbytes < len(s.operation.Text); s.nbytes++ { + c := s.operation.Text[s.nbytes] if c < '0' || '9' < c { if start < s.nbytes { - num, _ := strconv.ParseInt(s.Format[start:s.nbytes], 10, 32) + num, _ := strconv.ParseInt(s.operation.Text[start:s.nbytes], 10, 32) return int(num), true } else { return 0, false @@ -297,54 +275,47 @@ const ( ) // parseSize parses a width or precision specifier. It handles literal numeric -// values (e.g., "%3d"), asterisk values (e.g., "%*d"), or indexed asterisk -// values (e.g., "%[2]*d"). The kind parameter specifies whether it's parsing -// a Width or a Precision. -func (s *FormatDirective) parseSize(kind sizeType) { - if s.nbytes < len(s.Format) && s.Format[s.nbytes] == '*' { +// values (e.g., "%3d"), asterisk values (e.g., "%*d"), or indexed asterisk values (e.g., "%[2]*d"). +func (s *state) parseSize(kind sizeType) { + if s.nbytes < len(s.operation.Text) && s.operation.Text[s.nbytes] == '*' { s.nbytes++ if s.indexPending { // Absorb it. s.indexPending = false - size := &DirectiveSize{ - Kind: IndexedAsterisk, - Size: -1, - Range: posRange{ + size := Size{ + Dynamic: s.argNum, + Index: s.index, + Range: Range{ Start: s.indexPos, End: s.nbytes, }, - Index: s.index, - ArgIndex: s.argNum, } switch kind { case Width: - s.Width = size + s.operation.Width = size case Precision: // Include the leading '.'. - size.Range.Start -= 1 - s.Prec = size + size.Range.Start -= len(".") + s.operation.Prec = size default: panic(kind) } } else { // Non-indexed asterisk: "%*d". - size := &DirectiveSize{ - Kind: Asterisk, - Size: -1, - Range: posRange{ + size := Size{ + Dynamic: s.argNum, + Range: Range{ Start: s.nbytes - 1, End: s.nbytes, }, - Index: -1, - ArgIndex: s.argNum, } switch kind { case Width: - s.Width = size + s.operation.Width = size case Precision: // For precision, include the '.' in the range. size.Range.Start -= 1 - s.Prec = size + s.operation.Prec = size default: panic(kind) } @@ -353,23 +324,20 @@ func (s *FormatDirective) parseSize(kind sizeType) { } else { // Literal number, e.g. "%10d" start := s.nbytes if num, ok := s.scanNum(); ok { - size := &DirectiveSize{ - Kind: Literal, - Size: num, - Range: posRange{ + size := Size{ + Fixed: num, + Range: Range{ Start: start, End: s.nbytes, }, - Index: -1, - ArgIndex: -1, } switch kind { case Width: - s.Width = size + s.operation.Width = size case Precision: // Include the leading '.'. size.Range.Start -= 1 - s.Prec = size + s.operation.Prec = size default: panic(kind) } @@ -380,9 +348,9 @@ func (s *FormatDirective) parseSize(kind sizeType) { // parsePrecision checks if there's a precision specified after a '.' character. // If found, it may also parse an index or an asterisk. Returns an error if any index // parsing fails. -func (s *FormatDirective) parsePrecision() error { +func (s *state) parsePrecision() error { // If there's a period, there may be a precision. - if s.nbytes < len(s.Format) && s.Format[s.nbytes] == '.' { + if s.nbytes < len(s.operation.Text) && s.operation.Text[s.nbytes] == '.' { s.nbytes++ if err := s.parseIndex(); err != nil { return err From c3359f0b28d89b98e35214d2d121476f37a59bf9 Mon Sep 17 00:00:00 2001 From: xzb <2598514867@qq.com> Date: Tue, 7 Jan 2025 21:10:15 +0800 Subject: [PATCH 11/14] width and prec revert to use pointer --- go/analysis/passes/printf/printf.go | 62 ++++++++++++++--------------- internal/fmtstr/parse.go | 57 +++++++++++++------------- 2 files changed, 60 insertions(+), 59 deletions(-) diff --git a/go/analysis/passes/printf/printf.go b/go/analysis/passes/printf/printf.go index e9651e1a293..bbc83a10585 100644 --- a/go/analysis/passes/printf/printf.go +++ b/go/analysis/passes/printf/printf.go @@ -517,7 +517,7 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string // Pass the string constant value so // fmt.Sprintf("%"+("s"), "hi", 3) can be reported as // "fmt.Sprintf call needs 1 arg but has 2 args". - directives, err := fmtstr.Parse(format, idx) + operations, err := fmtstr.Parse(format, idx) if err != nil { pass.ReportRangef(call.Args[idx], "%s %s", name, err) return @@ -526,16 +526,16 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string maxArgIndex := firstArg anyIndex := false // Check formats against args. - for _, directive := range directives { - if (directive.Prec.Index > 0) || - (directive.Width.Index > 0) || - (directive.Verb.Index > 0) { + for _, operation := range operations { + if operation.Prec != nil && operation.Prec.Index != -1 || + operation.Width != nil && operation.Width.Index != -1 || + operation.Verb.Index != -1 { anyIndex = true } - if !okPrintfArg(pass, call, &maxArgIndex, firstArg, name, directive) { // One error per format is enough. + if !okPrintfArg(pass, call, &maxArgIndex, firstArg, name, operation) { // One error per format is enough. return } - if directive.Verb.Verb == 'w' { + if operation.Verb.Verb == 'w' { switch kind { case KindNone, KindPrint, KindPrintf: pass.Reportf(call.Pos(), "%s does not support error-wrapping directive %%w", name) @@ -619,11 +619,11 @@ var printVerbs = []printVerb{ {'X', sharpNumFlag, argRune | argInt | argString | argPointer | argFloat | argComplex}, } -// okPrintfArg compares the FormatDirective to the arguments actually present, +// okPrintfArg compares the operation to the arguments actually present, // reporting any discrepancies it can discern. If the final argument is ellipsissed, // there's little it can do for that. -func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firstArg int, name string, directive *fmtstr.Operation) (ok bool) { - verb := directive.Verb.Verb +func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firstArg int, name string, operation *fmtstr.Operation) (ok bool) { + verb := operation.Verb.Verb var v printVerb found := false // Linear scan is fast enough for a small list. @@ -637,25 +637,25 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firs // Could verb's arg implement fmt.Formatter? // Skip check for the %w verb, which requires an error. formatter := false - if v.typ != argError && directive.Verb.ArgIndex < len(call.Args) { - if tv, ok := pass.TypesInfo.Types[call.Args[directive.Verb.ArgIndex]]; ok { + if v.typ != argError && operation.Verb.ArgIndex < len(call.Args) { + if tv, ok := pass.TypesInfo.Types[call.Args[operation.Verb.ArgIndex]]; ok { formatter = isFormatter(tv.Type) } } if !formatter { if !found { - pass.ReportRangef(call, "%s format %s has unknown verb %c", name, directive.Text, verb) + pass.ReportRangef(call, "%s format %s has unknown verb %c", name, operation.Text, verb) return false } - for _, flag := range directive.Flags { + for _, flag := range operation.Flags { // TODO: Disable complaint about '0' for Go 1.10. To be fixed properly in 1.11. // See issues 23598 and 23605. if flag == '0' { continue } if !strings.ContainsRune(v.flags, rune(flag)) { - pass.ReportRangef(call, "%s format %s has unrecognized flag %c", name, directive.Text, flag) + pass.ReportRangef(call, "%s format %s has unrecognized flag %c", name, operation.Text, flag) return false } } @@ -663,17 +663,17 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firs var argIndexes []int // First check for *. - if directive.Width.Dynamic > 0 { - argIndexes = append(argIndexes, directive.Width.Dynamic) + if operation.Width != nil && operation.Width.Dynamic != -1 { + argIndexes = append(argIndexes, operation.Width.Dynamic) } - if directive.Prec.Dynamic > 0 { - argIndexes = append(argIndexes, directive.Prec.Dynamic) + if operation.Prec != nil && operation.Prec.Dynamic > 0 { + argIndexes = append(argIndexes, operation.Prec.Dynamic) } // If len(argIndexes)>0, we have something like %.*s and all // indexes in argIndexes must be an integer. for i := 0; i < len(argIndexes); i++ { argIndex := argIndexes[i] - if !argCanBeChecked(pass, call, argIndex, firstArg, directive, name) { + if !argCanBeChecked(pass, call, argIndex, firstArg, operation, name) { return } arg := call.Args[argIndex] @@ -682,14 +682,14 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firs if reason != "" { details = " (" + reason + ")" } - pass.ReportRangef(call, "%s format %s uses non-int %s%s as argument of *", name, directive.Text, analysisutil.Format(pass.Fset, arg), details) + pass.ReportRangef(call, "%s format %s uses non-int %s%s as argument of *", name, operation.Text, analysisutil.Format(pass.Fset, arg), details) return false } } // Collect to update maxArgNum in one loop. - if directive.Verb.ArgIndex != -1 && verb != '%' { - argIndexes = append(argIndexes, directive.Verb.ArgIndex) + if operation.Verb.ArgIndex != -1 && verb != '%' { + argIndexes = append(argIndexes, operation.Verb.ArgIndex) } for _, index := range argIndexes { if index >= *maxArgIndex { @@ -705,13 +705,13 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firs } // Now check verb's type. - verbArgIndex := directive.Verb.ArgIndex - if !argCanBeChecked(pass, call, verbArgIndex, firstArg, directive, name) { + verbArgIndex := operation.Verb.ArgIndex + if !argCanBeChecked(pass, call, verbArgIndex, firstArg, operation, name) { return false } arg := call.Args[verbArgIndex] if isFunctionValue(pass, arg) && verb != 'p' && verb != 'T' { - pass.ReportRangef(call, "%s format %s arg %s is a func value, not called", name, directive.Text, analysisutil.Format(pass.Fset, arg)) + pass.ReportRangef(call, "%s format %s arg %s is a func value, not called", name, operation.Text, analysisutil.Format(pass.Fset, arg)) return false } if reason, ok := matchArgType(pass, v.typ, arg); !ok { @@ -723,12 +723,12 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firs if reason != "" { details = " (" + reason + ")" } - pass.ReportRangef(call, "%s format %s has arg %s of wrong type %s%s", name, directive.Text, analysisutil.Format(pass.Fset, arg), typeString, details) + pass.ReportRangef(call, "%s format %s has arg %s of wrong type %s%s", name, operation.Text, analysisutil.Format(pass.Fset, arg), typeString, details) return false } - if v.typ&argString != 0 && v.verb != 'T' && !bytes.Contains(directive.Flags, []byte{'#'}) { + if v.typ&argString != 0 && v.verb != 'T' && !bytes.Contains(operation.Flags, []byte{'#'}) { if methodName, ok := recursiveStringer(pass, arg); ok { - pass.ReportRangef(call, "%s format %s with arg %s causes recursive %s method call", name, directive.Text, analysisutil.Format(pass.Fset, arg), methodName) + pass.ReportRangef(call, "%s format %s with arg %s causes recursive %s method call", name, operation.Text, analysisutil.Format(pass.Fset, arg), methodName) return false } } @@ -812,7 +812,7 @@ func isFunctionValue(pass *analysis.Pass, e ast.Expr) bool { // argCanBeChecked reports whether the specified argument is statically present; // it may be beyond the list of arguments or in a terminal slice... argument, which // means we can't see it. -func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, argIndex, firstArg int, directive *fmtstr.Operation, name string) bool { +func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, argIndex, firstArg int, operation *fmtstr.Operation, name string) bool { if argIndex <= 0 { // Shouldn't happen, so catch it with prejudice. panic("negative argIndex") @@ -829,7 +829,7 @@ func argCanBeChecked(pass *analysis.Pass, call *ast.CallExpr, argIndex, firstArg // There are bad indexes in the format or there are fewer arguments than the format needs. // This is the argument number relative to the format: Printf("%s", "hi") will give 1 for the "hi". arg := argIndex - firstArg + 1 // People think of arguments as 1-indexed. - pass.ReportRangef(call, "%s format %s reads arg #%d, but call has %v", name, directive.Text, arg, count(len(call.Args)-firstArg, "arg")) + pass.ReportRangef(call, "%s format %s reads arg #%d, but call has %v", name, operation.Text, arg, count(len(call.Args)-firstArg, "arg")) return false } diff --git a/internal/fmtstr/parse.go b/internal/fmtstr/parse.go index 96fb7a9a4d2..76f0aa5e7a6 100644 --- a/internal/fmtstr/parse.go +++ b/internal/fmtstr/parse.go @@ -19,11 +19,12 @@ type Operation struct { Text string // Full text of the operation, e.g. "%[2]*.3d" Verb Verb // Verb specifier, guaranteed to exist, e.g., 'd' in '%[1]d' Range Range // The range of Text within the overall format string - Flags []byte // Formatting flags, e.g. "-0" - Width Size // Width specifier, e.g., '3' in '%3d' - Prec Size // Precision specifier, e.g., '.4' in '%.4f' + Flags []byte // Formatting flags, e.g. ['-', '0'] + Width *Size // Width specifier, e.g., '3' in '%3d' + Prec *Size // Precision specifier, e.g., '.4' in '%.4f' } +// Internal parsing state to operation. type state struct { operation *Operation firstArg int // Index of the first argument after the format string @@ -36,29 +37,23 @@ type state struct { } // Size describes a width or precision in a format operation. -// It may represent a literal number, a asterisk, or an indexed asterisk. -// -// Zero value of Size means non-exsistence. +// It may represent a literal number, an asterisk, or an indexed asterisk. type Size struct { - // At most one of these two fields is non-zero. - Fixed int // e.g. 4 from "%4d" - Dynamic int // index of argument providing dynamic size (e.g. %*d or %[3]*d) + // At most one of these two fields is non-negative. + Fixed int // e.g. 4 from "%4d", otherwise -1. + Dynamic int // index of argument providing dynamic size (e.g. %*d or %[3]*d), otherwise -1. - Index int // If the width or precision uses an indexed argument (e.g. 2 in %[2]d), this is the index. + Index int // If the width or precision uses an indexed argument (e.g. 2 in %[2]*d), this is the index, otherwise -1. Range Range // Position of the size specifier within the operation } -func (s Size) IsZero() bool { - return s.Fixed == 0 && s.Dynamic == 0 -} - // Verb represents the verb character of a format operation (e.g., 'd', 's', 'f'). // It also includes positional information and any explicit argument indexing. type Verb struct { Verb rune Range Range // The positional range of the verb in the format string - Index int // If the verb uses an indexed argument, this is the index, otherwise -1 - ArgIndex int // The argument index associated with this verb, relative to CallExpr, otherwise -1 + Index int // The index of an indexed argument, (e.g. 2 in %[2]d), otherwise -1. + ArgIndex int // The argument index (0-based) associated with this verb, relative to CallExpr. } // byte offsets of format string @@ -67,7 +62,7 @@ type Range struct { } // Parse takes a format string and its index in the printf-like call, -// parses out all format operations. it returns a slice of parsed +// parses out all format operations, returns a slice of parsed // [Operation] which describes flags, width, precision, verb, and argument indexing, // or an error if parsing fails. // @@ -75,10 +70,11 @@ type Range struct { // so that they may be affixed into a subject ("log.Printf "). // See https://go-review.googlesource.com/c/tools/+/632598/comment/9d980373_e6460abf/ // -// It does not perform any validation of flags, verbs, nor the -// existence of corresponding arguments. The provided format string may differ +// The flags will only be a subset of ['#', '0', '+', '-', ' ']. +// It does not perform any validation of verbs, nor the +// existence of corresponding arguments (obviously it can't). The provided format string may differ // from the one in CallExpr, such as a concatenated string or a string -// referred to by the argument in CallExpr. +// referred to by the argument in the CallExpr. func Parse(format string, idx int) ([]*Operation, error) { if !strings.Contains(format, "%") { return nil, fmt.Errorf("call has arguments but no formatting directives") @@ -119,7 +115,7 @@ func parseOperation(format string, firstArg, argNum int) (*state, error) { state := &state{ operation: &Operation{ Text: format, - Flags: make([]byte, 0, 5), + Flags: make([]byte, 0), }, firstArg: firstArg, argNum: argNum, @@ -188,11 +184,11 @@ func (s *Operation) addOffset(parsedLen int) { s.Range.Start = parsedLen s.Range.End = s.Verb.Range.End - if !s.Prec.IsZero() { + if s.Prec != nil { s.Prec.Range.Start += parsedLen s.Prec.Range.End += parsedLen } - if !s.Width.IsZero() { + if s.Width != nil { s.Width.Range.Start += parsedLen s.Width.Range.End += parsedLen } @@ -212,7 +208,7 @@ func (s *state) parseFlags() { } // parseIndex parses an argument index of the form "[n]" that can appear -// in a printf directive (e.g., "%[2]d"). Returns an error if syntax is +// in a printf operation (e.g., "%[2]d"). Returns an error if syntax is // malformed or index is invalid. func (s *state) parseIndex() error { if s.nbytes == len(s.operation.Text) || s.operation.Text[s.nbytes] != '[' { @@ -282,7 +278,8 @@ func (s *state) parseSize(kind sizeType) { if s.indexPending { // Absorb it. s.indexPending = false - size := Size{ + size := &Size{ + Fixed: -1, Dynamic: s.argNum, Index: s.index, Range: Range{ @@ -302,8 +299,10 @@ func (s *state) parseSize(kind sizeType) { } } else { // Non-indexed asterisk: "%*d". - size := Size{ + size := &Size{ Dynamic: s.argNum, + Index: -1, + Fixed: -1, Range: Range{ Start: s.nbytes - 1, End: s.nbytes, @@ -324,8 +323,10 @@ func (s *state) parseSize(kind sizeType) { } else { // Literal number, e.g. "%10d" start := s.nbytes if num, ok := s.scanNum(); ok { - size := Size{ - Fixed: num, + size := &Size{ + Fixed: num, + Index: -1, + Dynamic: -1, Range: Range{ Start: start, End: s.nbytes, From 2b99de4bd57802a7baf2e009454425d17de29cd0 Mon Sep 17 00:00:00 2001 From: xzb <2598514867@qq.com> Date: Tue, 7 Jan 2025 23:37:39 +0800 Subject: [PATCH 12/14] use -1 defualt value --- go/analysis/passes/printf/printf.go | 72 +++++++++++----------- gopls/internal/golang/codeaction.go | 6 +- gopls/internal/golang/fix.go | 2 +- gopls/internal/golang/undeclared.go | 4 +- internal/fmtstr/parse.go | 96 ++++++++++++++++------------- 5 files changed, 96 insertions(+), 84 deletions(-) diff --git a/go/analysis/passes/printf/printf.go b/go/analysis/passes/printf/printf.go index bbc83a10585..bb549ae2e54 100644 --- a/go/analysis/passes/printf/printf.go +++ b/go/analysis/passes/printf/printf.go @@ -5,7 +5,6 @@ package printf import ( - "bytes" _ "embed" "fmt" "go/ast" @@ -372,6 +371,18 @@ var isPrint = stringSet{ "(testing.TB).Skipf": true, } +// stringConstantExpr returns expression's string constant value. +// +// ("", false) is returned if expression isn't a string +// constant. +func stringConstantExpr(pass *analysis.Pass, expr ast.Expr) (string, bool) { + lit := pass.TypesInfo.Types[expr].Value + if lit != nil && lit.Kind() == constant.String { + return constant.StringVal(lit), true + } + return "", false +} + // checkCall triggers the print-specific checks if the call invokes a print function. func checkCall(pass *analysis.Pass) { inspect := pass.ResultOf[inspect.Analyzer].(*inspector.Inspector) @@ -447,10 +458,10 @@ func isFormatter(typ types.Type) bool { types.Identical(sig.Params().At(1).Type(), types.Typ[types.Rune]) } -// FormatStringIndex returns the index of the format string (the last +// formatStringIndex returns the index of the format string (the last // non-variadic parameter) within the given printf-like call // expression, or -1 if unknown. -func FormatStringIndex(info *types.Info, call *ast.CallExpr) int { +func formatStringIndex(info *types.Info, call *ast.CallExpr) int { typ := info.Types[call.Fun].Type if typ == nil { return -1 // missing type @@ -474,12 +485,12 @@ func FormatStringIndex(info *types.Info, call *ast.CallExpr) int { // checkPrintf checks a call to a formatted print routine such as Printf. func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string) { - idx := FormatStringIndex(pass.TypesInfo, call) + idx := formatStringIndex(pass.TypesInfo, call) if idx < 0 || idx >= len(call.Args) { return } formatArg := call.Args[idx] - format, ok := stringConstantExpr(pass.TypesInfo, formatArg) + format, ok := stringConstantExpr(pass, formatArg) if !ok { // Format string argument is non-constant. @@ -519,20 +530,25 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string // "fmt.Sprintf call needs 1 arg but has 2 args". operations, err := fmtstr.Parse(format, idx) if err != nil { + // All error messages are in predicate form ("call has a problem") + // so that they may be affixed into a subject ("log.Printf "). + // See https://go-review.googlesource.com/c/tools/+/632598/comment/9d980373_e6460abf/ pass.ReportRangef(call.Args[idx], "%s %s", name, err) return } - maxArgIndex := firstArg + // index of the highest used index. + maxArgIndex := firstArg - 1 anyIndex := false // Check formats against args. for _, operation := range operations { - if operation.Prec != nil && operation.Prec.Index != -1 || - operation.Width != nil && operation.Width.Index != -1 || + if operation.Prec.Index != -1 || + operation.Width.Index != -1 || operation.Verb.Index != -1 { anyIndex = true } - if !okPrintfArg(pass, call, &maxArgIndex, firstArg, name, operation) { // One error per format is enough. + if !okPrintfArg(pass, call, &maxArgIndex, firstArg, name, operation) { + // One error per format is enough. return } if operation.Verb.Verb == 'w' { @@ -544,7 +560,7 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string } } // Dotdotdot is hard. - if call.Ellipsis.IsValid() && maxArgIndex >= len(call.Args)-1 { + if call.Ellipsis.IsValid() && maxArgIndex >= len(call.Args)-2 { return } // If any formats are indexed, extra arguments are ignored. @@ -552,8 +568,8 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string return } // There should be no leftover arguments. - if maxArgIndex != len(call.Args) { - expect := maxArgIndex - firstArg + if maxArgIndex+1 < len(call.Args) { + expect := maxArgIndex + 1 - firstArg numArgs := len(call.Args) - firstArg pass.ReportRangef(call, "%s call needs %v but has %v", name, count(expect, "arg"), count(numArgs, "arg")) } @@ -620,8 +636,8 @@ var printVerbs = []printVerb{ } // okPrintfArg compares the operation to the arguments actually present, -// reporting any discrepancies it can discern. If the final argument is ellipsissed, -// there's little it can do for that. +// reporting any discrepancies it can discern, maxArgIndex was the index of the highest used index. +// If the final argument is ellipsissed, there's little it can do for that. func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firstArg int, name string, operation *fmtstr.Operation) (ok bool) { verb := operation.Verb.Verb var v printVerb @@ -663,16 +679,15 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firs var argIndexes []int // First check for *. - if operation.Width != nil && operation.Width.Dynamic != -1 { + if operation.Width.Dynamic != -1 { argIndexes = append(argIndexes, operation.Width.Dynamic) } - if operation.Prec != nil && operation.Prec.Dynamic > 0 { + if operation.Prec.Dynamic != -1 { argIndexes = append(argIndexes, operation.Prec.Dynamic) } // If len(argIndexes)>0, we have something like %.*s and all // indexes in argIndexes must be an integer. - for i := 0; i < len(argIndexes); i++ { - argIndex := argIndexes[i] + for _, argIndex := range argIndexes { if !argCanBeChecked(pass, call, argIndex, firstArg, operation, name) { return } @@ -692,9 +707,7 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firs argIndexes = append(argIndexes, operation.Verb.ArgIndex) } for _, index := range argIndexes { - if index >= *maxArgIndex { - *maxArgIndex = index + 1 - } + *maxArgIndex = max(*maxArgIndex, index) } // Special case for '%', go will print "fmt.Printf("%10.2%%dhello", 4)" @@ -726,7 +739,7 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firs pass.ReportRangef(call, "%s format %s has arg %s of wrong type %s%s", name, operation.Text, analysisutil.Format(pass.Fset, arg), typeString, details) return false } - if v.typ&argString != 0 && v.verb != 'T' && !bytes.Contains(operation.Flags, []byte{'#'}) { + if v.typ&argString != 0 && v.verb != 'T' && !strings.Contains(operation.Flags, "#") { if methodName, ok := recursiveStringer(pass, arg); ok { pass.ReportRangef(call, "%s format %s with arg %s causes recursive %s method call", name, operation.Text, analysisutil.Format(pass.Fset, arg), methodName) return false @@ -887,7 +900,7 @@ func checkPrint(pass *analysis.Pass, call *ast.CallExpr, name string) { } arg := args[0] - if s, ok := stringConstantExpr(pass.TypesInfo, arg); ok { + if s, ok := stringConstantExpr(pass, arg); ok { // Ignore trailing % character // The % in "abc 0.0%" couldn't be a formatting directive. s = strings.TrimSuffix(s, "%") @@ -901,7 +914,7 @@ func checkPrint(pass *analysis.Pass, call *ast.CallExpr, name string) { if strings.HasSuffix(name, "ln") { // The last item, if a string, should not have a newline. arg = args[len(args)-1] - if s, ok := stringConstantExpr(pass.TypesInfo, arg); ok { + if s, ok := stringConstantExpr(pass, arg); ok { if strings.HasSuffix(s, "\n") { pass.ReportRangef(call, "%s arg list ends with redundant newline", name) } @@ -917,17 +930,6 @@ func checkPrint(pass *analysis.Pass, call *ast.CallExpr, name string) { } } -// StringConstantExpr returns expression's string constant value. -// -// ("", false) is returned if expression isn't a string constant. -func stringConstantExpr(info *types.Info, expr ast.Expr) (string, bool) { - lit := info.Types[expr].Value - if lit != nil && lit.Kind() == constant.String { - return constant.StringVal(lit), true - } - return "", false -} - // count(n, what) returns "1 what" or "N whats" // (assuming the plural of what is whats). func count(n int, what string) string { diff --git a/gopls/internal/golang/codeaction.go b/gopls/internal/golang/codeaction.go index 9a7bee7f817..627ba1a60d6 100644 --- a/gopls/internal/golang/codeaction.go +++ b/gopls/internal/golang/codeaction.go @@ -335,9 +335,9 @@ func quickFix(ctx context.Context, req *codeActionsRequest) error { req.addApplyFixAction(msg, fixMissingCalledFunction, req.loc) } - // "undeclared name: X" or "undefined: X" compiler error. - // Offer a "Create variable/function X" code action. - // See [createUndeclared] for command implementation. + // "undeclared name: x" or "undefined: x" compiler error. + // Offer a "Create variable/function x" code action. + // See [fixUndeclared] for command implementation. case strings.HasPrefix(msg, "undeclared name: "), strings.HasPrefix(msg, "undefined: "): path, _ := astutil.PathEnclosingInterval(req.pgf.File, start, end) diff --git a/gopls/internal/golang/fix.go b/gopls/internal/golang/fix.go index e812c677541..7e83c1d6700 100644 --- a/gopls/internal/golang/fix.go +++ b/gopls/internal/golang/fix.go @@ -112,7 +112,7 @@ func ApplyFix(ctx context.Context, fix string, snapshot *cache.Snapshot, fh file fixInvertIfCondition: singleFile(invertIfCondition), fixSplitLines: singleFile(splitLines), fixJoinLines: singleFile(joinLines), - fixCreateUndeclared: singleFile(createUndeclared), + fixCreateUndeclared: singleFile(CreateUndeclared), fixMissingInterfaceMethods: stubMissingInterfaceMethodsFixer, fixMissingCalledFunction: stubMissingCalledFunctionFixer, } diff --git a/gopls/internal/golang/undeclared.go b/gopls/internal/golang/undeclared.go index 0615386e9bf..35a5c7a1e57 100644 --- a/gopls/internal/golang/undeclared.go +++ b/gopls/internal/golang/undeclared.go @@ -68,8 +68,8 @@ func undeclaredFixTitle(path []ast.Node, errMsg string) string { return fmt.Sprintf("Create %s %s", noun, name) } -// createUndeclared generates a suggested declaration for an undeclared variable or function. -func createUndeclared(fset *token.FileSet, start, end token.Pos, content []byte, file *ast.File, pkg *types.Package, info *types.Info) (*token.FileSet, *analysis.SuggestedFix, error) { +// CreateUndeclared generates a suggested declaration for an undeclared variable or function. +func CreateUndeclared(fset *token.FileSet, start, end token.Pos, content []byte, file *ast.File, pkg *types.Package, info *types.Info) (*token.FileSet, *analysis.SuggestedFix, error) { pos := start // don't use the end path, _ := astutil.PathEnclosingInterval(file, pos, pos) if len(path) < 2 { diff --git a/internal/fmtstr/parse.go b/internal/fmtstr/parse.go index 76f0aa5e7a6..db671f2f95c 100644 --- a/internal/fmtstr/parse.go +++ b/internal/fmtstr/parse.go @@ -16,44 +16,32 @@ import ( // Operation holds the parsed representation of a printf operation such as "%3.*[4]d". // It is constructed by [Parse]. type Operation struct { - Text string // Full text of the operation, e.g. "%[2]*.3d" - Verb Verb // Verb specifier, guaranteed to exist, e.g., 'd' in '%[1]d' - Range Range // The range of Text within the overall format string - Flags []byte // Formatting flags, e.g. ['-', '0'] - Width *Size // Width specifier, e.g., '3' in '%3d' - Prec *Size // Precision specifier, e.g., '.4' in '%.4f' + Text string // full text of the operation, e.g. "%[2]*.3d" + Verb Verb // verb specifier, guaranteed to exist, e.g., 'd' in '%[1]d' + Range Range // the range of Text within the overall format string + Flags string // formatting flags, e.g. "-0" + Width Size // width specifier, e.g., '3' in '%3d' + Prec Size // precision specifier, e.g., '.4' in '%.4f' } -// Internal parsing state to operation. -type state struct { - operation *Operation - firstArg int // Index of the first argument after the format string - argNum int // Which argument we're expecting to format now. - hasIndex bool // Whether the argument is indexed. - index int // The encountered index - indexPos int // The encountered index's offset - indexPending bool // Whether we have an indexed argument that has not resolved. - nbytes int // number of bytes of the format string consumed. -} - -// Size describes a width or precision in a format operation. -// It may represent a literal number, an asterisk, or an indexed asterisk. +// Size describes an optional width or precision in a format operation. +// It may represent no value, a literal number, an asterisk, or an indexed asterisk. type Size struct { // At most one of these two fields is non-negative. - Fixed int // e.g. 4 from "%4d", otherwise -1. - Dynamic int // index of argument providing dynamic size (e.g. %*d or %[3]*d), otherwise -1. + Fixed int // e.g. 4 from "%4d", otherwise -1 + Dynamic int // index of argument providing dynamic size (e.g. %*d or %[3]*d), otherwise -1 - Index int // If the width or precision uses an indexed argument (e.g. 2 in %[2]*d), this is the index, otherwise -1. - Range Range // Position of the size specifier within the operation + Index int // If the width or precision uses an indexed argument (e.g. 2 in %[2]*d), this is the index, otherwise -1 + Range Range // position of the size specifier within the operation } // Verb represents the verb character of a format operation (e.g., 'd', 's', 'f'). // It also includes positional information and any explicit argument indexing. type Verb struct { Verb rune - Range Range // The positional range of the verb in the format string - Index int // The index of an indexed argument, (e.g. 2 in %[2]d), otherwise -1. - ArgIndex int // The argument index (0-based) associated with this verb, relative to CallExpr. + Range Range // positional range of the verb in the format string + Index int // index of an indexed argument, (e.g. 2 in %[2]d), otherwise -1 + ArgIndex int // argument index (0-based) associated with this verb, relative to CallExpr } // byte offsets of format string @@ -105,6 +93,18 @@ func Parse(format string, idx int) ([]*Operation, error) { return operations, nil } +// Internal parsing state to operation. +type state struct { + operation *Operation + firstArg int // index of the first argument after the format string + argNum int // which argument we're expecting to format now + hasIndex bool // whether the argument is indexed + index int // the encountered index + indexPos int // the encountered index's offset + indexPending bool // whether we have an indexed argument that has not resolved + nbytes int // number of bytes of the format string consumed +} + // parseOperation parses one format operation starting at the given substring `format`, // which should begin with '%'. It returns a fully populated state or an error // if the operation is malformed. The firstArg and argNum parameters help determine how @@ -114,8 +114,17 @@ func Parse(format string, idx int) ([]*Operation, error) { func parseOperation(format string, firstArg, argNum int) (*state, error) { state := &state{ operation: &Operation{ - Text: format, - Flags: make([]byte, 0), + Text: format, + Width: Size{ + Fixed: -1, + Dynamic: -1, + Index: -1, + }, + Prec: Size{ + Fixed: -1, + Dynamic: -1, + Index: -1, + }, }, firstArg: firstArg, argNum: argNum, @@ -184,11 +193,13 @@ func (s *Operation) addOffset(parsedLen int) { s.Range.Start = parsedLen s.Range.End = s.Verb.Range.End - if s.Prec != nil { + + // one of Fixed or Dynamic is non-negative means existence. + if s.Prec.Fixed == -1 && s.Prec.Dynamic == -1 { s.Prec.Range.Start += parsedLen s.Prec.Range.End += parsedLen } - if s.Width != nil { + if s.Width.Fixed == -1 && s.Width.Dynamic == -1 { s.Width.Range.Start += parsedLen s.Width.Range.End += parsedLen } @@ -196,15 +207,14 @@ func (s *Operation) addOffset(parsedLen int) { // parseFlags accepts any printf flags. func (s *state) parseFlags() { - for s.nbytes < len(s.operation.Text) { - switch c := s.operation.Text[s.nbytes]; c { - case '#', '0', '+', '-', ' ': - s.operation.Flags = append(s.operation.Flags, c) - s.nbytes++ - default: - return - } - } + s.operation.Flags = prefixOf(s.operation.Text[s.nbytes:], "#0+- ") + s.nbytes += len(s.operation.Flags) +} + +// prefixOf returns the prefix of s composed only of runes from the specified set. +func prefixOf(s, set string) string { + rest := strings.TrimLeft(s, set) + return s[:len(s)-len(rest)] } // parseIndex parses an argument index of the form "[n]" that can appear @@ -278,7 +288,7 @@ func (s *state) parseSize(kind sizeType) { if s.indexPending { // Absorb it. s.indexPending = false - size := &Size{ + size := Size{ Fixed: -1, Dynamic: s.argNum, Index: s.index, @@ -299,7 +309,7 @@ func (s *state) parseSize(kind sizeType) { } } else { // Non-indexed asterisk: "%*d". - size := &Size{ + size := Size{ Dynamic: s.argNum, Index: -1, Fixed: -1, @@ -323,7 +333,7 @@ func (s *state) parseSize(kind sizeType) { } else { // Literal number, e.g. "%10d" start := s.nbytes if num, ok := s.scanNum(); ok { - size := &Size{ + size := Size{ Fixed: num, Index: -1, Dynamic: -1, From cab5b9391c239d3ca8bda7e7f59277c98a9c7431 Mon Sep 17 00:00:00 2001 From: xzb <2598514867@qq.com> Date: Wed, 8 Jan 2025 02:45:09 +0800 Subject: [PATCH 13/14] Add main.go --- go/analysis/passes/printf/printf.go | 52 ++++++++-------- internal/fmtstr/main.go | 94 +++++++++++++++++++++++++++++ 2 files changed, 120 insertions(+), 26 deletions(-) create mode 100644 internal/fmtstr/main.go diff --git a/go/analysis/passes/printf/printf.go b/go/analysis/passes/printf/printf.go index bb549ae2e54..836b18d363d 100644 --- a/go/analysis/passes/printf/printf.go +++ b/go/analysis/passes/printf/printf.go @@ -371,6 +371,31 @@ var isPrint = stringSet{ "(testing.TB).Skipf": true, } +// formatStringIndex returns the index of the format string (the last +// non-variadic parameter) within the given printf-like call +// expression, or -1 if unknown. +func formatStringIndex(pass *analysis.Pass, call *ast.CallExpr) int { + typ := pass.TypesInfo.Types[call.Fun].Type + if typ == nil { + return -1 // missing type + } + sig, ok := typ.(*types.Signature) + if !ok { + return -1 // ill-typed + } + if !sig.Variadic() { + // Skip checking non-variadic functions. + return -1 + } + idx := sig.Params().Len() - 2 + if idx < 0 { + // Skip checking variadic functions without + // fixed arguments. + return -1 + } + return idx +} + // stringConstantExpr returns expression's string constant value. // // ("", false) is returned if expression isn't a string @@ -458,34 +483,9 @@ func isFormatter(typ types.Type) bool { types.Identical(sig.Params().At(1).Type(), types.Typ[types.Rune]) } -// formatStringIndex returns the index of the format string (the last -// non-variadic parameter) within the given printf-like call -// expression, or -1 if unknown. -func formatStringIndex(info *types.Info, call *ast.CallExpr) int { - typ := info.Types[call.Fun].Type - if typ == nil { - return -1 // missing type - } - sig, ok := typ.(*types.Signature) - if !ok { - return -1 // ill-typed - } - if !sig.Variadic() { - // Skip checking non-variadic functions. - return -1 - } - idx := sig.Params().Len() - 2 - if idx < 0 { - // Skip checking variadic functions without - // fixed arguments. - return -1 - } - return idx -} - // checkPrintf checks a call to a formatted print routine such as Printf. func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string) { - idx := formatStringIndex(pass.TypesInfo, call) + idx := formatStringIndex(pass, call) if idx < 0 || idx >= len(call.Args) { return } diff --git a/internal/fmtstr/main.go b/internal/fmtstr/main.go new file mode 100644 index 00000000000..7fcbfdbbf2c --- /dev/null +++ b/internal/fmtstr/main.go @@ -0,0 +1,94 @@ +// Copyright 2024 The Go Authors. All rights reserved. +// Use of this source code is governed by a BSD-style +// license that can be found in the LICENSE file. + +//go:build ignore + +// The fmtstr command parses the format strings of calls to selected +// printf-like functions in the specified source file, and prints the +// formatting operations and their operands. +// +// It is intended only for debugging and is not a supported interface. +package main + +import ( + "flag" + "fmt" + "go/ast" + "go/parser" + "go/printer" + "go/token" + "log" + "strconv" + "strings" + + "golang.org/x/tools/internal/fmtstr" +) + +func main() { + log.SetPrefix("fmtstr: ") + log.SetFlags(0) + flag.Parse() + + fset := token.NewFileSet() + f, err := parser.ParseFile(fset, flag.Args()[0], nil, 0) + if err != nil { + log.Fatal(err) + } + + functions := map[string]int{ + "fmt.Errorf": 0, + "fmt.Fprintf": 1, + "fmt.Printf": 0, + "fmt.Sprintf": 0, + "log.Printf": 0, + } + + ast.Inspect(f, func(n ast.Node) bool { + if call, ok := n.(*ast.CallExpr); ok && !call.Ellipsis.IsValid() { + if sel, ok := call.Fun.(*ast.SelectorExpr); ok && is[*ast.Ident](sel.X) { + name := sel.X.(*ast.Ident).Name + "." + sel.Sel.Name // e.g. "fmt.Printf" + if fmtstrIndex, ok := functions[name]; ok && + len(call.Args) > fmtstrIndex { + // Is it a string literal? + if fmtstrArg, ok := call.Args[fmtstrIndex].(*ast.BasicLit); ok && + fmtstrArg.Kind == token.STRING { + // Have fmt.Printf("format", ...) + format, _ := strconv.Unquote(fmtstrArg.Value) + + ops, err := fmtstr.Parse(format, 0) + if err != nil { + log.Printf("%s: %v", fset.Position(fmtstrArg.Pos()), err) + return true + } + + fmt.Printf("%s: %s(%s, ...)\n", + fset.Position(fmtstrArg.Pos()), + name, + fmtstrArg.Value) + for _, op := range ops { + // TODO(adonovan): show more detail. + fmt.Printf("\t%q\t%v\n", + op.Text, + formatNode(fset, call.Args[op.Verb.ArgIndex])) + } + } + } + } + } + return true + }) +} + +func is[T any](x any) bool { + _, ok := x.(T) + return ok +} + +func formatNode(fset *token.FileSet, n ast.Node) string { + var buf strings.Builder + if err := printer.Fprint(&buf, fset, n); err != nil { + return "" + } + return buf.String() +} From 8e576345020d79d5c5534f8e66c3eee5f7bb2edd Mon Sep 17 00:00:00 2001 From: xzb <2598514867@qq.com> Date: Wed, 8 Jan 2025 03:11:10 +0800 Subject: [PATCH 14/14] rebase --- go/analysis/passes/printf/printf.go | 15 +++++++-------- internal/fmtstr/parse.go | 6 ++---- 2 files changed, 9 insertions(+), 12 deletions(-) diff --git a/go/analysis/passes/printf/printf.go b/go/analysis/passes/printf/printf.go index 836b18d363d..b95e2fd6f1a 100644 --- a/go/analysis/passes/printf/printf.go +++ b/go/analysis/passes/printf/printf.go @@ -532,7 +532,6 @@ func checkPrintf(pass *analysis.Pass, kind Kind, call *ast.CallExpr, name string if err != nil { // All error messages are in predicate form ("call has a problem") // so that they may be affixed into a subject ("log.Printf "). - // See https://go-review.googlesource.com/c/tools/+/632598/comment/9d980373_e6460abf/ pass.ReportRangef(call.Args[idx], "%s %s", name, err) return } @@ -697,7 +696,7 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firs if reason != "" { details = " (" + reason + ")" } - pass.ReportRangef(call, "%s format %s uses non-int %s%s as argument of *", name, operation.Text, analysisutil.Format(pass.Fset, arg), details) + pass.ReportRangef(call, "%s format %s uses non-int %s%s as argument of *", name, operation.Text, analysisinternal.Format(pass.Fset, arg), details) return false } } @@ -724,7 +723,7 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firs } arg := call.Args[verbArgIndex] if isFunctionValue(pass, arg) && verb != 'p' && verb != 'T' { - pass.ReportRangef(call, "%s format %s arg %s is a func value, not called", name, operation.Text, analysisutil.Format(pass.Fset, arg)) + pass.ReportRangef(call, "%s format %s arg %s is a func value, not called", name, operation.Text, analysisinternal.Format(pass.Fset, arg)) return false } if reason, ok := matchArgType(pass, v.typ, arg); !ok { @@ -736,12 +735,12 @@ func okPrintfArg(pass *analysis.Pass, call *ast.CallExpr, maxArgIndex *int, firs if reason != "" { details = " (" + reason + ")" } - pass.ReportRangef(call, "%s format %s has arg %s of wrong type %s%s", name, operation.Text, analysisutil.Format(pass.Fset, arg), typeString, details) + pass.ReportRangef(call, "%s format %s has arg %s of wrong type %s%s", name, operation.Text, analysisinternal.Format(pass.Fset, arg), typeString, details) return false } if v.typ&argString != 0 && v.verb != 'T' && !strings.Contains(operation.Flags, "#") { if methodName, ok := recursiveStringer(pass, arg); ok { - pass.ReportRangef(call, "%s format %s with arg %s causes recursive %s method call", name, operation.Text, analysisutil.Format(pass.Fset, arg), methodName) + pass.ReportRangef(call, "%s format %s with arg %s causes recursive %s method call", name, operation.Text, analysisinternal.Format(pass.Fset, arg), methodName) return false } } @@ -893,7 +892,7 @@ func checkPrint(pass *analysis.Pass, call *ast.CallExpr, name string) { if sel, ok := call.Args[0].(*ast.SelectorExpr); ok { if x, ok := sel.X.(*ast.Ident); ok { if x.Name == "os" && strings.HasPrefix(sel.Sel.Name, "Std") { - pass.ReportRangef(call, "%s does not take io.Writer but has first arg %s", name, analysisutil.Format(pass.Fset, call.Args[0])) + pass.ReportRangef(call, "%s does not take io.Writer but has first arg %s", name, analysisinternal.Format(pass.Fset, call.Args[0])) } } } @@ -922,10 +921,10 @@ func checkPrint(pass *analysis.Pass, call *ast.CallExpr, name string) { } for _, arg := range args { if isFunctionValue(pass, arg) { - pass.ReportRangef(call, "%s arg %s is a func value, not called", name, analysisutil.Format(pass.Fset, arg)) + pass.ReportRangef(call, "%s arg %s is a func value, not called", name, analysisinternal.Format(pass.Fset, arg)) } if methodName, ok := recursiveStringer(pass, arg); ok { - pass.ReportRangef(call, "%s arg %s causes recursive call to %s method", name, analysisutil.Format(pass.Fset, arg), methodName) + pass.ReportRangef(call, "%s arg %s causes recursive call to %s method", name, analysisinternal.Format(pass.Fset, arg), methodName) } } } diff --git a/internal/fmtstr/parse.go b/internal/fmtstr/parse.go index db671f2f95c..9ab264f45d6 100644 --- a/internal/fmtstr/parse.go +++ b/internal/fmtstr/parse.go @@ -3,7 +3,6 @@ // license that can be found in the LICENSE file. // Package fmtstr defines a parser for format strings as used by [fmt.Printf]. - package fmtstr import ( @@ -56,7 +55,6 @@ type Range struct { // // All error messages are in predicate form ("call has a problem") // so that they may be affixed into a subject ("log.Printf "). -// See https://go-review.googlesource.com/c/tools/+/632598/comment/9d980373_e6460abf/ // // The flags will only be a subset of ['#', '0', '+', '-', ' ']. // It does not perform any validation of verbs, nor the @@ -195,11 +193,11 @@ func (s *Operation) addOffset(parsedLen int) { s.Range.End = s.Verb.Range.End // one of Fixed or Dynamic is non-negative means existence. - if s.Prec.Fixed == -1 && s.Prec.Dynamic == -1 { + if s.Prec.Fixed != -1 || s.Prec.Dynamic != -1 { s.Prec.Range.Start += parsedLen s.Prec.Range.End += parsedLen } - if s.Width.Fixed == -1 && s.Width.Dynamic == -1 { + if s.Width.Fixed != -1 || s.Width.Dynamic != -1 { s.Width.Range.Start += parsedLen s.Width.Range.End += parsedLen }