Skip to content

Commit 52b319b

Browse files
authored
Refactor pprof labels and process desc (#32909)
* Deprecate "gopid" in log, it is not useful and requires very hacky approach * Remove "git.Command.SetDescription" because it is not useful and only makes the logs too flexible
1 parent c66de24 commit 52b319b

31 files changed

+182
-247
lines changed

modules/git/batch_reader.go

-18
Original file line numberDiff line numberDiff line change
@@ -7,10 +7,8 @@ import (
77
"bufio"
88
"bytes"
99
"context"
10-
"fmt"
1110
"io"
1211
"math"
13-
"runtime"
1412
"strconv"
1513
"strings"
1614

@@ -32,7 +30,6 @@ type WriteCloserError interface {
3230
func ensureValidGitRepository(ctx context.Context, repoPath string) error {
3331
stderr := strings.Builder{}
3432
err := NewCommand(ctx, "rev-parse").
35-
SetDescription(fmt.Sprintf("%s rev-parse [repo_path: %s]", GitExecutable, repoPath)).
3633
Run(&RunOpts{
3734
Dir: repoPath,
3835
Stderr: &stderr,
@@ -62,13 +59,9 @@ func catFileBatchCheck(ctx context.Context, repoPath string) (WriteCloserError,
6259
cancel()
6360
}()
6461

65-
_, filename, line, _ := runtime.Caller(2)
66-
filename = strings.TrimPrefix(filename, callerPrefix)
67-
6862
go func() {
6963
stderr := strings.Builder{}
7064
err := NewCommand(ctx, "cat-file", "--batch-check").
71-
SetDescription(fmt.Sprintf("%s cat-file --batch-check [repo_path: %s] (%s:%d)", GitExecutable, repoPath, filename, line)).
7265
Run(&RunOpts{
7366
Dir: repoPath,
7467
Stdin: batchStdinReader,
@@ -114,13 +107,9 @@ func catFileBatch(ctx context.Context, repoPath string) (WriteCloserError, *bufi
114107
cancel()
115108
}()
116109

117-
_, filename, line, _ := runtime.Caller(2)
118-
filename = strings.TrimPrefix(filename, callerPrefix)
119-
120110
go func() {
121111
stderr := strings.Builder{}
122112
err := NewCommand(ctx, "cat-file", "--batch").
123-
SetDescription(fmt.Sprintf("%s cat-file --batch [repo_path: %s] (%s:%d)", GitExecutable, repoPath, filename, line)).
124113
Run(&RunOpts{
125114
Dir: repoPath,
126115
Stdin: batchStdinReader,
@@ -320,13 +309,6 @@ func ParseTreeLine(objectFormat ObjectFormat, rd *bufio.Reader, modeBuf, fnameBu
320309
return mode, fname, sha, n, err
321310
}
322311

323-
var callerPrefix string
324-
325-
func init() {
326-
_, filename, _, _ := runtime.Caller(0)
327-
callerPrefix = strings.TrimSuffix(filename, "modules/git/batch_reader.go")
328-
}
329-
330312
func DiscardFull(rd *bufio.Reader, discard int64) error {
331313
if discard > math.MaxInt32 {
332314
n, err := rd.Discard(math.MaxInt32)

modules/git/blame.go

+1-4
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,6 @@ import (
77
"bufio"
88
"bytes"
99
"context"
10-
"fmt"
1110
"io"
1211
"os"
1312

@@ -142,9 +141,7 @@ func CreateBlameReader(ctx context.Context, objectFormat ObjectFormat, repoPath
142141
// There is no equivalent on Windows. May be implemented if Gitea uses an external git backend.
143142
cmd.AddOptionValues("--ignore-revs-file", *ignoreRevsFile)
144143
}
145-
cmd.AddDynamicArguments(commit.ID.String()).
146-
AddDashesAndList(file).
147-
SetDescription(fmt.Sprintf("GetBlame [repo_path: %s]", repoPath))
144+
cmd.AddDynamicArguments(commit.ID.String()).AddDashesAndList(file)
148145
reader, stdout, err := os.Pipe()
149146
if err != nil {
150147
if ignoreRevsFile != nil {

modules/git/command.go

+35-33
Original file line numberDiff line numberDiff line change
@@ -12,6 +12,7 @@ import (
1212
"io"
1313
"os"
1414
"os/exec"
15+
"path/filepath"
1516
"runtime"
1617
"strings"
1718
"time"
@@ -43,18 +44,24 @@ type Command struct {
4344
prog string
4445
args []string
4546
parentContext context.Context
46-
desc string
4747
globalArgsLength int
4848
brokenArgs []string
4949
}
5050

51-
func (c *Command) String() string {
52-
return c.toString(false)
51+
func logArgSanitize(arg string) string {
52+
if strings.Contains(arg, "://") && strings.Contains(arg, "@") {
53+
return util.SanitizeCredentialURLs(arg)
54+
} else if filepath.IsAbs(arg) {
55+
base := filepath.Base(arg)
56+
dir := filepath.Dir(arg)
57+
return filepath.Join(filepath.Base(dir), base)
58+
}
59+
return arg
5360
}
5461

55-
func (c *Command) toString(sanitizing bool) string {
62+
func (c *Command) LogString() string {
5663
// WARNING: this function is for debugging purposes only. It's much better than old code (which only joins args with space),
57-
// It's impossible to make a simple and 100% correct implementation of argument quoting for different platforms.
64+
// It's impossible to make a simple and 100% correct implementation of argument quoting for different platforms here.
5865
debugQuote := func(s string) string {
5966
if strings.ContainsAny(s, " `'\"\t\r\n") {
6067
return fmt.Sprintf("%q", s)
@@ -63,12 +70,11 @@ func (c *Command) toString(sanitizing bool) string {
6370
}
6471
a := make([]string, 0, len(c.args)+1)
6572
a = append(a, debugQuote(c.prog))
66-
for _, arg := range c.args {
67-
if sanitizing && (strings.Contains(arg, "://") && strings.Contains(arg, "@")) {
68-
a = append(a, debugQuote(util.SanitizeCredentialURLs(arg)))
69-
} else {
70-
a = append(a, debugQuote(arg))
71-
}
73+
if c.globalArgsLength > 0 {
74+
a = append(a, "...global...")
75+
}
76+
for i := c.globalArgsLength; i < len(c.args); i++ {
77+
a = append(a, debugQuote(logArgSanitize(c.args[i])))
7278
}
7379
return strings.Join(a, " ")
7480
}
@@ -112,12 +118,6 @@ func (c *Command) SetParentContext(ctx context.Context) *Command {
112118
return c
113119
}
114120

115-
// SetDescription sets the description for this command which be returned on c.String()
116-
func (c *Command) SetDescription(desc string) *Command {
117-
c.desc = desc
118-
return c
119-
}
120-
121121
// isSafeArgumentValue checks if the argument is safe to be used as a value (not an option)
122122
func isSafeArgumentValue(s string) bool {
123123
return s == "" || s[0] != '-'
@@ -271,8 +271,12 @@ var ErrBrokenCommand = errors.New("git command is broken")
271271

272272
// Run runs the command with the RunOpts
273273
func (c *Command) Run(opts *RunOpts) error {
274+
return c.run(1, opts)
275+
}
276+
277+
func (c *Command) run(skip int, opts *RunOpts) error {
274278
if len(c.brokenArgs) != 0 {
275-
log.Error("git command is broken: %s, broken args: %s", c.String(), strings.Join(c.brokenArgs, " "))
279+
log.Error("git command is broken: %s, broken args: %s", c.LogString(), strings.Join(c.brokenArgs, " "))
276280
return ErrBrokenCommand
277281
}
278282
if opts == nil {
@@ -285,20 +289,14 @@ func (c *Command) Run(opts *RunOpts) error {
285289
timeout = defaultCommandExecutionTimeout
286290
}
287291

288-
if len(opts.Dir) == 0 {
289-
log.Debug("git.Command.Run: %s", c)
290-
} else {
291-
log.Debug("git.Command.RunDir(%s): %s", opts.Dir, c)
292-
}
293-
294-
desc := c.desc
295-
if desc == "" {
296-
if opts.Dir == "" {
297-
desc = fmt.Sprintf("git: %s", c.toString(true))
298-
} else {
299-
desc = fmt.Sprintf("git(dir:%s): %s", opts.Dir, c.toString(true))
300-
}
292+
var desc string
293+
callerInfo := util.CallerFuncName(1 /* util */ + 1 /* this */ + skip /* parent */)
294+
if pos := strings.LastIndex(callerInfo, "/"); pos >= 0 {
295+
callerInfo = callerInfo[pos+1:]
301296
}
297+
// these logs are for debugging purposes only, so no guarantee of correctness or stability
298+
desc = fmt.Sprintf("git.Run(by:%s, repo:%s): %s", callerInfo, logArgSanitize(opts.Dir), c.LogString())
299+
log.Debug("git.Command: %s", desc)
302300

303301
var ctx context.Context
304302
var cancel context.CancelFunc
@@ -401,7 +399,7 @@ func IsErrorExitCode(err error, code int) bool {
401399

402400
// RunStdString runs the command with options and returns stdout/stderr as string. and store stderr to returned error (err combined with stderr).
403401
func (c *Command) RunStdString(opts *RunOpts) (stdout, stderr string, runErr RunStdError) {
404-
stdoutBytes, stderrBytes, err := c.RunStdBytes(opts)
402+
stdoutBytes, stderrBytes, err := c.runStdBytes(opts)
405403
stdout = util.UnsafeBytesToString(stdoutBytes)
406404
stderr = util.UnsafeBytesToString(stderrBytes)
407405
if err != nil {
@@ -413,6 +411,10 @@ func (c *Command) RunStdString(opts *RunOpts) (stdout, stderr string, runErr Run
413411

414412
// RunStdBytes runs the command with options and returns stdout/stderr as bytes. and store stderr to returned error (err combined with stderr).
415413
func (c *Command) RunStdBytes(opts *RunOpts) (stdout, stderr []byte, runErr RunStdError) {
414+
return c.runStdBytes(opts)
415+
}
416+
417+
func (c *Command) runStdBytes(opts *RunOpts) (stdout, stderr []byte, runErr RunStdError) {
416418
if opts == nil {
417419
opts = &RunOpts{}
418420
}
@@ -435,7 +437,7 @@ func (c *Command) RunStdBytes(opts *RunOpts) (stdout, stderr []byte, runErr RunS
435437
PipelineFunc: opts.PipelineFunc,
436438
}
437439

438-
err := c.Run(newOpts)
440+
err := c.run(2, newOpts)
439441
stderr = stderrBuf.Bytes()
440442
if err != nil {
441443
return nil, stderr, &runStdError{err: err, stderr: util.UnsafeBytesToString(stderr)}

modules/git/command_test.go

+3-3
Original file line numberDiff line numberDiff line change
@@ -55,8 +55,8 @@ func TestGitArgument(t *testing.T) {
5555

5656
func TestCommandString(t *testing.T) {
5757
cmd := NewCommandContextNoGlobals(context.Background(), "a", "-m msg", "it's a test", `say "hello"`)
58-
assert.EqualValues(t, cmd.prog+` a "-m msg" "it's a test" "say \"hello\""`, cmd.String())
58+
assert.EqualValues(t, cmd.prog+` a "-m msg" "it's a test" "say \"hello\""`, cmd.LogString())
5959

60-
cmd = NewCommandContextNoGlobals(context.Background(), "url: https://a:b@c/")
61-
assert.EqualValues(t, cmd.prog+` "url: https://sanitized-credential@c/"`, cmd.toString(true))
60+
cmd = NewCommandContextNoGlobals(context.Background(), "url: https://a:b@c/", "/root/dir-a/dir-b")
61+
assert.EqualValues(t, cmd.prog+` "url: https://sanitized-credential@c/" dir-a/dir-b`, cmd.LogString())
6262
}

modules/git/repo.go

-13
Original file line numberDiff line numberDiff line change
@@ -18,7 +18,6 @@ import (
1818
"time"
1919

2020
"code.gitea.io/gitea/modules/proxy"
21-
"code.gitea.io/gitea/modules/util"
2221
)
2322

2423
// GPGSettings represents the default GPG settings for this repository
@@ -160,12 +159,6 @@ func CloneWithArgs(ctx context.Context, args TrustedCmdArgs, from, to string, op
160159
}
161160
cmd.AddDashesAndList(from, to)
162161

163-
if strings.Contains(from, "://") && strings.Contains(from, "@") {
164-
cmd.SetDescription(fmt.Sprintf("clone branch %s from %s to %s (shared: %t, mirror: %t, depth: %d)", opts.Branch, util.SanitizeCredentialURLs(from), to, opts.Shared, opts.Mirror, opts.Depth))
165-
} else {
166-
cmd.SetDescription(fmt.Sprintf("clone branch %s from %s to %s (shared: %t, mirror: %t, depth: %d)", opts.Branch, from, to, opts.Shared, opts.Mirror, opts.Depth))
167-
}
168-
169162
if opts.Timeout <= 0 {
170163
opts.Timeout = -1
171164
}
@@ -213,12 +206,6 @@ func Push(ctx context.Context, repoPath string, opts PushOptions) error {
213206
}
214207
cmd.AddDashesAndList(remoteBranchArgs...)
215208

216-
if strings.Contains(opts.Remote, "://") && strings.Contains(opts.Remote, "@") {
217-
cmd.SetDescription(fmt.Sprintf("push branch %s to %s (force: %t, mirror: %t)", opts.Branch, util.SanitizeCredentialURLs(opts.Remote), opts.Force, opts.Mirror))
218-
} else {
219-
cmd.SetDescription(fmt.Sprintf("push branch %s to %s (force: %t, mirror: %t)", opts.Branch, opts.Remote, opts.Force, opts.Mirror))
220-
}
221-
222209
stdout, stderr, err := cmd.RunStdString(&RunOpts{Env: opts.Env, Timeout: opts.Timeout, Dir: repoPath})
223210
if err != nil {
224211
if strings.Contains(stderr, "non-fast-forward") {

modules/graceful/manager.go

+4-3
Original file line numberDiff line numberDiff line change
@@ -9,6 +9,7 @@ import (
99
"sync"
1010
"time"
1111

12+
"code.gitea.io/gitea/modules/gtprof"
1213
"code.gitea.io/gitea/modules/log"
1314
"code.gitea.io/gitea/modules/process"
1415
"code.gitea.io/gitea/modules/setting"
@@ -136,7 +137,7 @@ func (g *Manager) doShutdown() {
136137
}
137138
g.lock.Lock()
138139
g.shutdownCtxCancel()
139-
atShutdownCtx := pprof.WithLabels(g.hammerCtx, pprof.Labels(LifecyclePProfLabel, "post-shutdown"))
140+
atShutdownCtx := pprof.WithLabels(g.hammerCtx, pprof.Labels(gtprof.LabelGracefulLifecycle, "post-shutdown"))
140141
pprof.SetGoroutineLabels(atShutdownCtx)
141142
for _, fn := range g.toRunAtShutdown {
142143
go fn()
@@ -167,7 +168,7 @@ func (g *Manager) doHammerTime(d time.Duration) {
167168
default:
168169
log.Warn("Setting Hammer condition")
169170
g.hammerCtxCancel()
170-
atHammerCtx := pprof.WithLabels(g.terminateCtx, pprof.Labels(LifecyclePProfLabel, "post-hammer"))
171+
atHammerCtx := pprof.WithLabels(g.terminateCtx, pprof.Labels(gtprof.LabelGracefulLifecycle, "post-hammer"))
171172
pprof.SetGoroutineLabels(atHammerCtx)
172173
}
173174
g.lock.Unlock()
@@ -183,7 +184,7 @@ func (g *Manager) doTerminate() {
183184
default:
184185
log.Warn("Terminating")
185186
g.terminateCtxCancel()
186-
atTerminateCtx := pprof.WithLabels(g.managerCtx, pprof.Labels(LifecyclePProfLabel, "post-terminate"))
187+
atTerminateCtx := pprof.WithLabels(g.managerCtx, pprof.Labels(gtprof.LabelGracefulLifecycle, "post-terminate"))
187188
pprof.SetGoroutineLabels(atTerminateCtx)
188189

189190
for _, fn := range g.toRunAtTerminate {

modules/graceful/manager_common.go

+6-10
Original file line numberDiff line numberDiff line change
@@ -8,6 +8,8 @@ import (
88
"runtime/pprof"
99
"sync"
1010
"time"
11+
12+
"code.gitea.io/gitea/modules/gtprof"
1113
)
1214

1315
// FIXME: it seems that there is a bug when using systemd Type=notify: the "Install Page" (INSTALL_LOCK=false) doesn't notify properly.
@@ -22,12 +24,6 @@ const (
2224
watchdogMsg systemdNotifyMsg = "WATCHDOG=1"
2325
)
2426

25-
// LifecyclePProfLabel is a label marking manager lifecycle phase
26-
// Making it compliant with prometheus key regex https://prometheus.io/docs/concepts/data_model/#metric-names-and-labels
27-
// would enable someone interested to be able to to continuously gather profiles into pyroscope.
28-
// Other labels for pprof (in "modules/process" package) should also follow this rule.
29-
const LifecyclePProfLabel = "graceful_lifecycle"
30-
3127
func statusMsg(msg string) systemdNotifyMsg {
3228
return systemdNotifyMsg("STATUS=" + msg)
3329
}
@@ -71,10 +67,10 @@ func (g *Manager) prepare(ctx context.Context) {
7167
g.hammerCtx, g.hammerCtxCancel = context.WithCancel(ctx)
7268
g.managerCtx, g.managerCtxCancel = context.WithCancel(ctx)
7369

74-
g.terminateCtx = pprof.WithLabels(g.terminateCtx, pprof.Labels(LifecyclePProfLabel, "with-terminate"))
75-
g.shutdownCtx = pprof.WithLabels(g.shutdownCtx, pprof.Labels(LifecyclePProfLabel, "with-shutdown"))
76-
g.hammerCtx = pprof.WithLabels(g.hammerCtx, pprof.Labels(LifecyclePProfLabel, "with-hammer"))
77-
g.managerCtx = pprof.WithLabels(g.managerCtx, pprof.Labels(LifecyclePProfLabel, "with-manager"))
70+
g.terminateCtx = pprof.WithLabels(g.terminateCtx, pprof.Labels(gtprof.LabelGracefulLifecycle, "with-terminate"))
71+
g.shutdownCtx = pprof.WithLabels(g.shutdownCtx, pprof.Labels(gtprof.LabelGracefulLifecycle, "with-shutdown"))
72+
g.hammerCtx = pprof.WithLabels(g.hammerCtx, pprof.Labels(gtprof.LabelGracefulLifecycle, "with-hammer"))
73+
g.managerCtx = pprof.WithLabels(g.managerCtx, pprof.Labels(gtprof.LabelGracefulLifecycle, "with-manager"))
7874

7975
if !g.setStateTransition(stateInit, stateRunning) {
8076
panic("invalid graceful manager state: transition from init to running failed")

modules/gtprof/gtprof.go

+25
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,25 @@
1+
// Copyright 2024 The Gitea Authors. All rights reserved.
2+
// SPDX-License-Identifier: MIT
3+
4+
package gtprof
5+
6+
// This is a Gitea-specific profiling package,
7+
// the name is chosen to distinguish it from the standard pprof tool and "GNU gprof"
8+
9+
// LabelGracefulLifecycle is a label marking manager lifecycle phase
10+
// Making it compliant with prometheus key regex https://prometheus.io/docs/concepts/data_model/#metric-names-and-labels
11+
// would enable someone interested to be able to continuously gather profiles into pyroscope.
12+
// Other labels for pprof should also follow this rule.
13+
const LabelGracefulLifecycle = "graceful_lifecycle"
14+
15+
// LabelPid is a label set on goroutines that have a process attached
16+
const LabelPid = "pid"
17+
18+
// LabelPpid is a label set on goroutines that have a process attached
19+
const LabelPpid = "ppid"
20+
21+
// LabelProcessType is a label set on goroutines that have a process attached
22+
const LabelProcessType = "process_type"
23+
24+
// LabelProcessDescription is a label set on goroutines that have a process attached
25+
const LabelProcessDescription = "process_description"

0 commit comments

Comments
 (0)