// Copyright 2022 The Gitea Authors. All rights reserved. // SPDX-License-Identifier: MIT package process import ( "bytes" "fmt" "runtime/pprof" "sort" "time" "github.com/google/pprof/profile" ) // StackEntry is an entry on a stacktrace type StackEntry struct { Function string File string Line int } // Label represents a pprof label assigned to goroutine stack type Label struct { Name string Value string } // Stack is a stacktrace relating to a goroutine. (Multiple goroutines may have the same stacktrace) type Stack struct { Count int64 // Number of goroutines with this stack trace Description string Labels []*Label `json:",omitempty"` Entry []*StackEntry `json:",omitempty"` } // A Process is a combined representation of a Process and a Stacktrace for the goroutines associated with it type Process struct { PID IDType ParentPID IDType Description string Start time.Time Type string Children []*Process `json:",omitempty"` Stacks []*Stack `json:",omitempty"` } // Processes gets the processes in a thread safe manner func (pm *Manager) Processes(flat, noSystem bool) ([]*Process, int) { pm.mutex.Lock() processCount := len(pm.processMap) processes := make([]*Process, 0, len(pm.processMap)) if flat { for _, process := range pm.processMap { if noSystem && process.Type == SystemProcessType { continue } processes = append(processes, process.toProcess()) } } else { // We need our own processMap processMap := map[IDType]*Process{} for _, internalProcess := range pm.processMap { process, ok := processMap[internalProcess.PID] if !ok { process = internalProcess.toProcess() processMap[process.PID] = process } // Check its parent if process.ParentPID == "" { processes = append(processes, process) continue } internalParentProcess, ok := pm.processMap[internalProcess.ParentPID] if ok { parentProcess, ok := processMap[process.ParentPID] if !ok { parentProcess = internalParentProcess.toProcess() processMap[parentProcess.PID] = parentProcess } parentProcess.Children = append(parentProcess.Children, process) continue } processes = append(processes, process) } } pm.mutex.Unlock() if !flat && noSystem { for i := 0; i < len(processes); i++ { process := processes[i] if process.Type != SystemProcessType { continue } processes[len(processes)-1], processes[i] = processes[i], processes[len(processes)-1] processes = append(processes[:len(processes)-1], process.Children...) i-- } } // Sort by process' start time. Oldest process appears first. sort.Slice(processes, func(i, j int) bool { left, right := processes[i], processes[j] return left.Start.Before(right.Start) }) return processes, processCount } // ProcessStacktraces gets the processes and stacktraces in a thread safe manner func (pm *Manager) ProcessStacktraces(flat, noSystem bool) ([]*Process, int, int64, error) { var stacks *profile.Profile var err error // We cannot use the pm.ProcessMap here because we will release the mutex ... processMap := map[IDType]*Process{} var processCount int // Lock the manager pm.mutex.Lock() processCount = len(pm.processMap) // Add a defer to unlock in case there is a panic unlocked := false defer func() { if !unlocked { pm.mutex.Unlock() } }() processes := make([]*Process, 0, len(pm.processMap)) if flat { for _, internalProcess := range pm.processMap { process := internalProcess.toProcess() processMap[process.PID] = process if noSystem && internalProcess.Type == SystemProcessType { continue } processes = append(processes, process) } } else { for _, internalProcess := range pm.processMap { process, ok := processMap[internalProcess.PID] if !ok { process = internalProcess.toProcess() processMap[process.PID] = process } // Check its parent if process.ParentPID == "" { processes = append(processes, process) continue } internalParentProcess, ok := pm.processMap[internalProcess.ParentPID] if ok { parentProcess, ok := processMap[process.ParentPID] if !ok { parentProcess = internalParentProcess.toProcess() processMap[parentProcess.PID] = parentProcess } parentProcess.Children = append(parentProcess.Children, process) continue } processes = append(processes, process) } } // Now from within the lock we need to get the goroutines. // Why? If we release the lock then between between filling the above map and getting // the stacktraces another process could be created which would then look like a dead process below var buf bytes.Buffer if err := pprof.Lookup("goroutine").WriteTo(&buf, 0); err != nil { return nil, 0, 0, err } stacks, err = profile.ParseData(buf.Bytes()) if err != nil { return nil, 0, 0, err } // Unlock the mutex pm.mutex.Unlock() unlocked = true goroutineCount := int64(0) // Now walk through the "Sample" slice in the goroutines stack for _, sample := range stacks.Sample { // In the "goroutine" pprof profile each sample represents one or more goroutines // with the same labels and stacktraces. // We will represent each goroutine by a `Stack` stack := &Stack{} // Add the non-process associated labels from the goroutine sample to the Stack for name, value := range sample.Label { if name == DescriptionPProfLabel || name == PIDPProfLabel || (!flat && name == PPIDPProfLabel) || name == ProcessTypePProfLabel { continue } // Labels from the "goroutine" pprof profile only have one value. // This is because the underlying representation is a map[string]string if len(value) != 1 { // Unexpected... return nil, 0, 0, fmt.Errorf("label: %s in goroutine stack with unexpected number of values: %v", name, value) } stack.Labels = append(stack.Labels, &Label{Name: name, Value: value[0]}) } // The number of goroutines that this sample represents is the `stack.Value[0]` stack.Count = sample.Value[0] goroutineCount += stack.Count // Now we want to associate this Stack with a Process. var process *Process // Try to get the PID from the goroutine labels if pidvalue, ok := sample.Label[PIDPProfLabel]; ok && len(pidvalue) == 1 { pid := IDType(pidvalue[0]) // Now try to get the process from our map process, ok = processMap[pid] if !ok && pid != "" { // This means that no process has been found in the process map - but there was a process PID // Therefore this goroutine belongs to a dead process and it has escaped control of the process as it // should have died with the process context cancellation. // We need to create a dead process holder for this process and label it appropriately // get the parent PID ppid := IDType("") if value, ok := sample.Label[PPIDPProfLabel]; ok && len(value) == 1 { ppid = IDType(value[0]) } // format the description description := "(dead process)" if value, ok := sample.Label[DescriptionPProfLabel]; ok && len(value) == 1 { description = value[0] + " " + description } // override the type of the process to "code" but add the old type as a label on the first stack ptype := NoneProcessType if value, ok := sample.Label[ProcessTypePProfLabel]; ok && len(value) == 1 { stack.Labels = append(stack.Labels, &Label{Name: ProcessTypePProfLabel, Value: value[0]}) } process = &Process{ PID: pid, ParentPID: ppid, Description: description, Type: ptype, } // Now add the dead process back to the map and tree so we don't go back through this again. processMap[process.PID] = process added := false if process.ParentPID != "" && !flat { if parent, ok := processMap[process.ParentPID]; ok { parent.Children = append(parent.Children, process) added = true } } if !added { processes = append(processes, process) } } } if process == nil { // This means that the sample we're looking has no PID label var ok bool process, ok = processMap[""] if !ok { // this is the first time we've come acrross an unassociated goroutine so create a "process" to hold them process = &Process{ Description: "(unassociated)", Type: NoneProcessType, } processMap[process.PID] = process processes = append(processes, process) } } // The sample.Location represents a stack trace for this goroutine, // however each Location can represent multiple lines (mostly due to inlining) // so we need to walk the lines too for _, location := range sample.Location { for _, line := range location.Line { entry := &StackEntry{ Function: line.Function.Name, File: line.Function.Filename, Line: int(line.Line), } stack.Entry = append(stack.Entry, entry) } } // Now we need a short-descriptive name to call the stack trace if when it is folded and // assuming the stack trace has some lines we'll choose the bottom of the stack (i.e. the // initial function that started the stack trace.) The top of the stack is unlikely to // be very helpful as a lot of the time it will be runtime.select or some other call into // a std library. stack.Description = "(unknown)" if len(stack.Entry) > 0 { stack.Description = stack.Entry[len(stack.Entry)-1].Function } process.Stacks = append(process.Stacks, stack) } // restrict to not show system processes if noSystem { for i := 0; i < len(processes); i++ { process := processes[i] if process.Type != SystemProcessType && process.Type != NoneProcessType { continue } processes[len(processes)-1], processes[i] = processes[i], processes[len(processes)-1] processes = append(processes[:len(processes)-1], process.Children...) i-- } } // Now finally re-sort the processes. Newest process appears first after := func(processes []*Process) func(i, j int) bool { return func(i, j int) bool { left, right := processes[i], processes[j] return left.Start.After(right.Start) } } sort.Slice(processes, after(processes)) if !flat { var sortChildren func(process *Process) sortChildren = func(process *Process) { sort.Slice(process.Children, after(process.Children)) for _, child := range process.Children { sortChildren(child) } } } return processes, processCount, goroutineCount, err }