Enhance synctrace logging.

Switched the maps to be indexed by the .Pointer (not a string)
Grouped the lockCount, unlockCount ,and lastLock in an trackingEntry so we can detect unlocks of something that wasn't ever locked and excessive unlocks and also tracks the first time locked and the last unlock time.
Added LogDangledLocks for debugging use.
Added a panic handler to the Main so we can log out panics
This commit is contained in:
Marc Brooks 2025-11-18 17:50:54 -06:00
parent d49e2680d0
commit 979b32b86c
No known key found for this signature in database
GPG Key ID: 583A6AF2D6AE1DC6
3 changed files with 118 additions and 48 deletions

View File

@ -10,6 +10,7 @@ import (
"time" "time"
"github.com/jetkvm/kvm/internal/logging" "github.com/jetkvm/kvm/internal/logging"
"github.com/rs/zerolog" "github.com/rs/zerolog"
) )
@ -47,103 +48,160 @@ func logTrack(callerSkip int) *zerolog.Logger {
return &l return &l
} }
func logLockTrack(i string) *zerolog.Logger { func logLockTrack(ptr uintptr) *zerolog.Logger {
l := logTrack(4). l := logTrack(4).
With(). With().
Str("index", i). Str("ptr", fmt.Sprintf("%x", ptr)).
Logger() Logger()
return &l return &l
} }
var (
indexMu sync.Mutex
lockCount map[string]int = make(map[string]int)
unlockCount map[string]int = make(map[string]int)
lastLock map[string]time.Time = make(map[string]time.Time)
)
type trackable interface { type trackable interface {
sync.Locker sync.Locker
} }
func getIndex(t trackable) string { type trackingEntry struct {
ptr := reflect.ValueOf(t).Pointer() lockCount int
return fmt.Sprintf("%x", ptr) unlockCount int
firstLock time.Time
lastLock time.Time
lastUnlock time.Time
} }
func increaseLockCount(i string) { var (
indexMu sync.Mutex
tracking map[uintptr]*trackingEntry = make(map[uintptr]*trackingEntry)
)
func getPointer(t trackable) uintptr {
return reflect.ValueOf(t).Pointer()
}
func increaseLockCount(ptr uintptr) {
indexMu.Lock() indexMu.Lock()
defer indexMu.Unlock() defer indexMu.Unlock()
if _, ok := lockCount[i]; !ok { entry, ok := tracking[ptr]
lockCount[i] = 0 if !ok {
} entry = &trackingEntry{}
lockCount[i]++ entry.firstLock = time.Now()
tracking[ptr] = entry
if _, ok := lastLock[i]; !ok {
lastLock[i] = time.Now()
} }
entry.lockCount++
entry.lastLock = time.Now()
} }
func increaseUnlockCount(i string) { func increaseUnlockCount(ptr uintptr) {
indexMu.Lock() indexMu.Lock()
defer indexMu.Unlock()
if _, ok := unlockCount[i]; !ok { entry, ok := tracking[ptr]
unlockCount[i] = 0 if !ok {
entry = &trackingEntry{}
tracking[ptr] = entry
}
entry.unlockCount++
entry.lastUnlock = time.Now()
delta := entry.lockCount - entry.unlockCount
indexMu.Unlock()
if !ok {
logLockTrack(ptr).Warn().Interface("entry", entry).Msg("Unlock called without prior Lock")
}
if delta < 0 {
logLockTrack(ptr).Warn().Interface("entry", entry).Msg("Unlock called more times than Lock")
} }
unlockCount[i]++
} }
func logLock(t trackable) { func logLock(t trackable) {
i := getIndex(t) ptr := getPointer(t)
increaseLockCount(i) increaseLockCount(ptr)
logLockTrack(i).Trace().Msg("locking mutex") logLockTrack(ptr).Trace().Msg("locking mutex")
} }
func logUnlock(t trackable) { func logUnlock(t trackable) {
i := getIndex(t) ptr := getPointer(t)
increaseUnlockCount(i) increaseUnlockCount(ptr)
logLockTrack(i).Trace().Msg("unlocking mutex") logLockTrack(ptr).Trace().Msg("unlocking mutex")
} }
func logTryLock(t trackable) { func logTryLock(t trackable) {
i := getIndex(t) ptr := getPointer(t)
logLockTrack(i).Trace().Msg("trying to lock mutex") logLockTrack(ptr).Trace().Msg("trying to lock mutex")
} }
func logTryLockResult(t trackable, l bool) { func logTryLockResult(t trackable, l bool) {
if !l { if !l {
return return
} }
i := getIndex(t) ptr := getPointer(t)
increaseLockCount(i) increaseLockCount(ptr)
logLockTrack(i).Trace().Msg("locked mutex") logLockTrack(ptr).Trace().Msg("locked mutex")
} }
func logRLock(t trackable) { func logRLock(t trackable) {
i := getIndex(t) ptr := getPointer(t)
increaseLockCount(i) increaseLockCount(ptr)
logLockTrack(i).Trace().Msg("locking mutex for reading") logLockTrack(ptr).Trace().Msg("locking mutex for reading")
} }
func logRUnlock(t trackable) { func logRUnlock(t trackable) {
i := getIndex(t) ptr := getPointer(t)
increaseUnlockCount(i) increaseUnlockCount(ptr)
logLockTrack(i).Trace().Msg("unlocking mutex for reading") logLockTrack(ptr).Trace().Msg("unlocking mutex for reading")
} }
func logTryRLock(t trackable) { func logTryRLock(t trackable) {
i := getIndex(t) ptr := getPointer(t)
logLockTrack(i).Trace().Msg("trying to lock mutex for reading") logLockTrack(ptr).Trace().Msg("trying to lock mutex for reading")
} }
func logTryRLockResult(t trackable, l bool) { func logTryRLockResult(t trackable, l bool) {
if !l { if !l {
return return
} }
i := getIndex(t) ptr := getPointer(t)
increaseLockCount(i) increaseLockCount(ptr)
logLockTrack(i).Trace().Msg("locked mutex for reading") logLockTrack(ptr).Trace().Msg("locked mutex for reading")
}
// You can all this function at any time to log any dangled locks currently tracked
// it's not an error for there to be open locks, but this can help identify any
// potential issues if called judiciously
func LogDangledLocks() {
defaultLogger.Info().Msgf("Checking %v tracked locks for dangles", len(tracking))
indexMu.Lock()
var issues []struct {
ptr uintptr
entry trackingEntry
}
for ptr, entry := range tracking {
if entry.lockCount != entry.unlockCount {
issues = append(issues, struct {
ptr uintptr
entry trackingEntry
}{ptr, *entry})
}
}
indexMu.Unlock()
defaultLogger.Info().Msgf("%v potential issues", len(issues))
for _, issue := range issues {
ptr := issue.ptr
entry := issue.entry
delta := entry.lockCount - entry.unlockCount
failureType := "excess unlocks"
if delta > 0 {
failureType = "held locks"
}
defaultLogger.Warn().
Str("ptr", fmt.Sprintf("%x", ptr)).
Interface("entry", entry).
Int("delta", delta).
Msgf("dangled lock detected: %s", failureType)
}
} }

View File

@ -90,3 +90,7 @@ type Once struct {
func (o *Once) Do(f func()) { func (o *Once) Do(f func()) {
o.mu.Do(f) o.mu.Do(f)
} }
// logDangledLocks is a no-op in non-synctrace builds
func LogDangledLocks() {
}

View File

@ -16,6 +16,13 @@ var appCtx context.Context
func Main() { func Main() {
logger.Log().Msg("JetKVM Starting Up") logger.Log().Msg("JetKVM Starting Up")
defer func() {
if r := recover(); r != nil {
logger.Panic().Interface("error", r).Msg("Received panic")
panic(r) // Re-panic to crash as usual
}
}()
checkFailsafeReason() checkFailsafeReason()
if failsafeModeActive { if failsafeModeActive {
logger.Warn().Str("reason", failsafeModeReason).Msg("failsafe mode activated") logger.Warn().Str("reason", failsafeModeReason).Msg("failsafe mode activated")
@ -140,6 +147,7 @@ func Main() {
<-sigs <-sigs
logger.Log().Msg("JetKVM Shutting Down") logger.Log().Msg("JetKVM Shutting Down")
//if fuseServer != nil { //if fuseServer != nil {
// err := setMassStorageImage(" ") // err := setMassStorageImage(" ")
// if err != nil { // if err != nil {