-
Notifications
You must be signed in to change notification settings - Fork 44
hami-webui 反复重启,且 hami-webui-be-oss 报下标越界 #52
Description
当 qwen3-1-7-int8 服务的 pod 启动时,原本正常 Running 的 hami-webui 会立刻崩溃,并且一直无法启动;关掉或删除该 qwen3 pod 后即可恢复正常。但是我们的系统必须部署并且会随机启动此类服务,请提供有效的解决方案。

INFO ts=2025-11-06T20:00:04+08:00 caller=util/util.go:336 msg=Decoded pod annos: poddevices map[NVIDIA:[[{0 GPU-86c7ecde-1d5d-3bd5-0a6b-09337b2f304d NVIDIA 4272 16 }]]]
INFO ts=2025-11-06T20:00:04+08:00 caller=util/util.go:336 msg=Decoded pod annos: poddevices map[NVIDIA:[[{0 GPU-86c7ecde-1d5d-3bd5-0a6b-09337b2f304d NVIDIA 4272 16 }]]]
E1106 20:00:04.601004 1 runtime.go:79] Observed a panic: runtime.boundsError{x:1, y:1, signed:true, code:0x0} (runtime error: index out of range [1] with length 1)
goroutine 72 [running]:
k8s.io/apimachinery/pkg/util/runtime.logPanic({0x1d3d580, 0xc00071eac8})
/go/pkg/mod/k8s.io/apimachinery@v0.30.1/pkg/util/runtime/runtime.go:75 +0x85
k8s.io/apimachinery/pkg/util/runtime.HandleCrash({0x0, 0x0, 0xc0002620e0?})
/go/pkg/mod/k8s.io/apimachinery@v0.30.1/pkg/util/runtime/runtime.go:49 +0x6b
panic({0x1d3d580?, 0xc00071eac8?})
/usr/local/go/src/runtime/panic.go:785 +0x132
vgpu/internal/data.(*podRepo).fetchContainerInfo(0xc0002620c0, 0xc000734008)
/src/internal/data/pod.go:145 +0x96b
vgpu/internal/data.(*podRepo).addPod(0xc0002620c0, 0xc000734008, {0xc000639818, 0x8}, 0xc0006fd650)
/src/internal/data/pod.go:93 +0x98
vgpu/internal/data.(*podRepo).onAddPod(0xc0002620c0, {0x1e3a4a0?, 0xc000734008?})
/src/internal/data/pod.go:70 +0x189
k8s.io/client-go/tools/cache.ResourceEventHandlerFuncs.OnAdd(...)
/go/pkg/mod/k8s.io/client-go@v0.30.1/tools/cache/controller.go:239
k8s.io/client-go/tools/cache.(*processorListener).run.func1()
/go/pkg/mod/k8s.io/client-go@v0.30.1/tools/cache/shared_informer.go:978 +0x13e
k8s.io/apimachinery/pkg/util/wait.BackoffUntil.func1(0x30?)
/go/pkg/mod/k8s.io/apimachinery@v0.30.1/pkg/util/wait/backoff.go:226 +0x33
k8s.io/apimachinery/pkg/util/wait.BackoffUntil(0xc000065f70, {0x26466c0, 0xc000163da0}, 0x1, 0xc0002487e0)
/go/pkg/mod/k8s.io/apimachinery@v0.30.1/pkg/util/wait/backoff.go:227 +0xaf
k8s.io/apimachinery/pkg/util/wait.JitterUntil(0xc0000b5770, 0x3b9aca00, 0x0, 0x1, 0xc0002487e0)
/go/pkg/mod/k8s.io/apimachinery@v0.30.1/pkg/util/wait/backoff.go:204 +0x7f
k8s.io/apimachinery/pkg/util/wait.Until(...)
/go/pkg/mod/k8s.io/apimachinery@v0.30.1/pkg/util/wait/backoff.go:161
k8s.io/client-go/tools/cache.(*processorListener).run(0xc0002407e0)
/go/pkg/mod/k8s.io/client-go@v0.30.1/tools/cache/shared_informer.go:972 +0x5a
k8s.io/apimachinery/pkg/util/wait.(*Group).Start.func1()
/go/pkg/mod/k8s.io/apimachinery@v0.30.1/pkg/util/wait/wait.go:72 +0x4c
created by k8s.io/apimachinery/pkg/util/wait.(*Group).Start in goroutine 67
/go/pkg/mod/k8s.io/apimachinery@v0.30.1/pkg/util/wait/wait.go:70 +0x73
panic: runtime error: index out of range [1] with length 1 [recovered]
panic: runtime error: index out of range [1] with length 1
goroutine 72 [running]:
k8s.io/apimachinery/pkg/util/runtime.HandleCrash({0x0, 0x0, 0xc0002620e0?})
/go/pkg/mod/k8s.io/apimachinery@v0.30.1/pkg/util/runtime/runtime.go:56 +0xcd
panic({0x1d3d580?, 0xc00071eac8?})
/usr/local/go/src/runtime/panic.go:785 +0x132
vgpu/internal/data.(*podRepo).fetchContainerInfo(0xc0002620c0, 0xc000734008)
/src/internal/data/pod.go:145 +0x96b
vgpu/internal/data.(*podRepo).addPod(0xc0002620c0, 0xc000734008, {0xc000639818, 0x8}, 0xc0006fd650)
/src/internal/data/pod.go:93 +0x98
vgpu/internal/data.(*podRepo).onAddPod(0xc0002620c0, {0x1e3a4a0?, 0xc000734008?})
/src/internal/data/pod.go:70 +0x189
k8s.io/client-go/tools/cache.ResourceEventHandlerFuncs.OnAdd(...)
/go/pkg/mod/k8s.io/client-go@v0.30.1/tools/cache/controller.go:239
k8s.io/client-go/tools/cache.(*processorListener).run.func1()
/go/pkg/mod/k8s.io/client-go@v0.30.1/tools/cache/shared_informer.go:978 +0x13e
k8s.io/apimachinery/pkg/util/wait.BackoffUntil.func1(0x30?)
/go/pkg/mod/k8s.io/apimachinery@v0.30.1/pkg/util/wait/backoff.go:226 +0x33
k8s.io/apimachinery/pkg/util/wait.BackoffUntil(0xc000065f70, {0x26466c0, 0xc000163da0}, 0x1, 0xc0002487e0)
/go/pkg/mod/k8s.io/apimachinery@v0.30.1/pkg/util/wait/backoff.go:227 +0xaf
k8s.io/apimachinery/pkg/util/wait.JitterUntil(0xc0000b5770, 0x3b9aca00, 0x0, 0x1, 0xc0002487e0)
/go/pkg/mod/k8s.io/apimachinery@v0.30.1/pkg/util/wait/backoff.go:204 +0x7f
k8s.io/apimachinery/pkg/util/wait.Until(...)
/go/pkg/mod/k8s.io/apimachinery@v0.30.1/pkg/util/wait/backoff.go:161
k8s.io/client-go/tools/cache.(*processorListener).run(0xc0002407e0)
/go/pkg/mod/k8s.io/client-go@v0.30.1/tools/cache/shared_informer.go:972 +0x5a
k8s.io/apimachinery/pkg/util/wait.(*Group).Start.func1()
/go/pkg/mod/k8s.io/apimachinery@v0.30.1/pkg/util/wait/wait.go:72 +0x4c
created by k8s.io/apimachinery/pkg/util/wait.(*Group).Start in goroutine 67
/go/pkg/mod/k8s.io/apimachinery@v0.30.1/pkg/util/wait/wait.go:70 +0x73
