From 47a834eb80c97ffb278e9f727866eb0657002def Mon Sep 17 00:00:00 2001 From: lirui238 <2396601465@qq.com> Date: Fri, 6 Jun 2025 00:34:26 +0800 Subject: [PATCH 1/2] =?UTF-8?q?=E4=BF=AE=E6=94=B9=E8=AF=B4=E6=98=8E?= =?UTF-8?q?=E3=80=91[taskd]=20log?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .../taskd/go/framework_backend/manager/manager.go | 2 ++ .../taskd/taskd/go/framework_backend/worker/worker.go | 11 ++++------- 2 files changed, 6 insertions(+), 7 deletions(-) diff --git a/component/taskd/taskd/go/framework_backend/manager/manager.go b/component/taskd/taskd/go/framework_backend/manager/manager.go index 4579ea240..07e034613 100644 --- a/component/taskd/taskd/go/framework_backend/manager/manager.go +++ b/component/taskd/taskd/go/framework_backend/manager/manager.go @@ -88,6 +88,7 @@ func (m *BaseManager) Init() error { fmt.Printf("manager init hwlog failed, err: %v \n", err) return err } + hwlog.RunLog.Infof("manager config: %v", m.Config) m.svcCtx, m.cancelFunc = context.WithCancel(context.Background()) m.MsgHd = application.NewMsgHandler() m.MsgHd.Start(m.svcCtx) @@ -153,6 +154,7 @@ func (m *BaseManager) registerClusterD(retryTime time.Duration) { hwlog.RunLog.Errorf("get clusterd address err: %v", err) return } + hwlog.RunLog.Info("get clusterd addr %v", addr) conn, err := grpc.Dial(addr, grpc.WithTransportCredentials(insecure.NewCredentials())) if err != nil { hwlog.RunLog.Errorf("init clusterd connect err: %v", err) diff --git a/component/taskd/taskd/go/framework_backend/worker/worker.go b/component/taskd/taskd/go/framework_backend/worker/worker.go index 59ff21b56..220d69e4b 100644 --- a/component/taskd/taskd/go/framework_backend/worker/worker.go +++ b/component/taskd/taskd/go/framework_backend/worker/worker.go @@ -18,7 +18,6 @@ package worker import "C" import ( "context" - "os" "strconv" "time" @@ -35,7 +34,7 @@ var monitorInitCtx context.Context var monitorInitNotify context.CancelFunc const ( - waitInitMsptiTimeout = 60 * time.Second + waitInitMsptiTimeout = 180 * time.Second ) func init() { @@ -59,13 +58,10 @@ func InitMonitor(ctx context.Context, globalRank int, upperLimitOfDiskInMb int) // InitNetwork register worker to manager func InitNetwork(globalRank, nodeRank int) { + hwlog.RunLog.Infof("worker %d init network begin", globalRank) profiling.GlobalRank = globalRank profiling.NodeRank = nodeRank - ip := os.Getenv("POD_IP") - if ip == "" { - ip = "127.0.0.1" - } - addr := ip + constant.ProxyPort + addr := constant.DefaultIP + constant.ProxyPort var err error netTool, err = net.InitNetwork(&common.TaskNetConfig{ Pos: common.Position{ @@ -81,6 +77,7 @@ func InitNetwork(globalRank, nodeRank int) { if err != nil { hwlog.RunLog.Errorf("worker %d init network err: %v", globalRank, err) } + hwlog.RunLog.Infof("worker %d init network end", globalRank) profiling.NetTool = netTool profiling.NetToolInitNotify() } -- Gitee From fd5c09874425efdb602d265d7a14c350efc8bdd9 Mon Sep 17 00:00:00 2001 From: lirui238 <2396601465@qq.com> Date: Fri, 6 Jun 2025 10:02:18 +0800 Subject: [PATCH 2/2] =?UTF-8?q?=E4=BF=AE=E6=94=B9=E8=AF=B4=E6=98=8E?= =?UTF-8?q?=E3=80=91[taskd]=20log?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- component/taskd/taskd/go/framework_backend/manager/manager.go | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/component/taskd/taskd/go/framework_backend/manager/manager.go b/component/taskd/taskd/go/framework_backend/manager/manager.go index 07e034613..096aa3847 100644 --- a/component/taskd/taskd/go/framework_backend/manager/manager.go +++ b/component/taskd/taskd/go/framework_backend/manager/manager.go @@ -154,7 +154,7 @@ func (m *BaseManager) registerClusterD(retryTime time.Duration) { hwlog.RunLog.Errorf("get clusterd address err: %v", err) return } - hwlog.RunLog.Info("get clusterd addr %v", addr) + hwlog.RunLog.Infof("get clusterd addr %v", addr) conn, err := grpc.Dial(addr, grpc.WithTransportCredentials(insecure.NewCredentials())) if err != nil { hwlog.RunLog.Errorf("init clusterd connect err: %v", err) -- Gitee