LingxinMeng 1 year ago
parent
commit
257fccafa4

+ 1 - 0
amd64/dispatch_server/package/domain/comm_with_redis.go

@@ -125,6 +125,7 @@ func AddRunningCluster(taskCache entity.TaskCache, nodeName string) error {
 			node.Parallelism--
 			nodeJson, _ := GpuNodeToJson(node)
 			_, _ = infra.GlobalRedisClient.LSet(global.KeyGpuNodeList, int64(i), nodeJson).Result()
+			infra.GlobalLogger.Infof("节点 %v 并行度减一后剩余并行度为 %v。", node.Hostname, node.Parallelism)
 		}
 	}
 	global.ParallelismMutex.Unlock()

+ 1 - 1
amd64/dispatch_server/package/infra/application.yaml

@@ -39,7 +39,7 @@ gpu-node-list:
 
 k8s:
   pod-yaml-dir: /mnt/disk001/cicv-data-closedloop/pod-yaml/
-  vtd-pod-template-yaml: /mnt/disk001/cicv-data-closedloop/pod-template/vtd-pod-template.yaml
+  vtd-pod-template-yaml: /mnt/disk001/cicv-data-closedloop/amd64/dispatch_server/vtd-pod-template_20240506.yaml
   algorithm-tar-temp-dir: /mnt/disk001/cicv-data-closedloop/temp/algorithm/
   registry-uri: 10.14.85.237:5000
   namespace-name: cicvdcl