@@ -125,6 +125,7 @@ func AddRunningCluster(taskCache entity.TaskCache, nodeName string) error {
node.Parallelism--
nodeJson, _ := GpuNodeToJson(node)
_, _ = infra.GlobalRedisClient.LSet(global.KeyGpuNodeList, int64(i), nodeJson).Result()
+ infra.GlobalLogger.Infof("节点 %v 并行度减一后剩余并行度为 %v。", node.Hostname, node.Parallelism)
}
global.ParallelismMutex.Unlock()
@@ -39,7 +39,7 @@ gpu-node-list:
k8s:
pod-yaml-dir: /mnt/disk001/cicv-data-closedloop/pod-yaml/
- vtd-pod-template-yaml: /mnt/disk001/cicv-data-closedloop/pod-template/vtd-pod-template.yaml
+ vtd-pod-template-yaml: /mnt/disk001/cicv-data-closedloop/amd64/dispatch_server/vtd-pod-template_20240506.yaml
algorithm-tar-temp-dir: /mnt/disk001/cicv-data-closedloop/temp/algorithm/
registry-uri: 10.14.85.237:5000
namespace-name: cicvdcl