Skip to content

Commit e116cfe

Browse files
committed
fix: worker metrics raw cost zero bug
1 parent 331e4bb commit e116cfe

File tree

3 files changed

+3
-1
lines changed

3 files changed

+3
-1
lines changed

.gitignore

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -38,3 +38,4 @@ tmp*
38 38   __debug*
39 39
40 40   vendor
   41 + logs

.vscode/launch.json

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -64,6 +64,7 @@
64 64   "ENABLE_CR_CONTROLLER": "true"
65 65   },
66 66   "args": [
   67 + "--metrics-path", "${workspaceFolder}/logs/metrics.log",
67 68   "--gpu-info-config", "${workspaceFolder}/config/samples/gpu-info-config.yaml",
68 69   "--dynamic-config", "${workspaceFolder}/config/samples/dynamic-config.yaml",
69 70   "--scheduler-config", "${workspaceFolder}/config/samples/scheduler-config.yaml",

internal/controller/tensorfusioncluster_controller.go

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -325,8 +325,8 @@ func (r *TensorFusionClusterReconciler) reconcileGPUPool(ctx context.Context, tf
325 325   errors = append(errors, fmt.Errorf("failed to update GPUPool %s: %w", key, err))
326 326   }
327 327   anyPoolChanged = true
328     - r.updateMetricsRecorder(ctx, existingPool)
329 328   }
    329 + r.updateMetricsRecorder(ctx, existingPool)
330 330   }
331 331   }
332 332

0 commit comments

Comments
 (0)