# Fetch the current telemetry reading for GPU index 0 on node 'gpu-worker-1'.
metrics = client.telemetry.get_metrics(node='gpu-worker-1', gpu=0)

# Report the reading field by field.
print(f"GPU Utilization: {metrics.utilization}%")
# NOTE(review): dividing by 1e9 and labelling the result "GB" assumes
# memory_used is reported in bytes -- confirm against the telemetry API.
print(f"Memory Usage: {metrics.memory_used / 1e9:.1f} GB")
print(f"Temperature: {metrics.temperature}°C")
# Query stored metrics for node 'gpu-worker-1' between the two timestamps
# below (passed as strings with a trailing 'Z'; presumably UTC -- confirm).
# The result is kept in `historical` for later use.
historical = client.telemetry.get_historical_metrics(
    node='gpu-worker-1',
    start_time='2024-01-01T00:00:00Z',
    end_time='2024-01-02T00:00:00Z',
)
# Register a 'critical' alert rule named 'High GPU Temperature'.
# NOTE(review): presumably the rule fires once `gpu_temperature > 85` has
# held for the given duration ('5m') -- confirm the exact semantics of
# `condition` and `duration` against the telemetry API.
alert = client.telemetry.create_alert(
    name='High GPU Temperature',
    condition='gpu_temperature > 85',
    duration='5m',
    severity='critical',
)