Table of Contents

Class DeviceHealthInfo

Namespace
Orleans.GpuBridge.Abstractions.Models
Assembly
Orleans.GpuBridge.Abstractions.dll

Comprehensive device health information for production monitoring

public sealed record DeviceHealthInfo : IEquatable<DeviceHealthInfo>
Inheritance
object → DeviceHealthInfo
Implements
IEquatable<DeviceHealthInfo>
Inherited Members

Properties

ConsecutiveFailures

Number of consecutive failed health checks

public int ConsecutiveFailures { get; init; }

Property Value

int

DeviceId

Device identifier

public string DeviceId { get; init; }

Property Value

string

ErrorCount

Error count since last reset

public int ErrorCount { get; init; }

Property Value

int

GpuUtilizationPercent

GPU utilization percentage (0-100)

public double GpuUtilizationPercent { get; init; }

Property Value

double

HealthScore

Overall health score (0.0 to 1.0, higher is better)

public double HealthScore { get; }

Property Value

double

IsHealthy

Whether the device is considered healthy

public bool IsHealthy { get; }

Property Value

bool

IsThermalThrottling

Whether the device is currently thermal throttling

public bool IsThermalThrottling { get; init; }

Property Value

bool

LastCheckTime

Last health check timestamp

public DateTime LastCheckTime { get; init; }

Property Value

DateTime

MaxTemperatureCelsius

Maximum safe operating temperature in Celsius

public int MaxTemperatureCelsius { get; init; }

Property Value

int

MemoryUtilizationPercent

Memory utilization percentage (0-100)

public double MemoryUtilizationPercent { get; init; }

Property Value

double

PowerLimitWatts

Maximum power limit in watts

public double PowerLimitWatts { get; init; }

Property Value

double

PowerUsageWatts

Current power usage in watts

public double PowerUsageWatts { get; init; }

Property Value

double

PredictedFailureProbability

Predicted failure probability in the next hour (0.0 to 1.0)

public double PredictedFailureProbability { get; init; }

Property Value

double

Status

Current device status

public DeviceStatus Status { get; init; }

Property Value

DeviceStatus

TemperatureCelsius

Current device temperature in Celsius

public int TemperatureCelsius { get; init; }

Property Value

int

TimeSinceLastSuccess

Time since last successful operation

public TimeSpan TimeSinceLastSuccess { get; init; }

Property Value

TimeSpan