Class PerformanceStats (0.1.0)

public final class PerformanceStats extends GeneratedMessageV3 implements PerformanceStatsOrBuilder

Performance statistics for a model deployment.

Protobuf type google.cloud.gkerecommender.v1.PerformanceStats

Static Fields

COST_FIELD_NUMBER

public static final int COST_FIELD_NUMBER
Field Value
Type Description
int

NTPOT_MILLISECONDS_FIELD_NUMBER

public static final int NTPOT_MILLISECONDS_FIELD_NUMBER
Field Value
Type Description
int

OUTPUT_TOKENS_PER_SECOND_FIELD_NUMBER

public static final int OUTPUT_TOKENS_PER_SECOND_FIELD_NUMBER
Field Value
Type Description
int

QUERIES_PER_SECOND_FIELD_NUMBER

public static final int QUERIES_PER_SECOND_FIELD_NUMBER
Field Value
Type Description
int

TTFT_MILLISECONDS_FIELD_NUMBER

public static final int TTFT_MILLISECONDS_FIELD_NUMBER
Field Value
Type Description
int

Static Methods

getDefaultInstance()

public static PerformanceStats getDefaultInstance()
Returns
Type Description
PerformanceStats

getDescriptor()

public static final Descriptors.Descriptor getDescriptor()
Returns
Type Description
Descriptor

newBuilder()

public static PerformanceStats.Builder newBuilder()
Returns
Type Description
PerformanceStats.Builder

newBuilder(PerformanceStats prototype)

public static PerformanceStats.Builder newBuilder(PerformanceStats prototype)
Parameter
Name Description
prototype PerformanceStats
Returns
Type Description
PerformanceStats.Builder

parseDelimitedFrom(InputStream input)

public static PerformanceStats parseDelimitedFrom(InputStream input)
Parameter
Name Description
input InputStream
Returns
Type Description
PerformanceStats
Exceptions
Type Description
IOException

parseDelimitedFrom(InputStream input, ExtensionRegistryLite extensionRegistry)

public static PerformanceStats parseDelimitedFrom(InputStream input, ExtensionRegistryLite extensionRegistry)
Parameters
Name Description
input InputStream
extensionRegistry ExtensionRegistryLite
Returns
Type Description
PerformanceStats
Exceptions
Type Description
IOException

parseFrom(byte[] data)

public static PerformanceStats parseFrom(byte[] data)
Parameter
Name Description
data byte[]
Returns
Type Description
PerformanceStats
Exceptions
Type Description
InvalidProtocolBufferException

parseFrom(byte[] data, ExtensionRegistryLite extensionRegistry)

public static PerformanceStats parseFrom(byte[] data, ExtensionRegistryLite extensionRegistry)
Parameters
Name Description
data byte[]
extensionRegistry ExtensionRegistryLite
Returns
Type Description
PerformanceStats
Exceptions
Type Description
InvalidProtocolBufferException

parseFrom(ByteString data)

public static PerformanceStats parseFrom(ByteString data)
Parameter
Name Description
data ByteString
Returns
Type Description
PerformanceStats
Exceptions
Type Description
InvalidProtocolBufferException

parseFrom(ByteString data, ExtensionRegistryLite extensionRegistry)

public static PerformanceStats parseFrom(ByteString data, ExtensionRegistryLite extensionRegistry)
Parameters
Name Description
data ByteString
extensionRegistry ExtensionRegistryLite
Returns
Type Description
PerformanceStats
Exceptions
Type Description
InvalidProtocolBufferException

parseFrom(CodedInputStream input)

public static PerformanceStats parseFrom(CodedInputStream input)
Parameter
Name Description
input CodedInputStream
Returns
Type Description
PerformanceStats
Exceptions
Type Description
IOException

parseFrom(CodedInputStream input, ExtensionRegistryLite extensionRegistry)

public static PerformanceStats parseFrom(CodedInputStream input, ExtensionRegistryLite extensionRegistry)
Parameters
Name Description
input CodedInputStream
extensionRegistry ExtensionRegistryLite
Returns
Type Description
PerformanceStats
Exceptions
Type Description
IOException

parseFrom(InputStream input)

public static PerformanceStats parseFrom(InputStream input)
Parameter
Name Description
input InputStream
Returns
Type Description
PerformanceStats
Exceptions
Type Description
IOException

parseFrom(InputStream input, ExtensionRegistryLite extensionRegistry)

public static PerformanceStats parseFrom(InputStream input, ExtensionRegistryLite extensionRegistry)
Parameters
Name Description
input InputStream
extensionRegistry ExtensionRegistryLite
Returns
Type Description
PerformanceStats
Exceptions
Type Description
IOException

parseFrom(ByteBuffer data)

public static PerformanceStats parseFrom(ByteBuffer data)
Parameter
Name Description
data ByteBuffer
Returns
Type Description
PerformanceStats
Exceptions
Type Description
InvalidProtocolBufferException

parseFrom(ByteBuffer data, ExtensionRegistryLite extensionRegistry)

public static PerformanceStats parseFrom(ByteBuffer data, ExtensionRegistryLite extensionRegistry)
Parameters
Name Description
data ByteBuffer
extensionRegistry ExtensionRegistryLite
Returns
Type Description
PerformanceStats
Exceptions
Type Description
InvalidProtocolBufferException

parser()

public static Parser<PerformanceStats> parser()
Returns
Type Description
Parser<PerformanceStats>

Methods

equals(Object obj)

public boolean equals(Object obj)
Parameter
Name Description
obj Object
Returns
Type Description
boolean
Overrides
AbstractMessage.equals(Object)

getCost(int index)

public Cost getCost(int index)

Output only. The cost of running the model deployment.

repeated .google.cloud.gkerecommender.v1.Cost cost = 5 [(.google.api.field_behavior) = OUTPUT_ONLY];

Parameter
Name Description
index int
Returns
Type Description
Cost

getCostCount()

public int getCostCount()

Output only. The cost of running the model deployment.

repeated .google.cloud.gkerecommender.v1.Cost cost = 5 [(.google.api.field_behavior) = OUTPUT_ONLY];

Returns
Type Description
int

getCostList()

public List<Cost> getCostList()

Output only. The cost of running the model deployment.

repeated .google.cloud.gkerecommender.v1.Cost cost = 5 [(.google.api.field_behavior) = OUTPUT_ONLY];

Returns
Type Description
List<Cost>

getCostOrBuilder(int index)

public CostOrBuilder getCostOrBuilder(int index)

Output only. The cost of running the model deployment.

repeated .google.cloud.gkerecommender.v1.Cost cost = 5 [(.google.api.field_behavior) = OUTPUT_ONLY];

Parameter
Name Description
index int
Returns
Type Description
CostOrBuilder

getCostOrBuilderList()

public List<? extends CostOrBuilder> getCostOrBuilderList()

Output only. The cost of running the model deployment.

repeated .google.cloud.gkerecommender.v1.Cost cost = 5 [(.google.api.field_behavior) = OUTPUT_ONLY];

Returns
Type Description
List<? extends com.google.cloud.gkerecommender.v1.CostOrBuilder>

getDefaultInstanceForType()

public PerformanceStats getDefaultInstanceForType()
Returns
Type Description
PerformanceStats

getNtpotMilliseconds()

public int getNtpotMilliseconds()

Output only. The Normalized Time Per Output Token (NTPOT) in milliseconds. This is the request latency normalized by the number of output tokens, measured as request_latency / total_output_tokens.

int32 ntpot_milliseconds = 3 [(.google.api.field_behavior) = OUTPUT_ONLY];

Returns
Type Description
int The ntpotMilliseconds.

getOutputTokensPerSecond()

public int getOutputTokensPerSecond()

Output only. The number of output tokens per second. This is the throughput measured as total_output_tokens_generated_by_server / elapsed_time_in_seconds.

int32 output_tokens_per_second = 2 [(.google.api.field_behavior) = OUTPUT_ONLY];

Returns
Type Description
int The outputTokensPerSecond.

getParserForType()

public Parser<PerformanceStats> getParserForType()
Returns
Type Description
Parser<PerformanceStats>
Overrides
GeneratedMessageV3.getParserForType()

getQueriesPerSecond()

public float getQueriesPerSecond()

Output only. The number of queries per second. Note: This metric can vary widely based on context length and may not be a reliable measure of LLM throughput.

float queries_per_second = 1 [(.google.api.field_behavior) = OUTPUT_ONLY];

Returns
Type Description
float The queriesPerSecond.

getSerializedSize()

public int getSerializedSize()
Returns
Type Description
int
Overrides
GeneratedMessageV3.getSerializedSize()

getTtftMilliseconds()

public int getTtftMilliseconds()

Output only. The Time To First Token (TTFT) in milliseconds. This is the time it takes to generate the first token for a request.

int32 ttft_milliseconds = 4 [(.google.api.field_behavior) = OUTPUT_ONLY];

Returns
Type Description
int The ttftMilliseconds.

hashCode()

public int hashCode()
Returns
Type Description
int
Overrides
AbstractMessage.hashCode()

internalGetFieldAccessorTable()

protected GeneratedMessageV3.FieldAccessorTable internalGetFieldAccessorTable()
Returns
Type Description
FieldAccessorTable
Overrides
GeneratedMessageV3.internalGetFieldAccessorTable()

isInitialized()

public final boolean isInitialized()
Returns
Type Description
boolean
Overrides
GeneratedMessageV3.isInitialized()

newBuilderForType()

public PerformanceStats.Builder newBuilderForType()
Returns
Type Description
PerformanceStats.Builder

newBuilderForType(GeneratedMessageV3.BuilderParent parent)

protected PerformanceStats.Builder newBuilderForType(GeneratedMessageV3.BuilderParent parent)
Parameter
Name Description
parent BuilderParent
Returns
Type Description
PerformanceStats.Builder
Overrides
GeneratedMessageV3.newBuilderForType(GeneratedMessageV3.BuilderParent)

newInstance(GeneratedMessageV3.UnusedPrivateParameter unused)

protected Object newInstance(GeneratedMessageV3.UnusedPrivateParameter unused)
Parameter
Name Description
unused UnusedPrivateParameter
Returns
Type Description
Object
Overrides
GeneratedMessageV3.newInstance(GeneratedMessageV3.UnusedPrivateParameter)

toBuilder()

public PerformanceStats.Builder toBuilder()
Returns
Type Description
PerformanceStats.Builder

writeTo(CodedOutputStream output)

public void writeTo(CodedOutputStream output)
Parameter
Name Description
output CodedOutputStream
Overrides
GeneratedMessageV3.writeTo(CodedOutputStream)
Exceptions
Type Description
IOException