Class PerformanceStats (0.1.0)
public final class PerformanceStats extends GeneratedMessageV3 implements PerformanceStatsOrBuilder
Performance statistics for a model deployment.
Protobuf type google.cloud.gkerecommender.v1.PerformanceStats
Inherited Members
com.google.protobuf.GeneratedMessageV3.<ListT>makeMutableCopy(ListT)
com.google.protobuf.GeneratedMessageV3.<ListT>makeMutableCopy(ListT,int)
com.google.protobuf.GeneratedMessageV3.<T>emptyList(java.lang.Class<T>)
com.google.protobuf.GeneratedMessageV3.internalGetMapFieldReflection(int)
Static Fields
public static final int COST_FIELD_NUMBER
Field Value
| Type | Description |
| --- | --- |
| int | |
public static final int NTPOT_MILLISECONDS_FIELD_NUMBER
Field Value
| Type | Description |
| --- | --- |
| int | |
public static final int OUTPUT_TOKENS_PER_SECOND_FIELD_NUMBER
Field Value
| Type | Description |
| --- | --- |
| int | |
public static final int QUERIES_PER_SECOND_FIELD_NUMBER
Field Value
| Type | Description |
| --- | --- |
| int | |
public static final int TTFT_MILLISECONDS_FIELD_NUMBER
Field Value
| Type | Description |
| --- | --- |
| int | |
Static Methods
public static PerformanceStats getDefaultInstance()
public static final Descriptors.Descriptor getDescriptor()
public static PerformanceStats.Builder newBuilder()
public static PerformanceStats.Builder newBuilder(PerformanceStats prototype)
public static PerformanceStats parseDelimitedFrom(InputStream input)
public static PerformanceStats parseDelimitedFrom(InputStream input, ExtensionRegistryLite extensionRegistry)
public static PerformanceStats parseFrom(byte[] data)
Parameter
| Name | Description |
| --- | --- |
| data | byte[] |
public static PerformanceStats parseFrom(byte[] data, ExtensionRegistryLite extensionRegistry)
public static PerformanceStats parseFrom(ByteString data)
public static PerformanceStats parseFrom(ByteString data, ExtensionRegistryLite extensionRegistry)
public static PerformanceStats parseFrom(CodedInputStream input)
public static PerformanceStats parseFrom(CodedInputStream input, ExtensionRegistryLite extensionRegistry)
public static PerformanceStats parseFrom(InputStream input)
public static PerformanceStats parseFrom(InputStream input, ExtensionRegistryLite extensionRegistry)
public static PerformanceStats parseFrom(ByteBuffer data)
public static PerformanceStats parseFrom(ByteBuffer data, ExtensionRegistryLite extensionRegistry)
public static Parser<PerformanceStats> parser()
Methods
public boolean equals(Object obj)
Parameter
| Name | Description |
| --- | --- |
| obj | Object |
Overrides
public Cost getCost(int index)
Output only. The cost of running the model deployment.
repeated .google.cloud.gkerecommender.v1.Cost cost = 5 [(.google.api.field_behavior) = OUTPUT_ONLY];
Parameter
| Name | Description |
| --- | --- |
| index | int |
Returns
| Type | Description |
| --- | --- |
| Cost | |
public int getCostCount()
Output only. The cost of running the model deployment.
repeated .google.cloud.gkerecommender.v1.Cost cost = 5 [(.google.api.field_behavior) = OUTPUT_ONLY];
Returns
| Type | Description |
| --- | --- |
| int | |
public List<Cost> getCostList()
Output only. The cost of running the model deployment.
repeated .google.cloud.gkerecommender.v1.Cost cost = 5 [(.google.api.field_behavior) = OUTPUT_ONLY];
public CostOrBuilder getCostOrBuilder(int index)
Output only. The cost of running the model deployment.
repeated .google.cloud.gkerecommender.v1.Cost cost = 5 [(.google.api.field_behavior) = OUTPUT_ONLY];
Parameter
| Name | Description |
| --- | --- |
| index | int |
public List<? extends CostOrBuilder> getCostOrBuilderList()
Output only. The cost of running the model deployment.
repeated .google.cloud.gkerecommender.v1.Cost cost = 5 [(.google.api.field_behavior) = OUTPUT_ONLY];
Returns
| Type | Description |
| --- | --- |
| List<? extends com.google.cloud.gkerecommender.v1.CostOrBuilder> | |
public PerformanceStats getDefaultInstanceForType()
public int getNtpotMilliseconds()
Output only. The Normalized Time Per Output Token (NTPOT) in milliseconds.
This is the request latency normalized by the number of output tokens,
measured as request_latency / total_output_tokens.
int32 ntpot_milliseconds = 3 [(.google.api.field_behavior) = OUTPUT_ONLY];
Returns
| Type | Description |
| --- | --- |
| int | The ntpotMilliseconds. |
public int getOutputTokensPerSecond()
Output only. The number of output tokens per second. This is the throughput
measured as total_output_tokens_generated_by_server /
elapsed_time_in_seconds.
int32 output_tokens_per_second = 2 [(.google.api.field_behavior) = OUTPUT_ONLY];
Returns
| Type | Description |
| --- | --- |
| int | The outputTokensPerSecond. |
public Parser<PerformanceStats> getParserForType()
Overrides
public float getQueriesPerSecond()
Output only. The number of queries per second.
Note: This metric can vary widely based on context length and may not be a
reliable measure of LLM throughput.
float queries_per_second = 1 [(.google.api.field_behavior) = OUTPUT_ONLY];
Returns
| Type | Description |
| --- | --- |
| float | The queriesPerSecond. |
public int getSerializedSize()
Returns
| Type | Description |
| --- | --- |
| int | |
Overrides
public int getTtftMilliseconds()
Output only. The Time To First Token (TTFT) in milliseconds. This is the
time it takes to generate the first token for a request.
int32 ttft_milliseconds = 4 [(.google.api.field_behavior) = OUTPUT_ONLY];
Returns
| Type | Description |
| --- | --- |
| int | The ttftMilliseconds. |
public int hashCode()
Returns
| Type | Description |
| --- | --- |
| int | |
Overrides
protected GeneratedMessageV3.FieldAccessorTable internalGetFieldAccessorTable()
Overrides
public final boolean isInitialized()
Overrides
public PerformanceStats.Builder newBuilderForType()
protected PerformanceStats.Builder newBuilderForType(GeneratedMessageV3.BuilderParent parent)
Overrides
protected Object newInstance(GeneratedMessageV3.UnusedPrivateParameter unused)
Returns
| Type | Description |
| --- | --- |
| Object | |
Overrides
public PerformanceStats.Builder toBuilder()
public void writeTo(CodedOutputStream output)
Overrides
Except as otherwise noted, the content of this page is licensed under the Creative Commons Attribution 4.0 License, and code samples are licensed under the Apache 2.0 License. For details, see the Google Developers Site Policies. Java is a registered trademark of Oracle and/or its affiliates.
Last updated 2025-12-17 UTC.
[[["Easy to understand","easyToUnderstand","thumb-up"],["Solved my problem","solvedMyProblem","thumb-up"],["Other","otherUp","thumb-up"]],[["Missing the information I need","missingTheInformationINeed","thumb-down"],["Too complicated / too many steps","tooComplicatedTooManySteps","thumb-down"],["Out of date","outOfDate","thumb-down"],["Samples / code issue","samplesCodeIssue","thumb-down"],["Other","otherDown","thumb-down"]],["Last updated 2025-12-17 UTC."],[],[]]