Package inference
Class ModelConfigOuterClass.ModelDynamicBatching
java.lang.Object
com.google.protobuf.AbstractMessageLite
com.google.protobuf.AbstractMessage
com.google.protobuf.GeneratedMessageV3
inference.ModelConfigOuterClass.ModelDynamicBatching
- All Implemented Interfaces:
com.google.protobuf.Message, com.google.protobuf.MessageLite, com.google.protobuf.MessageLiteOrBuilder, com.google.protobuf.MessageOrBuilder, ModelConfigOuterClass.ModelDynamicBatchingOrBuilder, Serializable
- Enclosing class:
ModelConfigOuterClass
public static final class ModelConfigOuterClass.ModelDynamicBatching
extends com.google.protobuf.GeneratedMessageV3
implements ModelConfigOuterClass.ModelDynamicBatchingOrBuilder
.. cpp:var:: message ModelDynamicBatching
Dynamic batching configuration. These settings control how dynamic batching operates for the model.
Protobuf type inference.ModelDynamicBatching
- See Also:
-
Nested Class Summary
Nested ClassesModifier and TypeClassDescriptionstatic final class@@ @@..Nested classes/interfaces inherited from class com.google.protobuf.GeneratedMessageV3
com.google.protobuf.GeneratedMessageV3.BuilderParent, com.google.protobuf.GeneratedMessageV3.ExtendableBuilder<MessageT extends com.google.protobuf.GeneratedMessageV3.ExtendableMessage<MessageT>,BuilderT extends com.google.protobuf.GeneratedMessageV3.ExtendableBuilder<MessageT, BuilderT>>, com.google.protobuf.GeneratedMessageV3.ExtendableMessage<MessageT extends com.google.protobuf.GeneratedMessageV3.ExtendableMessage<MessageT>>, com.google.protobuf.GeneratedMessageV3.ExtendableMessageOrBuilder<MessageT extends com.google.protobuf.GeneratedMessageV3.ExtendableMessage<MessageT>>, com.google.protobuf.GeneratedMessageV3.FieldAccessorTable, com.google.protobuf.GeneratedMessageV3.UnusedPrivateParameter Nested classes/interfaces inherited from class com.google.protobuf.AbstractMessageLite
com.google.protobuf.AbstractMessageLite.InternalOneOfEnum -
Field Summary
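Fields
Modifier and Type, Field, Description:
static final int DEFAULT_PRIORITY_LEVEL_FIELD_NUMBER
static final int DEFAULT_QUEUE_POLICY_FIELD_NUMBER
static final int MAX_QUEUE_DELAY_MICROSECONDS_FIELD_NUMBER
static final int PREFERRED_BATCH_SIZE_FIELD_NUMBER
static final int PRESERVE_ORDERING_FIELD_NUMBER
static final int PRIORITY_LEVELS_FIELD_NUMBER
static final int PRIORITY_QUEUE_POLICY_FIELD_NUMBER
Fields inherited from class com.google.protobuf.GeneratedMessageV3
alwaysUseFieldBuilders, unknownFields
Fields inherited from class com.google.protobuf.AbstractMessage
memoizedSize
Fields inherited from class com.google.protobuf.AbstractMessageLite
memoizedHashCode
-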
Method Summary
Modifier and TypeMethodDescriptionbooleancontainsPriorityQueuePolicy(long key) @@ ..booleanlong@@ ..@@ ..@@ ..static final com.google.protobuf.Descriptors.Descriptorlong@@ ..com.google.protobuf.Parser<ModelConfigOuterClass.ModelDynamicBatching> intgetPreferredBatchSize(int index) @@ ..int@@ ..@@ ..boolean@@ ..long@@ ..Deprecated.int@@ ..@@ ..getPriorityQueuePolicyOrDefault(long key, ModelConfigOuterClass.ModelQueuePolicy defaultValue) @@ ..getPriorityQueuePolicyOrThrow(long key) @@ ..intboolean@@ ..inthashCode()protected com.google.protobuf.GeneratedMessageV3.FieldAccessorTableprotected com.google.protobuf.MapFieldReflectionAccessorinternalGetMapFieldReflection(int number) final booleannewBuilderForType(com.google.protobuf.GeneratedMessageV3.BuilderParent parent) protected ObjectnewInstance(com.google.protobuf.GeneratedMessageV3.UnusedPrivateParameter unused) parseDelimitedFrom(InputStream input) parseDelimitedFrom(InputStream input, com.google.protobuf.ExtensionRegistryLite extensionRegistry) parseFrom(byte[] data) parseFrom(byte[] data, com.google.protobuf.ExtensionRegistryLite extensionRegistry) parseFrom(com.google.protobuf.ByteString data) parseFrom(com.google.protobuf.ByteString data, com.google.protobuf.ExtensionRegistryLite extensionRegistry) parseFrom(com.google.protobuf.CodedInputStream input) parseFrom(com.google.protobuf.CodedInputStream input, com.google.protobuf.ExtensionRegistryLite extensionRegistry) parseFrom(InputStream input) parseFrom(InputStream input, com.google.protobuf.ExtensionRegistryLite extensionRegistry) parseFrom(ByteBuffer data) parseFrom(ByteBuffer data, com.google.protobuf.ExtensionRegistryLite extensionRegistry) static com.google.protobuf.Parser<ModelConfigOuterClass.ModelDynamicBatching> parser()voidwriteTo(com.google.protobuf.CodedOutputStream output) Methods inherited from class com.google.protobuf.GeneratedMessageV3
canUseUnsafe, computeStringSize, computeStringSizeNoTag, emptyBooleanList, emptyDoubleList, emptyFloatList, emptyIntList, emptyList, emptyLongList, getAllFields, getDescriptorForType, getField, getOneofFieldDescriptor, getRepeatedField, getRepeatedFieldCount, getUnknownFields, hasField, hasOneof, internalGetMapField, isStringEmpty, makeExtensionsImmutable, makeMutableCopy, makeMutableCopy, mergeFromAndMakeImmutableInternal, mutableCopy, mutableCopy, mutableCopy, mutableCopy, mutableCopy, newBooleanList, newBuilderForType, newDoubleList, newFloatList, newIntList, newLongList, parseDelimitedWithIOException, parseDelimitedWithIOException, parseUnknownField, parseUnknownFieldProto3, parseWithIOException, parseWithIOException, parseWithIOException, parseWithIOException, serializeBooleanMapTo, serializeIntegerMapTo, serializeLongMapTo, serializeStringMapTo, writeReplace, writeString, writeStringNoTag
Methods inherited from class com.google.protobuf.AbstractMessage
findInitializationErrors, getInitializationErrorString, hashBoolean, hashEnum, hashEnumList, hashFields, hashLong, toString
Methods inherited from class com.google.protobuf.AbstractMessageLite
addAll, addAll, checkByteStringIsUtf8, toByteArray, toByteString, writeDelimitedTo, writeTo
Methods inherited from class java.lang.Object
clone, finalize, getClass, notify, notifyAll, wait, wait, wait
Methods inherited from interface com.google.protobuf.MessageLite
toByteArray, toByteString, writeDelimitedTo, writeTo
Methods inherited from interface com.google.protobuf.MessageOrBuilder
findInitializationErrors, getAllFields, getDescriptorForType, getField, getInitializationErrorString, getOneofFieldDescriptor, getRepeatedField, getRepeatedFieldCount, getUnknownFields, hasField, hasOneof
-
Field Details
-
PREFERRED_BATCH_SIZE_FIELD_NUMBER
public static final int PREFERRED_BATCH_SIZE_FIELD_NUMBER
- See Also:
-
MAX_QUEUE_DELAY_MICROSECONDS_FIELD_NUMBER
public static final int MAX_QUEUE_DELAY_MICROSECONDS_FIELD_NUMBER
- See Also:
-
PRESERVE_ORDERING_FIELD_NUMBER
public static final int PRESERVE_ORDERING_FIELD_NUMBER
- See Also:
-
PRIORITY_LEVELS_FIELD_NUMBER
public static final int PRIORITY_LEVELS_FIELD_NUMBER
- See Also:
-
DEFAULT_PRIORITY_LEVEL_FIELD_NUMBER
public static final int DEFAULT_PRIORITY_LEVEL_FIELD_NUMBER
- See Also:
-
DEFAULT_QUEUE_POLICY_FIELD_NUMBER
public static final int DEFAULT_QUEUE_POLICY_FIELD_NUMBER
- See Also:
-
PRIORITY_QUEUE_POLICY_FIELD_NUMBER
public static final int PRIORITY_QUEUE_POLICY_FIELD_NUMBER
- See Also:
-
-
Method Details
-
newInstance
- Overrides:
newInstance in class com.google.protobuf.GeneratedMessageV3
-
getDescriptor
public static final com.google.protobuf.Descriptors.Descriptor getDescriptor() -
internalGetMapFieldReflection
protected com.google.protobuf.MapFieldReflectionAccessor internalGetMapFieldReflection(int number)
- Overrides:
internalGetMapFieldReflection in class com.google.protobuf.GeneratedMessageV3
-
internalGetFieldAccessorTable
protected com.google.protobuf.GeneratedMessageV3.FieldAccessorTable internalGetFieldAccessorTable()
- Specified by:
internalGetFieldAccessorTable in class com.google.protobuf.GeneratedMessageV3
-
getPreferredBatchSizeList
.. cpp:var:: int32 preferred_batch_size (repeated)
Preferred batch sizes for dynamic batching. If a batch of one of these sizes can be formed, it will be executed immediately. If not specified, a preferred batch size will be chosen automatically based on model and GPU characteristics.
repeated int32 preferred_batch_size = 1;
- Specified by:
getPreferredBatchSizeList in interface ModelConfigOuterClass.ModelDynamicBatchingOrBuilder
- Returns:
A list containing the preferredBatchSize.
-
getPreferredBatchSizeCount
public int getPreferredBatchSizeCount()
.. cpp:var:: int32 preferred_batch_size (repeated)
Preferred batch sizes for dynamic batching. If a batch of one of these sizes can be formed, it will be executed immediately. If not specified, a preferred batch size will be chosen automatically based on model and GPU characteristics.
repeated int32 preferred_batch_size = 1;
- Specified by:
getPreferredBatchSizeCount in interface ModelConfigOuterClass.ModelDynamicBatchingOrBuilder
- Returns:
The count of preferredBatchSize.
-
getPreferredBatchSize
public int getPreferredBatchSize(int index)
.. cpp:var:: int32 preferred_batch_size (repeated)
Preferred batch sizes for dynamic batching. If a batch of one of these sizes can be formed, it will be executed immediately. If not specified, a preferred batch size will be chosen automatically based on model and GPU characteristics.
repeated int32 preferred_batch_size = 1;
- Specified by:
getPreferredBatchSize in interface ModelConfigOuterClass.ModelDynamicBatchingOrBuilder
- Parameters:
index - The index of the element to return.
- Returns:
The preferredBatchSize at the given index.
-
getMaxQueueDelayMicroseconds
public long getMaxQueueDelayMicroseconds()
.. cpp:var:: uint64 max_queue_delay_microseconds
The maximum time, in microseconds, a request will be delayed in the scheduling queue to wait for additional requests for batching. Default is 0.
uint64 max_queue_delay_microseconds = 2;
- Specified by:
getMaxQueueDelayMicroseconds in interface ModelConfigOuterClass.ModelDynamicBatchingOrBuilder
- Returns:
The maxQueueDelayMicroseconds.
-
getPreserveOrdering
public boolean getPreserveOrdering()
.. cpp:var:: bool preserve_ordering
Should the dynamic batcher preserve the ordering of responses to match the order of requests received by the scheduler. Default is false. If true, the responses will be returned in the same order as the order of requests sent to the scheduler. If false, the responses may be returned in arbitrary order. This option is specifically needed when a sequence of related inference requests (i.e. inference requests with the same correlation ID) are sent to the dynamic batcher to ensure that the sequence responses are in the correct order.
bool preserve_ordering = 3;
- Specified by:
getPreserveOrdering in interface ModelConfigOuterClass.ModelDynamicBatchingOrBuilder
- Returns:
The preserveOrdering.
-
getPriorityLevels
public long getPriorityLevels()
.. cpp:var:: uint64 priority_levels
The number of priority levels to be enabled for the model. Priority levels start from 1, and 1 is the highest priority. Requests are handled in priority order with all priority 1 requests processed before priority 2, all priority 2 requests processed before priority 3, etc. Requests with the same priority level will be handled in the order that they are received.
uint64 priority_levels = 4;
- Specified by:
getPriorityLevels in interface ModelConfigOuterClass.ModelDynamicBatchingOrBuilder
- Returns:
The priorityLevels.
-
getDefaultPriorityLevel
public long getDefaultPriorityLevel()
.. cpp:var:: uint64 default_priority_level
The priority level used for requests that don't specify their priority. The value must be in the range [1, 'priority_levels'].
uint64 default_priority_level = 5;
- Specified by:
getDefaultPriorityLevel in interface ModelConfigOuterClass.ModelDynamicBatchingOrBuilder
- Returns:
The defaultPriorityLevel.
-
hasDefaultQueuePolicy
public boolean hasDefaultQueuePolicy()
.. cpp:var:: ModelQueuePolicy default_queue_policy
The default queue policy used for requests that don't require priority handling and requests that specify priority levels where there is no specific policy given. If not specified, a policy with default field values will be used.
.inference.ModelQueuePolicy default_queue_policy = 6;
- Specified by:
hasDefaultQueuePolicy in interface ModelConfigOuterClass.ModelDynamicBatchingOrBuilder
- Returns:
Whether the defaultQueuePolicy field is set.
-
getDefaultQueuePolicy
.. cpp:var:: ModelQueuePolicy default_queue_policy
The default queue policy used for requests that don't require priority handling and requests that specify priority levels where there is no specific policy given. If not specified, a policy with default field values will be used.
.inference.ModelQueuePolicy default_queue_policy = 6;
- Specified by:
getDefaultQueuePolicy in interface ModelConfigOuterClass.ModelDynamicBatchingOrBuilder
- Returns:
The defaultQueuePolicy.
-
getDefaultQueuePolicyOrBuilder
.. cpp:var:: ModelQueuePolicy default_queue_policy
The default queue policy used for requests that don't require priority handling and requests that specify priority levels where there is no specific policy given. If not specified, a policy with default field values will be used.
.inference.ModelQueuePolicy default_queue_policy = 6;
- Specified by:
getDefaultQueuePolicyOrBuilder in interface ModelConfigOuterClass.ModelDynamicBatchingOrBuilder
-
getPriorityQueuePolicyCount
public int getPriorityQueuePolicyCount()
Description copied from interface: ModelConfigOuterClass.ModelDynamicBatchingOrBuilder
.. cpp:var:: map<uint64, ModelQueuePolicy> priority_queue_policy
Specify the queue policy for the priority level. The default queue policy will be used if a priority level doesn't specify a queue policy.
map<uint64, .inference.ModelQueuePolicy> priority_queue_policy = 7;
- Specified by:
getPriorityQueuePolicyCount in interface ModelConfigOuterClass.ModelDynamicBatchingOrBuilder
-
containsPriorityQueuePolicy
public boolean containsPriorityQueuePolicy(long key)
.. cpp:var:: map<uint64, ModelQueuePolicy> priority_queue_policy
Specify the queue policy for the priority level. The default queue policy will be used if a priority level doesn't specify a queue policy.
map<uint64, .inference.ModelQueuePolicy> priority_queue_policy = 7;
- Specified by:
containsPriorityQueuePolicy in interface ModelConfigOuterClass.ModelDynamicBatchingOrBuilder
-
getPriorityQueuePolicy
Deprecated. Use getPriorityQueuePolicyMap() instead.
- Specified by:
getPriorityQueuePolicy in interface ModelConfigOuterClass.ModelDynamicBatchingOrBuilder
-
getPriorityQueuePolicyMap
.. cpp:var:: map<uint64, ModelQueuePolicy> priority_queue_policy
Specify the queue policy for the priority level. The default queue policy will be used if a priority level doesn't specify a queue policy.
map<uint64, .inference.ModelQueuePolicy> priority_queue_policy = 7;
- Specified by:
getPriorityQueuePolicyMap in interface ModelConfigOuterClass.ModelDynamicBatchingOrBuilder
-
getPriorityQueuePolicyOrDefault
public ModelConfigOuterClass.ModelQueuePolicy getPriorityQueuePolicyOrDefault(long key, ModelConfigOuterClass.ModelQueuePolicy defaultValue)
.. cpp:var:: map<uint64, ModelQueuePolicy> priority_queue_policy
Specify the queue policy for the priority level. The default queue policy will be used if a priority level doesn't specify a queue policy.
map<uint64, .inference.ModelQueuePolicy> priority_queue_policy = 7;
- Specified by:
getPriorityQueuePolicyOrDefault in interface ModelConfigOuterClass.ModelDynamicBatchingOrBuilder
-
getPriorityQueuePolicyOrThrow
.. cpp:var:: map<uint64, ModelQueuePolicy> priority_queue_policy
Specify the queue policy for the priority level. The default queue policy will be used if a priority level doesn't specify a queue policy.
map<uint64, .inference.ModelQueuePolicy> priority_queue_policy = 7;
- Specified by:
getPriorityQueuePolicyOrThrow in interface ModelConfigOuterClass.ModelDynamicBatchingOrBuilder
-
isInitialized
public final boolean isInitialized()
- Specified by:
isInitialized in interface com.google.protobuf.MessageLiteOrBuilder
- Overrides:
isInitialized in class com.google.protobuf.GeneratedMessageV3
-
writeTo
- Specified by:
writeTo in interface com.google.protobuf.MessageLite
- Overrides:
writeTo in class com.google.protobuf.GeneratedMessageV3
- Throws:
IOException
-
getSerializedSize
public int getSerializedSize()
- Specified by:
getSerializedSize in interface com.google.protobuf.MessageLite
- Overrides:
getSerializedSize in class com.google.protobuf.GeneratedMessageV3
-
equals
- Specified by:
equals in interface com.google.protobuf.Message
- Overrides:
equals in class com.google.protobuf.AbstractMessage
-
hashCode
public int hashCode()
- Specified by:
hashCode in interface com.google.protobuf.Message
- Overrides:
hashCode in class com.google.protobuf.AbstractMessage
-
parseFrom
public static ModelConfigOuterClass.ModelDynamicBatching parseFrom(ByteBuffer data) throws com.google.protobuf.InvalidProtocolBufferException - Throws:
com.google.protobuf.InvalidProtocolBufferException
-
parseFrom
public static ModelConfigOuterClass.ModelDynamicBatching parseFrom(ByteBuffer data, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws com.google.protobuf.InvalidProtocolBufferException - Throws:
com.google.protobuf.InvalidProtocolBufferException
-
parseFrom
public static ModelConfigOuterClass.ModelDynamicBatching parseFrom(com.google.protobuf.ByteString data) throws com.google.protobuf.InvalidProtocolBufferException - Throws:
com.google.protobuf.InvalidProtocolBufferException
-
parseFrom
public static ModelConfigOuterClass.ModelDynamicBatching parseFrom(com.google.protobuf.ByteString data, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws com.google.protobuf.InvalidProtocolBufferException - Throws:
com.google.protobuf.InvalidProtocolBufferException
-
parseFrom
public static ModelConfigOuterClass.ModelDynamicBatching parseFrom(byte[] data) throws com.google.protobuf.InvalidProtocolBufferException - Throws:
com.google.protobuf.InvalidProtocolBufferException
-
parseFrom
public static ModelConfigOuterClass.ModelDynamicBatching parseFrom(byte[] data, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws com.google.protobuf.InvalidProtocolBufferException - Throws:
com.google.protobuf.InvalidProtocolBufferException
-
parseFrom
public static ModelConfigOuterClass.ModelDynamicBatching parseFrom(InputStream input) throws IOException - Throws:
IOException
-
parseFrom
public static ModelConfigOuterClass.ModelDynamicBatching parseFrom(InputStream input, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws IOException - Throws:
IOException
-
parseDelimitedFrom
public static ModelConfigOuterClass.ModelDynamicBatching parseDelimitedFrom(InputStream input) throws IOException - Throws:
IOException
-
parseDelimitedFrom
public static ModelConfigOuterClass.ModelDynamicBatching parseDelimitedFrom(InputStream input, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws IOException - Throws:
IOException
-
parseFrom
public static ModelConfigOuterClass.ModelDynamicBatching parseFrom(com.google.protobuf.CodedInputStream input) throws IOException - Throws:
IOException
-
parseFrom
public static ModelConfigOuterClass.ModelDynamicBatching parseFrom(com.google.protobuf.CodedInputStream input, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws IOException - Throws:
IOException
-
newBuilderForType
- Specified by:
newBuilderForType in interface com.google.protobuf.Message
- Specified by:
newBuilderForType in interface com.google.protobuf.MessageLite
-
newBuilder
-
newBuilder
public static ModelConfigOuterClass.ModelDynamicBatching.Builder newBuilder(ModelConfigOuterClass.ModelDynamicBatching prototype) -
toBuilder
- Specified by:
toBuilder in interface com.google.protobuf.Message
- Specified by:
toBuilder in interface com.google.protobuf.MessageLite
-
newBuilderForType
protected ModelConfigOuterClass.ModelDynamicBatching.Builder newBuilderForType(com.google.protobuf.GeneratedMessageV3.BuilderParent parent)
- Specified by:
newBuilderForType in class com.google.protobuf.GeneratedMessageV3
-
getDefaultInstance
-
parser
-
getParserForType
- Specified by:
getParserForType in interface com.google.protobuf.Message
- Specified by:
getParserForType in interface com.google.protobuf.MessageLite
- Overrides:
getParserForType in class com.google.protobuf.GeneratedMessageV3
-
getDefaultInstanceForType
- Specified by:
getDefaultInstanceForType in interface com.google.protobuf.MessageLiteOrBuilder
- Specified by:
getDefaultInstanceForType in interface com.google.protobuf.MessageOrBuilder
-