Package inference
Class ModelConfigOuterClass.ModelOptimizationPolicy.Cuda
java.lang.Object
com.google.protobuf.AbstractMessageLite
com.google.protobuf.AbstractMessage
com.google.protobuf.GeneratedMessageV3
inference.ModelConfigOuterClass.ModelOptimizationPolicy.Cuda
- All Implemented Interfaces:
com.google.protobuf.Message,com.google.protobuf.MessageLite,com.google.protobuf.MessageLiteOrBuilder,com.google.protobuf.MessageOrBuilder,ModelConfigOuterClass.ModelOptimizationPolicy.CudaOrBuilder,Serializable
- Enclosing class:
ModelConfigOuterClass.ModelOptimizationPolicy
public static final class ModelConfigOuterClass.ModelOptimizationPolicy.Cuda
extends com.google.protobuf.GeneratedMessageV3
implements ModelConfigOuterClass.ModelOptimizationPolicy.CudaOrBuilder
CUDA-specific optimization settings (protobuf message Cuda).
Protobuf type inference.ModelOptimizationPolicy.Cuda
- See Also:
-
Nested Class Summary
Nested ClassesModifier and TypeClassDescriptionstatic final class@@ @@ ..static final class@@ ..static interfaceNested classes/interfaces inherited from class com.google.protobuf.GeneratedMessageV3
com.google.protobuf.GeneratedMessageV3.BuilderParent, com.google.protobuf.GeneratedMessageV3.ExtendableBuilder<MessageT extends com.google.protobuf.GeneratedMessageV3.ExtendableMessage<MessageT>,BuilderT extends com.google.protobuf.GeneratedMessageV3.ExtendableBuilder<MessageT, BuilderT>>, com.google.protobuf.GeneratedMessageV3.ExtendableMessage<MessageT extends com.google.protobuf.GeneratedMessageV3.ExtendableMessage<MessageT>>, com.google.protobuf.GeneratedMessageV3.ExtendableMessageOrBuilder<MessageT extends com.google.protobuf.GeneratedMessageV3.ExtendableMessage<MessageT>>, com.google.protobuf.GeneratedMessageV3.FieldAccessorTable, com.google.protobuf.GeneratedMessageV3.UnusedPrivateParameter Nested classes/interfaces inherited from class com.google.protobuf.AbstractMessageLite
com.google.protobuf.AbstractMessageLite.InternalOneOfEnum -
Field Summary
Fields
Modifier and Type / Field / Description
static final int GRAPHS_FIELD_NUMBER
static final int BUSY_WAIT_EVENTS_FIELD_NUMBER
static final int GRAPH_SPEC_FIELD_NUMBER
static final int OUTPUT_COPY_STREAM_FIELD_NUMBER
Fields inherited from class com.google.protobuf.GeneratedMessageV3
alwaysUseFieldBuilders, unknownFields
Fields inherited from class com.google.protobuf.AbstractMessage
memoizedSize
Fields inherited from class com.google.protobuf.AbstractMessageLite
memoizedHashCode
-
Method Summary
Modifier and TypeMethodDescriptionbooleanboolean@@ ..static final com.google.protobuf.Descriptors.Descriptorboolean@@ ..getGraphSpec(int index) @@ ..int@@ ..@@ ..getGraphSpecOrBuilder(int index) @@ ..@@ ..boolean@@ ..com.google.protobuf.Parser<ModelConfigOuterClass.ModelOptimizationPolicy.Cuda> intinthashCode()protected com.google.protobuf.GeneratedMessageV3.FieldAccessorTablefinal booleannewBuilderForType(com.google.protobuf.GeneratedMessageV3.BuilderParent parent) protected ObjectnewInstance(com.google.protobuf.GeneratedMessageV3.UnusedPrivateParameter unused) parseDelimitedFrom(InputStream input) parseDelimitedFrom(InputStream input, com.google.protobuf.ExtensionRegistryLite extensionRegistry) parseFrom(byte[] data) parseFrom(byte[] data, com.google.protobuf.ExtensionRegistryLite extensionRegistry) parseFrom(com.google.protobuf.ByteString data) parseFrom(com.google.protobuf.ByteString data, com.google.protobuf.ExtensionRegistryLite extensionRegistry) parseFrom(com.google.protobuf.CodedInputStream input) parseFrom(com.google.protobuf.CodedInputStream input, com.google.protobuf.ExtensionRegistryLite extensionRegistry) parseFrom(InputStream input) parseFrom(InputStream input, com.google.protobuf.ExtensionRegistryLite extensionRegistry) parseFrom(ByteBuffer data) parseFrom(ByteBuffer data, com.google.protobuf.ExtensionRegistryLite extensionRegistry) static com.google.protobuf.Parser<ModelConfigOuterClass.ModelOptimizationPolicy.Cuda> parser()voidwriteTo(com.google.protobuf.CodedOutputStream output) Methods inherited from class com.google.protobuf.GeneratedMessageV3
canUseUnsafe, computeStringSize, computeStringSizeNoTag, emptyBooleanList, emptyDoubleList, emptyFloatList, emptyIntList, emptyList, emptyLongList, getAllFields, getDescriptorForType, getField, getOneofFieldDescriptor, getRepeatedField, getRepeatedFieldCount, getUnknownFields, hasField, hasOneof, internalGetMapField, internalGetMapFieldReflection, isStringEmpty, makeExtensionsImmutable, makeMutableCopy, makeMutableCopy, mergeFromAndMakeImmutableInternal, mutableCopy, mutableCopy, mutableCopy, mutableCopy, mutableCopy, newBooleanList, newBuilderForType, newDoubleList, newFloatList, newIntList, newLongList, parseDelimitedWithIOException, parseDelimitedWithIOException, parseUnknownField, parseUnknownFieldProto3, parseWithIOException, parseWithIOException, parseWithIOException, parseWithIOException, serializeBooleanMapTo, serializeIntegerMapTo, serializeLongMapTo, serializeStringMapTo, writeReplace, writeString, writeStringNoTag
Methods inherited from class com.google.protobuf.AbstractMessage
findInitializationErrors, getInitializationErrorString, hashBoolean, hashEnum, hashEnumList, hashFields, hashLong, toString
Methods inherited from class com.google.protobuf.AbstractMessageLite
addAll, addAll, checkByteStringIsUtf8, toByteArray, toByteString, writeDelimitedTo, writeTo
Methods inherited from class java.lang.Object
clone, finalize, getClass, notify, notifyAll, wait, wait, wait
Methods inherited from interface com.google.protobuf.MessageLite
toByteArray, toByteString, writeDelimitedTo, writeTo
Methods inherited from interface com.google.protobuf.MessageOrBuilder
findInitializationErrors, getAllFields, getDescriptorForType, getField, getInitializationErrorString, getOneofFieldDescriptor, getRepeatedField, getRepeatedFieldCount, getUnknownFields, hasField, hasOneof
-
Field Details
-
GRAPHS_FIELD_NUMBER
public static final int GRAPHS_FIELD_NUMBER- See Also:
-
BUSY_WAIT_EVENTS_FIELD_NUMBER
public static final int BUSY_WAIT_EVENTS_FIELD_NUMBER- See Also:
-
GRAPH_SPEC_FIELD_NUMBER
public static final int GRAPH_SPEC_FIELD_NUMBER- See Also:
-
OUTPUT_COPY_STREAM_FIELD_NUMBER
public static final int OUTPUT_COPY_STREAM_FIELD_NUMBER- See Also:
-
-
Method Details
-
newInstance
- Overrides:
newInstance in class com.google.protobuf.GeneratedMessageV3
-
getDescriptor
public static final com.google.protobuf.Descriptors.Descriptor getDescriptor() -
internalGetFieldAccessorTable
protected com.google.protobuf.GeneratedMessageV3.FieldAccessorTable internalGetFieldAccessorTable()
- Specified by:
internalGetFieldAccessorTable in class com.google.protobuf.GeneratedMessageV3
-
getGraphs
public boolean getGraphs()
Use the CUDA graphs API to capture model operations and execute them more efficiently. Default value is false. Currently only recognized by the TensorRT backend.
bool graphs = 1;
- Specified by:
getGraphs in interface ModelConfigOuterClass.ModelOptimizationPolicy.CudaOrBuilder
- Returns:
The graphs.
-
getBusyWaitEvents
public boolean getBusyWaitEvents()
Use busy-waiting to synchronize CUDA events, minimizing the latency between event completion and notification of the host thread, at the cost of high CPU load. Default value is false. Currently only recognized by the TensorRT backend.
bool busy_wait_events = 2;
- Specified by:
getBusyWaitEvents in interface ModelConfigOuterClass.ModelOptimizationPolicy.CudaOrBuilder
- Returns:
The busyWaitEvents.
-
getGraphSpecList
Specification of the CUDA graph to be captured (repeated field graph_spec). If not specified and 'graphs' is true, the default CUDA graphs will be captured based on model settings. Currently only recognized by the TensorRT backend.
repeated .inference.ModelOptimizationPolicy.Cuda.GraphSpec graph_spec = 3;
- Specified by:
getGraphSpecList in interface ModelConfigOuterClass.ModelOptimizationPolicy.CudaOrBuilder
-
getGraphSpecOrBuilderList
public List<? extends ModelConfigOuterClass.ModelOptimizationPolicy.Cuda.GraphSpecOrBuilder> getGraphSpecOrBuilderList()
Specification of the CUDA graph to be captured (repeated field graph_spec). If not specified and 'graphs' is true, the default CUDA graphs will be captured based on model settings. Currently only recognized by the TensorRT backend.
repeated .inference.ModelOptimizationPolicy.Cuda.GraphSpec graph_spec = 3;
- Specified by:
getGraphSpecOrBuilderList in interface ModelConfigOuterClass.ModelOptimizationPolicy.CudaOrBuilder
-
getGraphSpecCount
public int getGraphSpecCount()
Specification of the CUDA graph to be captured (repeated field graph_spec). If not specified and 'graphs' is true, the default CUDA graphs will be captured based on model settings. Currently only recognized by the TensorRT backend.
repeated .inference.ModelOptimizationPolicy.Cuda.GraphSpec graph_spec = 3;
- Specified by:
getGraphSpecCount in interface ModelConfigOuterClass.ModelOptimizationPolicy.CudaOrBuilder
-
getGraphSpec
Specification of the CUDA graph to be captured (repeated field graph_spec). If not specified and 'graphs' is true, the default CUDA graphs will be captured based on model settings. Currently only recognized by the TensorRT backend.
repeated .inference.ModelOptimizationPolicy.Cuda.GraphSpec graph_spec = 3;
- Specified by:
getGraphSpec in interface ModelConfigOuterClass.ModelOptimizationPolicy.CudaOrBuilder
-
getGraphSpecOrBuilder
public ModelConfigOuterClass.ModelOptimizationPolicy.Cuda.GraphSpecOrBuilder getGraphSpecOrBuilder(int index)
Specification of the CUDA graph to be captured (repeated field graph_spec). If not specified and 'graphs' is true, the default CUDA graphs will be captured based on model settings. Currently only recognized by the TensorRT backend.
repeated .inference.ModelOptimizationPolicy.Cuda.GraphSpec graph_spec = 3;
- Specified by:
getGraphSpecOrBuilder in interface ModelConfigOuterClass.ModelOptimizationPolicy.CudaOrBuilder
-
getOutputCopyStream
public boolean getOutputCopyStream()
Use a CUDA stream separate from the inference stream to copy the output to the host. Be aware that setting this option to true increases the memory consumption of the model, because Triton will allocate twice as much GPU memory for its I/O tensor buffers. Default value is false. Currently only recognized by the TensorRT backend.
bool output_copy_stream = 4;
- Specified by:
getOutputCopyStream in interface ModelConfigOuterClass.ModelOptimizationPolicy.CudaOrBuilder
- Returns:
The outputCopyStream.
-
isInitialized
public final boolean isInitialized()
- Specified by:
isInitialized in interface com.google.protobuf.MessageLiteOrBuilder
- Overrides:
isInitialized in class com.google.protobuf.GeneratedMessageV3
-
writeTo
- Specified by:
writeTo in interface com.google.protobuf.MessageLite
- Overrides:
writeTo in class com.google.protobuf.GeneratedMessageV3
- Throws:
IOException
-
getSerializedSize
public int getSerializedSize()
- Specified by:
getSerializedSize in interface com.google.protobuf.MessageLite
- Overrides:
getSerializedSize in class com.google.protobuf.GeneratedMessageV3
-
equals
- Specified by:
equals in interface com.google.protobuf.Message
- Overrides:
equals in class com.google.protobuf.AbstractMessage
-
hashCode
public int hashCode()
- Specified by:
hashCode in interface com.google.protobuf.Message
- Overrides:
hashCode in class com.google.protobuf.AbstractMessage
-
parseFrom
public static ModelConfigOuterClass.ModelOptimizationPolicy.Cuda parseFrom(ByteBuffer data) throws com.google.protobuf.InvalidProtocolBufferException - Throws:
com.google.protobuf.InvalidProtocolBufferException
-
parseFrom
public static ModelConfigOuterClass.ModelOptimizationPolicy.Cuda parseFrom(ByteBuffer data, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws com.google.protobuf.InvalidProtocolBufferException - Throws:
com.google.protobuf.InvalidProtocolBufferException
-
parseFrom
public static ModelConfigOuterClass.ModelOptimizationPolicy.Cuda parseFrom(com.google.protobuf.ByteString data) throws com.google.protobuf.InvalidProtocolBufferException - Throws:
com.google.protobuf.InvalidProtocolBufferException
-
parseFrom
public static ModelConfigOuterClass.ModelOptimizationPolicy.Cuda parseFrom(com.google.protobuf.ByteString data, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws com.google.protobuf.InvalidProtocolBufferException - Throws:
com.google.protobuf.InvalidProtocolBufferException
-
parseFrom
public static ModelConfigOuterClass.ModelOptimizationPolicy.Cuda parseFrom(byte[] data) throws com.google.protobuf.InvalidProtocolBufferException - Throws:
com.google.protobuf.InvalidProtocolBufferException
-
parseFrom
public static ModelConfigOuterClass.ModelOptimizationPolicy.Cuda parseFrom(byte[] data, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws com.google.protobuf.InvalidProtocolBufferException - Throws:
com.google.protobuf.InvalidProtocolBufferException
-
parseFrom
public static ModelConfigOuterClass.ModelOptimizationPolicy.Cuda parseFrom(InputStream input) throws IOException - Throws:
IOException
-
parseFrom
public static ModelConfigOuterClass.ModelOptimizationPolicy.Cuda parseFrom(InputStream input, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws IOException - Throws:
IOException
-
parseDelimitedFrom
public static ModelConfigOuterClass.ModelOptimizationPolicy.Cuda parseDelimitedFrom(InputStream input) throws IOException - Throws:
IOException
-
parseDelimitedFrom
public static ModelConfigOuterClass.ModelOptimizationPolicy.Cuda parseDelimitedFrom(InputStream input, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws IOException - Throws:
IOException
-
parseFrom
public static ModelConfigOuterClass.ModelOptimizationPolicy.Cuda parseFrom(com.google.protobuf.CodedInputStream input) throws IOException - Throws:
IOException
-
parseFrom
public static ModelConfigOuterClass.ModelOptimizationPolicy.Cuda parseFrom(com.google.protobuf.CodedInputStream input, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws IOException - Throws:
IOException
-
newBuilderForType
- Specified by:
newBuilderForType in interface com.google.protobuf.Message
- Specified by:
newBuilderForType in interface com.google.protobuf.MessageLite
-
newBuilder
-
newBuilder
public static ModelConfigOuterClass.ModelOptimizationPolicy.Cuda.Builder newBuilder(ModelConfigOuterClass.ModelOptimizationPolicy.Cuda prototype) -
toBuilder
- Specified by:
toBuilder in interface com.google.protobuf.Message
- Specified by:
toBuilder in interface com.google.protobuf.MessageLite
-
newBuilderForType
protected ModelConfigOuterClass.ModelOptimizationPolicy.Cuda.Builder newBuilderForType(com.google.protobuf.GeneratedMessageV3.BuilderParent parent)
- Specified by:
newBuilderForType in class com.google.protobuf.GeneratedMessageV3
-
getDefaultInstance
-
parser
public static com.google.protobuf.Parser<ModelConfigOuterClass.ModelOptimizationPolicy.Cuda> parser() -
getParserForType
public com.google.protobuf.Parser<ModelConfigOuterClass.ModelOptimizationPolicy.Cuda> getParserForType()
- Specified by:
getParserForType in interface com.google.protobuf.Message
- Specified by:
getParserForType in interface com.google.protobuf.MessageLite
- Overrides:
getParserForType in class com.google.protobuf.GeneratedMessageV3
-
getDefaultInstanceForType
- Specified by:
getDefaultInstanceForType in interface com.google.protobuf.MessageLiteOrBuilder
- Specified by:
getDefaultInstanceForType in interface com.google.protobuf.MessageOrBuilder
-