Package inference

Class ModelConfigOuterClass.ModelInstanceGroup

java.lang.Object
com.google.protobuf.AbstractMessageLite
com.google.protobuf.AbstractMessage
com.google.protobuf.GeneratedMessageV3
inference.ModelConfigOuterClass.ModelInstanceGroup
All Implemented Interfaces:
com.google.protobuf.Message, com.google.protobuf.MessageLite, com.google.protobuf.MessageLiteOrBuilder, com.google.protobuf.MessageOrBuilder, ModelConfigOuterClass.ModelInstanceGroupOrBuilder, Serializable
Enclosing class:
ModelConfigOuterClass

public static final class ModelConfigOuterClass.ModelInstanceGroup extends com.google.protobuf.GeneratedMessageV3 implements ModelConfigOuterClass.ModelInstanceGroupOrBuilder
@@
@@.. cpp:var:: message ModelInstanceGroup
@@
@@   A group of one or more instances of a model and resources made
@@   available for those instances.
@@
 
Protobuf type inference.ModelInstanceGroup
See Also:
  • Serialized Form
  • Field Details

  • Method Details

    • newInstance

      protected Object newInstance(com.google.protobuf.GeneratedMessageV3.UnusedPrivateParameter unused)
      Overrides:
      newInstance in class com.google.protobuf.GeneratedMessageV3
    • getDescriptor

      public static final com.google.protobuf.Descriptors.Descriptor getDescriptor()
    • internalGetFieldAccessorTable

      protected com.google.protobuf.GeneratedMessageV3.FieldAccessorTable internalGetFieldAccessorTable()
      Specified by:
      internalGetFieldAccessorTable in class com.google.protobuf.GeneratedMessageV3
    • getName

      public String getName()
      @@  .. cpp:var:: string name
      @@
      @@     Optional name of this group of instances. If not specified the
      @@     name will be formed as <model name>_<group number>. The name of
      @@     individual instances will be further formed by a unique instance
      @@     number and GPU index.
      @@
       
      string name = 1;
      Specified by:
      getName in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
      Returns:
      The name.
    • getNameBytes

      public com.google.protobuf.ByteString getNameBytes()
      @@  .. cpp:var:: string name
      @@
      @@     Optional name of this group of instances. If not specified the
      @@     name will be formed as <model name>_<group number>. The name of
      @@     individual instances will be further formed by a unique instance
      @@     number and GPU index.
      @@
       
      string name = 1;
      Specified by:
      getNameBytes in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
      Returns:
      The bytes for name.
    • getKindValue

      public int getKindValue()
      @@  .. cpp:var:: Kind kind
      @@
      @@     The kind of this instance group. Default is KIND_AUTO. If
      @@     KIND_AUTO or KIND_GPU then both 'count' and 'gpu' are valid and
      @@     may be specified. If KIND_CPU or KIND_MODEL only 'count' is valid
      @@     and 'gpu' cannot be specified.
      @@
       
      .inference.ModelInstanceGroup.Kind kind = 4;
      Specified by:
      getKindValue in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
      Returns:
      The enum numeric value on the wire for kind.
    • getKind

      public ModelConfigOuterClass.ModelInstanceGroup.Kind getKind()
      @@  .. cpp:var:: Kind kind
      @@
      @@     The kind of this instance group. Default is KIND_AUTO. If
      @@     KIND_AUTO or KIND_GPU then both 'count' and 'gpu' are valid and
      @@     may be specified. If KIND_CPU or KIND_MODEL only 'count' is valid
      @@     and 'gpu' cannot be specified.
      @@
       
      .inference.ModelInstanceGroup.Kind kind = 4;
      Specified by:
      getKind in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
      Returns:
      The kind.
    • getCount

      public int getCount()
      @@  .. cpp:var:: int32 count
      @@
      @@     For a group assigned to GPU, the number of instances created for
      @@     each GPU listed in 'gpus'. For a group assigned to CPU the number
      @@     of instances created. Default is 1.
       
      int32 count = 2;
      Specified by:
      getCount in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
      Returns:
      The count.
    • hasRateLimiter

      public boolean hasRateLimiter()
      @@  .. cpp:var:: ModelRateLimiter rate_limiter
      @@
      @@     The rate limiter specific settings to be associated with this
      @@     instance group. Optional; if not specified, no rate limiting
      @@     will be applied to this instance group.
      @@
       
      .inference.ModelRateLimiter rate_limiter = 6;
      Specified by:
      hasRateLimiter in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
      Returns:
      Whether the rateLimiter field is set.
    • getRateLimiter

      public ModelConfigOuterClass.ModelRateLimiter getRateLimiter()
      @@  .. cpp:var:: ModelRateLimiter rate_limiter
      @@
      @@     The rate limiter specific settings to be associated with this
      @@     instance group. Optional; if not specified, no rate limiting
      @@     will be applied to this instance group.
      @@
       
      .inference.ModelRateLimiter rate_limiter = 6;
      Specified by:
      getRateLimiter in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
      Returns:
      The rateLimiter.
    • getRateLimiterOrBuilder

      public ModelConfigOuterClass.ModelRateLimiterOrBuilder getRateLimiterOrBuilder()
      @@  .. cpp:var:: ModelRateLimiter rate_limiter
      @@
      @@     The rate limiter specific settings to be associated with this
      @@     instance group. Optional; if not specified, no rate limiting
      @@     will be applied to this instance group.
      @@
       
      .inference.ModelRateLimiter rate_limiter = 6;
      Specified by:
      getRateLimiterOrBuilder in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
    • getGpusList

      public List<Integer> getGpusList()
      @@  .. cpp:var:: int32 gpus (repeated)
      @@
      @@     GPU(s) where instances should be available. For each GPU listed,
      @@     'count' instances of the model will be available. Setting 'gpus'
      @@     to empty (or not specifying at all) is equivalent to listing all
      @@     available GPUs.
      @@
       
      repeated int32 gpus = 3;
      Specified by:
      getGpusList in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
      Returns:
      A list containing the gpus.
    • getGpusCount

      public int getGpusCount()
      @@  .. cpp:var:: int32 gpus (repeated)
      @@
      @@     GPU(s) where instances should be available. For each GPU listed,
      @@     'count' instances of the model will be available. Setting 'gpus'
      @@     to empty (or not specifying at all) is equivalent to listing all
      @@     available GPUs.
      @@
       
      repeated int32 gpus = 3;
      Specified by:
      getGpusCount in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
      Returns:
      The count of gpus.
    • getGpus

      public int getGpus(int index)
      @@  .. cpp:var:: int32 gpus (repeated)
      @@
      @@     GPU(s) where instances should be available. For each GPU listed,
      @@     'count' instances of the model will be available. Setting 'gpus'
      @@     to empty (or not specifying at all) is equivalent to listing all
      @@     available GPUs.
      @@
       
      repeated int32 gpus = 3;
      Specified by:
      getGpus in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
      Parameters:
      index - The index of the element to return.
      Returns:
      The gpus at the given index.
    • getSecondaryDevicesList

      public List<ModelConfigOuterClass.ModelInstanceGroup.SecondaryDevice> getSecondaryDevicesList()
      @@  .. cpp:var:: SecondaryDevice secondary_devices (repeated)
      @@
      @@     Secondary devices that are required by instances specified by this
      @@     instance group. Optional.
      @@
       
      repeated .inference.ModelInstanceGroup.SecondaryDevice secondary_devices = 8;
      Specified by:
      getSecondaryDevicesList in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
    • getSecondaryDevicesOrBuilderList

      public List<? extends ModelConfigOuterClass.ModelInstanceGroup.SecondaryDeviceOrBuilder> getSecondaryDevicesOrBuilderList()
      @@  .. cpp:var:: SecondaryDevice secondary_devices (repeated)
      @@
      @@     Secondary devices that are required by instances specified by this
      @@     instance group. Optional.
      @@
       
      repeated .inference.ModelInstanceGroup.SecondaryDevice secondary_devices = 8;
      Specified by:
      getSecondaryDevicesOrBuilderList in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
    • getSecondaryDevicesCount

      public int getSecondaryDevicesCount()
      @@  .. cpp:var:: SecondaryDevice secondary_devices (repeated)
      @@
      @@     Secondary devices that are required by instances specified by this
      @@     instance group. Optional.
      @@
       
      repeated .inference.ModelInstanceGroup.SecondaryDevice secondary_devices = 8;
      Specified by:
      getSecondaryDevicesCount in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
    • getSecondaryDevices

      public ModelConfigOuterClass.ModelInstanceGroup.SecondaryDevice getSecondaryDevices(int index)
      @@  .. cpp:var:: SecondaryDevice secondary_devices (repeated)
      @@
      @@     Secondary devices that are required by instances specified by this
      @@     instance group. Optional.
      @@
       
      repeated .inference.ModelInstanceGroup.SecondaryDevice secondary_devices = 8;
      Specified by:
      getSecondaryDevices in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
    • getSecondaryDevicesOrBuilder

      public ModelConfigOuterClass.ModelInstanceGroup.SecondaryDeviceOrBuilder getSecondaryDevicesOrBuilder(int index)
      @@  .. cpp:var:: SecondaryDevice secondary_devices (repeated)
      @@
      @@     Secondary devices that are required by instances specified by this
      @@     instance group. Optional.
      @@
       
      repeated .inference.ModelInstanceGroup.SecondaryDevice secondary_devices = 8;
      Specified by:
      getSecondaryDevicesOrBuilder in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
    • getProfileList

      public com.google.protobuf.ProtocolStringList getProfileList()
      @@  .. cpp:var:: string profile (repeated)
      @@
      @@     For TensorRT models containing multiple optimization profiles, this
      @@     parameter specifies a set of optimization profiles available to this
      @@     instance group. The inference server will choose the optimal profile
      @@     based on the shapes of the input tensors. This field should lie
      @@     between 0 and <TotalNumberOfOptimizationProfilesInPlanModel> - 1
      @@     and be specified only for TensorRT backend, otherwise an error will
      @@     be generated. If not specified, the server will select the first
      @@     optimization profile by default.
      @@
       
      repeated string profile = 5;
      Specified by:
      getProfileList in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
      Returns:
      A list containing the profile.
    • getProfileCount

      public int getProfileCount()
      @@  .. cpp:var:: string profile (repeated)
      @@
      @@     For TensorRT models containing multiple optimization profiles, this
      @@     parameter specifies a set of optimization profiles available to this
      @@     instance group. The inference server will choose the optimal profile
      @@     based on the shapes of the input tensors. This field should lie
      @@     between 0 and <TotalNumberOfOptimizationProfilesInPlanModel> - 1
      @@     and be specified only for TensorRT backend, otherwise an error will
      @@     be generated. If not specified, the server will select the first
      @@     optimization profile by default.
      @@
       
      repeated string profile = 5;
      Specified by:
      getProfileCount in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
      Returns:
      The count of profile.
    • getProfile

      public String getProfile(int index)
      @@  .. cpp:var:: string profile (repeated)
      @@
      @@     For TensorRT models containing multiple optimization profiles, this
      @@     parameter specifies a set of optimization profiles available to this
      @@     instance group. The inference server will choose the optimal profile
      @@     based on the shapes of the input tensors. This field should lie
      @@     between 0 and <TotalNumberOfOptimizationProfilesInPlanModel> - 1
      @@     and be specified only for TensorRT backend, otherwise an error will
      @@     be generated. If not specified, the server will select the first
      @@     optimization profile by default.
      @@
       
      repeated string profile = 5;
      Specified by:
      getProfile in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
      Parameters:
      index - The index of the element to return.
      Returns:
      The profile at the given index.
    • getProfileBytes

      public com.google.protobuf.ByteString getProfileBytes(int index)
      @@  .. cpp:var:: string profile (repeated)
      @@
      @@     For TensorRT models containing multiple optimization profiles, this
      @@     parameter specifies a set of optimization profiles available to this
      @@     instance group. The inference server will choose the optimal profile
      @@     based on the shapes of the input tensors. This field should lie
      @@     between 0 and <TotalNumberOfOptimizationProfilesInPlanModel> - 1
      @@     and be specified only for TensorRT backend, otherwise an error will
      @@     be generated. If not specified, the server will select the first
      @@     optimization profile by default.
      @@
       
      repeated string profile = 5;
      Specified by:
      getProfileBytes in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
      Parameters:
      index - The index of the value to return.
      Returns:
      The bytes of the profile at the given index.
    • getPassive

      public boolean getPassive()
      @@  .. cpp:var:: bool passive
      @@
      @@     Whether the instances within this instance group will be accepting
      @@     inference requests from the scheduler. If true, the instances will
      @@     not be added to the scheduler. Default value is false.
      @@
       
      bool passive = 7;
      Specified by:
      getPassive in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
      Returns:
      The passive.
    • getHostPolicy

      public String getHostPolicy()
      @@  .. cpp:var:: string host_policy
      @@
      @@     The host policy name that the instance is to be associated with.
      @@     The default value is set to reflect the device kind of the instance,
      @@     for instance, KIND_CPU is "cpu", KIND_MODEL is "model" and
      @@     KIND_GPU is "gpu_<gpu_id>".
      @@
       
      string host_policy = 9;
      Specified by:
      getHostPolicy in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
      Returns:
      The hostPolicy.
    • getHostPolicyBytes

      public com.google.protobuf.ByteString getHostPolicyBytes()
      @@  .. cpp:var:: string host_policy
      @@
      @@     The host policy name that the instance is to be associated with.
      @@     The default value is set to reflect the device kind of the instance,
      @@     for instance, KIND_CPU is "cpu", KIND_MODEL is "model" and
      @@     KIND_GPU is "gpu_<gpu_id>".
      @@
       
      string host_policy = 9;
      Specified by:
      getHostPolicyBytes in interface ModelConfigOuterClass.ModelInstanceGroupOrBuilder
      Returns:
      The bytes for hostPolicy.
    • isInitialized

      public final boolean isInitialized()
      Specified by:
      isInitialized in interface com.google.protobuf.MessageLiteOrBuilder
      Overrides:
      isInitialized in class com.google.protobuf.GeneratedMessageV3
    • writeTo

      public void writeTo(com.google.protobuf.CodedOutputStream output) throws IOException
      Specified by:
      writeTo in interface com.google.protobuf.MessageLite
      Overrides:
      writeTo in class com.google.protobuf.GeneratedMessageV3
      Throws:
      IOException
    • getSerializedSize

      public int getSerializedSize()
      Specified by:
      getSerializedSize in interface com.google.protobuf.MessageLite
      Overrides:
      getSerializedSize in class com.google.protobuf.GeneratedMessageV3
    • equals

      public boolean equals(Object obj)
      Specified by:
      equals in interface com.google.protobuf.Message
      Overrides:
      equals in class com.google.protobuf.AbstractMessage
    • hashCode

      public int hashCode()
      Specified by:
      hashCode in interface com.google.protobuf.Message
      Overrides:
      hashCode in class com.google.protobuf.AbstractMessage
    • parseFrom

      public static ModelConfigOuterClass.ModelInstanceGroup parseFrom(ByteBuffer data) throws com.google.protobuf.InvalidProtocolBufferException
      Throws:
      com.google.protobuf.InvalidProtocolBufferException
    • parseFrom

      public static ModelConfigOuterClass.ModelInstanceGroup parseFrom(ByteBuffer data, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws com.google.protobuf.InvalidProtocolBufferException
      Throws:
      com.google.protobuf.InvalidProtocolBufferException
    • parseFrom

      public static ModelConfigOuterClass.ModelInstanceGroup parseFrom(com.google.protobuf.ByteString data) throws com.google.protobuf.InvalidProtocolBufferException
      Throws:
      com.google.protobuf.InvalidProtocolBufferException
    • parseFrom

      public static ModelConfigOuterClass.ModelInstanceGroup parseFrom(com.google.protobuf.ByteString data, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws com.google.protobuf.InvalidProtocolBufferException
      Throws:
      com.google.protobuf.InvalidProtocolBufferException
    • parseFrom

      public static ModelConfigOuterClass.ModelInstanceGroup parseFrom(byte[] data) throws com.google.protobuf.InvalidProtocolBufferException
      Throws:
      com.google.protobuf.InvalidProtocolBufferException
    • parseFrom

      public static ModelConfigOuterClass.ModelInstanceGroup parseFrom(byte[] data, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws com.google.protobuf.InvalidProtocolBufferException
      Throws:
      com.google.protobuf.InvalidProtocolBufferException
    • parseFrom

      public static ModelConfigOuterClass.ModelInstanceGroup parseFrom(InputStream input) throws IOException
      Throws:
      IOException
    • parseFrom

      public static ModelConfigOuterClass.ModelInstanceGroup parseFrom(InputStream input, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws IOException
      Throws:
      IOException
    • parseDelimitedFrom

      public static ModelConfigOuterClass.ModelInstanceGroup parseDelimitedFrom(InputStream input) throws IOException
      Throws:
      IOException
    • parseDelimitedFrom

      public static ModelConfigOuterClass.ModelInstanceGroup parseDelimitedFrom(InputStream input, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws IOException
      Throws:
      IOException
    • parseFrom

      public static ModelConfigOuterClass.ModelInstanceGroup parseFrom(com.google.protobuf.CodedInputStream input) throws IOException
      Throws:
      IOException
    • parseFrom

      public static ModelConfigOuterClass.ModelInstanceGroup parseFrom(com.google.protobuf.CodedInputStream input, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws IOException
      Throws:
      IOException
    • newBuilderForType

      public ModelConfigOuterClass.ModelInstanceGroup.Builder newBuilderForType()
      Specified by:
      newBuilderForType in interface com.google.protobuf.Message
      Specified by:
      newBuilderForType in interface com.google.protobuf.MessageLite
    • newBuilder

      public static ModelConfigOuterClass.ModelInstanceGroup.Builder newBuilder()
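    • newBuilder

      public static ModelConfigOuterClass.ModelInstanceGroup.Builder newBuilder(ModelConfigOuterClass.ModelInstanceGroup prototype)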
    • toBuilder

      public ModelConfigOuterClass.ModelInstanceGroup.Builder toBuilder()
      Specified by:
      toBuilder in interface com.google.protobuf.Message
      Specified by:
      toBuilder in interface com.google.protobuf.MessageLite
    • newBuilderForType

      protected ModelConfigOuterClass.ModelInstanceGroup.Builder newBuilderForType(com.google.protobuf.GeneratedMessageV3.BuilderParent parent)
      Specified by:
      newBuilderForType in class com.google.protobuf.GeneratedMessageV3
    • getDefaultInstance

      public static ModelConfigOuterClass.ModelInstanceGroup getDefaultInstance()
    • parser

      public static com.google.protobuf.Parser<ModelConfigOuterClass.ModelInstanceGroup> parser()
    • getParserForType

      public com.google.protobuf.Parser<ModelConfigOuterClass.ModelInstanceGroup> getParserForType()
      Specified by:
      getParserForType in interface com.google.protobuf.Message
      Specified by:
      getParserForType in interface com.google.protobuf.MessageLite
      Overrides:
      getParserForType in class com.google.protobuf.GeneratedMessageV3
    • getDefaultInstanceForType

      public ModelConfigOuterClass.ModelInstanceGroup getDefaultInstanceForType()
      Specified by:
      getDefaultInstanceForType in interface com.google.protobuf.MessageLiteOrBuilder
      Specified by:
      getDefaultInstanceForType in interface com.google.protobuf.MessageOrBuilder