public final class SpeculativeDecodingSpec extends com.google.protobuf.GeneratedMessageV3 implements SpeculativeDecodingSpecOrBuilder
Configuration for Speculative Decoding.

Protobuf type google.cloud.vertexai.v1.SpeculativeDecodingSpec

| Modifier and Type | Class and Description |
|---|---|
static class |
SpeculativeDecodingSpec.Builder
Configuration for Speculative Decoding.
|
static class |
SpeculativeDecodingSpec.DraftModelSpeculation
Draft model speculation works by using the smaller model to generate
candidate tokens for speculative decoding.
|
static interface |
SpeculativeDecodingSpec.DraftModelSpeculationOrBuilder |
static class |
SpeculativeDecodingSpec.NgramSpeculation
N-Gram speculation works by trying to find matching tokens in the
previous prompt sequence and using those as speculation for generating
new tokens.
|
static interface |
SpeculativeDecodingSpec.NgramSpeculationOrBuilder |
static class |
SpeculativeDecodingSpec.SpeculationCase |
com.google.protobuf.GeneratedMessageV3.BuilderParent, com.google.protobuf.GeneratedMessageV3.ExtendableBuilder<MessageT extends com.google.protobuf.GeneratedMessageV3.ExtendableMessage<MessageT>,BuilderT extends com.google.protobuf.GeneratedMessageV3.ExtendableBuilder<MessageT,BuilderT>>, com.google.protobuf.GeneratedMessageV3.ExtendableMessage<MessageT extends com.google.protobuf.GeneratedMessageV3.ExtendableMessage<MessageT>>, com.google.protobuf.GeneratedMessageV3.ExtendableMessageOrBuilder<MessageT extends com.google.protobuf.GeneratedMessageV3.ExtendableMessage<MessageT>>, com.google.protobuf.GeneratedMessageV3.FieldAccessorTable, com.google.protobuf.GeneratedMessageV3.UnusedPrivateParameter

| Modifier and Type | Field and Description |
|---|---|
static int |
DRAFT_MODEL_SPECULATION_FIELD_NUMBER |
static int |
NGRAM_SPECULATION_FIELD_NUMBER |
static int |
SPECULATIVE_TOKEN_COUNT_FIELD_NUMBER |
| Modifier and Type | Method and Description |
|---|---|
boolean |
equals(Object obj) |
static SpeculativeDecodingSpec |
getDefaultInstance() |
SpeculativeDecodingSpec |
getDefaultInstanceForType() |
static com.google.protobuf.Descriptors.Descriptor |
getDescriptor() |
SpeculativeDecodingSpec.DraftModelSpeculation |
getDraftModelSpeculation()
Draft model speculation.
|
SpeculativeDecodingSpec.DraftModelSpeculationOrBuilder |
getDraftModelSpeculationOrBuilder()
Draft model speculation.
|
SpeculativeDecodingSpec.NgramSpeculation |
getNgramSpeculation()
N-Gram speculation.
|
SpeculativeDecodingSpec.NgramSpeculationOrBuilder |
getNgramSpeculationOrBuilder()
N-Gram speculation.
|
com.google.protobuf.Parser<SpeculativeDecodingSpec> |
getParserForType() |
int |
getSerializedSize() |
SpeculativeDecodingSpec.SpeculationCase |
getSpeculationCase() |
int |
getSpeculativeTokenCount()
The number of speculative tokens to generate at each step.
|
boolean |
hasDraftModelSpeculation()
Draft model speculation.
|
int |
hashCode() |
boolean |
hasNgramSpeculation()
N-Gram speculation.
|
protected com.google.protobuf.GeneratedMessageV3.FieldAccessorTable |
internalGetFieldAccessorTable() |
boolean |
isInitialized() |
static SpeculativeDecodingSpec.Builder |
newBuilder() |
static SpeculativeDecodingSpec.Builder |
newBuilder(SpeculativeDecodingSpec prototype) |
SpeculativeDecodingSpec.Builder |
newBuilderForType() |
protected SpeculativeDecodingSpec.Builder |
newBuilderForType(com.google.protobuf.GeneratedMessageV3.BuilderParent parent) |
protected Object |
newInstance(com.google.protobuf.GeneratedMessageV3.UnusedPrivateParameter unused) |
static SpeculativeDecodingSpec |
parseDelimitedFrom(InputStream input) |
static SpeculativeDecodingSpec |
parseDelimitedFrom(InputStream input,
com.google.protobuf.ExtensionRegistryLite extensionRegistry) |
static SpeculativeDecodingSpec |
parseFrom(byte[] data) |
static SpeculativeDecodingSpec |
parseFrom(byte[] data,
com.google.protobuf.ExtensionRegistryLite extensionRegistry) |
static SpeculativeDecodingSpec |
parseFrom(ByteBuffer data) |
static SpeculativeDecodingSpec |
parseFrom(ByteBuffer data,
com.google.protobuf.ExtensionRegistryLite extensionRegistry) |
static SpeculativeDecodingSpec |
parseFrom(com.google.protobuf.ByteString data) |
static SpeculativeDecodingSpec |
parseFrom(com.google.protobuf.ByteString data,
com.google.protobuf.ExtensionRegistryLite extensionRegistry) |
static SpeculativeDecodingSpec |
parseFrom(com.google.protobuf.CodedInputStream input) |
static SpeculativeDecodingSpec |
parseFrom(com.google.protobuf.CodedInputStream input,
com.google.protobuf.ExtensionRegistryLite extensionRegistry) |
static SpeculativeDecodingSpec |
parseFrom(InputStream input) |
static SpeculativeDecodingSpec |
parseFrom(InputStream input,
com.google.protobuf.ExtensionRegistryLite extensionRegistry) |
static com.google.protobuf.Parser<SpeculativeDecodingSpec> |
parser() |
SpeculativeDecodingSpec.Builder |
toBuilder() |
void |
writeTo(com.google.protobuf.CodedOutputStream output) |
canUseUnsafe, computeStringSize, computeStringSizeNoTag, emptyBooleanList, emptyDoubleList, emptyFloatList, emptyIntList, emptyList, emptyLongList, getAllFields, getDescriptorForType, getField, getOneofFieldDescriptor, getRepeatedField, getRepeatedFieldCount, getUnknownFields, hasField, hasOneof, internalGetMapField, internalGetMapFieldReflection, isStringEmpty, makeExtensionsImmutable, makeMutableCopy, makeMutableCopy, mergeFromAndMakeImmutableInternal, mutableCopy, mutableCopy, mutableCopy, mutableCopy, mutableCopy, newBooleanList, newBuilderForType, newDoubleList, newFloatList, newIntList, newLongList, parseDelimitedWithIOException, parseDelimitedWithIOException, parseUnknownField, parseUnknownFieldProto3, parseWithIOException, parseWithIOException, parseWithIOException, parseWithIOException, serializeBooleanMapTo, serializeIntegerMapTo, serializeLongMapTo, serializeStringMapTo, writeReplace, writeString, writeStringNoTag
findInitializationErrors, getInitializationErrorString, hashBoolean, hashEnum, hashEnumList, hashFields, hashLong, toString
addAll, addAll, checkByteStringIsUtf8, toByteArray, toByteString, writeDelimitedTo, writeTo
clone, finalize, getClass, notify, notifyAll, wait, wait, wait

public static final int DRAFT_MODEL_SPECULATION_FIELD_NUMBER
public static final int NGRAM_SPECULATION_FIELD_NUMBER
public static final int SPECULATIVE_TOKEN_COUNT_FIELD_NUMBER
protected Object newInstance(com.google.protobuf.GeneratedMessageV3.UnusedPrivateParameter unused)
newInstance in class com.google.protobuf.GeneratedMessageV3
public static final com.google.protobuf.Descriptors.Descriptor getDescriptor()
protected com.google.protobuf.GeneratedMessageV3.FieldAccessorTable internalGetFieldAccessorTable()
internalGetFieldAccessorTable in class com.google.protobuf.GeneratedMessageV3
public SpeculativeDecodingSpec.SpeculationCase getSpeculationCase()
getSpeculationCase in interface SpeculativeDecodingSpecOrBuilder
public boolean hasDraftModelSpeculation()
Draft model speculation.
.google.cloud.vertexai.v1.SpeculativeDecodingSpec.DraftModelSpeculation draft_model_speculation = 2;
hasDraftModelSpeculation in interface SpeculativeDecodingSpecOrBuilder
public SpeculativeDecodingSpec.DraftModelSpeculation getDraftModelSpeculation()
Draft model speculation.
.google.cloud.vertexai.v1.SpeculativeDecodingSpec.DraftModelSpeculation draft_model_speculation = 2;
getDraftModelSpeculation in interface SpeculativeDecodingSpecOrBuilder
public SpeculativeDecodingSpec.DraftModelSpeculationOrBuilder getDraftModelSpeculationOrBuilder()
Draft model speculation.
.google.cloud.vertexai.v1.SpeculativeDecodingSpec.DraftModelSpeculation draft_model_speculation = 2;
getDraftModelSpeculationOrBuilder in interface SpeculativeDecodingSpecOrBuilder
public boolean hasNgramSpeculation()
N-Gram speculation.
.google.cloud.vertexai.v1.SpeculativeDecodingSpec.NgramSpeculation ngram_speculation = 3;
hasNgramSpeculation in interface SpeculativeDecodingSpecOrBuilder
public SpeculativeDecodingSpec.NgramSpeculation getNgramSpeculation()
N-Gram speculation.
.google.cloud.vertexai.v1.SpeculativeDecodingSpec.NgramSpeculation ngram_speculation = 3;
getNgramSpeculation in interface SpeculativeDecodingSpecOrBuilder
public SpeculativeDecodingSpec.NgramSpeculationOrBuilder getNgramSpeculationOrBuilder()
N-Gram speculation.
.google.cloud.vertexai.v1.SpeculativeDecodingSpec.NgramSpeculation ngram_speculation = 3;
getNgramSpeculationOrBuilder in interface SpeculativeDecodingSpecOrBuilder
public int getSpeculativeTokenCount()
The number of speculative tokens to generate at each step.
int32 speculative_token_count = 1;
getSpeculativeTokenCount in interface SpeculativeDecodingSpecOrBuilder
public final boolean isInitialized()
isInitialized in interface com.google.protobuf.MessageLiteOrBuilder
isInitialized in class com.google.protobuf.GeneratedMessageV3
public void writeTo(com.google.protobuf.CodedOutputStream output)
throws IOException
writeTo in interface com.google.protobuf.MessageLite
writeTo in class com.google.protobuf.GeneratedMessageV3
Throws: IOException
public int getSerializedSize()
getSerializedSize in interface com.google.protobuf.MessageLite
getSerializedSize in class com.google.protobuf.GeneratedMessageV3
public boolean equals(Object obj)
equals in interface com.google.protobuf.Message
equals in class com.google.protobuf.AbstractMessage
public int hashCode()
hashCode in interface com.google.protobuf.Message
hashCode in class com.google.protobuf.AbstractMessage
public static SpeculativeDecodingSpec parseFrom(ByteBuffer data) throws com.google.protobuf.InvalidProtocolBufferException
Throws: com.google.protobuf.InvalidProtocolBufferException
public static SpeculativeDecodingSpec parseFrom(ByteBuffer data, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws com.google.protobuf.InvalidProtocolBufferException
Throws: com.google.protobuf.InvalidProtocolBufferException
public static SpeculativeDecodingSpec parseFrom(com.google.protobuf.ByteString data) throws com.google.protobuf.InvalidProtocolBufferException
Throws: com.google.protobuf.InvalidProtocolBufferException
public static SpeculativeDecodingSpec parseFrom(com.google.protobuf.ByteString data, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws com.google.protobuf.InvalidProtocolBufferException
Throws: com.google.protobuf.InvalidProtocolBufferException
public static SpeculativeDecodingSpec parseFrom(byte[] data) throws com.google.protobuf.InvalidProtocolBufferException
Throws: com.google.protobuf.InvalidProtocolBufferException
public static SpeculativeDecodingSpec parseFrom(byte[] data, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws com.google.protobuf.InvalidProtocolBufferException
Throws: com.google.protobuf.InvalidProtocolBufferException
public static SpeculativeDecodingSpec parseFrom(InputStream input) throws IOException
Throws: IOException
public static SpeculativeDecodingSpec parseFrom(InputStream input, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws IOException
Throws: IOException
public static SpeculativeDecodingSpec parseDelimitedFrom(InputStream input) throws IOException
Throws: IOException
public static SpeculativeDecodingSpec parseDelimitedFrom(InputStream input, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws IOException
Throws: IOException
public static SpeculativeDecodingSpec parseFrom(com.google.protobuf.CodedInputStream input) throws IOException
Throws: IOException
public static SpeculativeDecodingSpec parseFrom(com.google.protobuf.CodedInputStream input, com.google.protobuf.ExtensionRegistryLite extensionRegistry) throws IOException
Throws: IOException
public SpeculativeDecodingSpec.Builder newBuilderForType()
newBuilderForType in interface com.google.protobuf.Message
newBuilderForType in interface com.google.protobuf.MessageLite
public static SpeculativeDecodingSpec.Builder newBuilder()
public static SpeculativeDecodingSpec.Builder newBuilder(SpeculativeDecodingSpec prototype)
public SpeculativeDecodingSpec.Builder toBuilder()
toBuilder in interface com.google.protobuf.Message
toBuilder in interface com.google.protobuf.MessageLite
protected SpeculativeDecodingSpec.Builder newBuilderForType(com.google.protobuf.GeneratedMessageV3.BuilderParent parent)
newBuilderForType in class com.google.protobuf.GeneratedMessageV3
public static SpeculativeDecodingSpec getDefaultInstance()
public static com.google.protobuf.Parser<SpeculativeDecodingSpec> parser()
public com.google.protobuf.Parser<SpeculativeDecodingSpec> getParserForType()
getParserForType in interface com.google.protobuf.Message
getParserForType in interface com.google.protobuf.MessageLite
getParserForType in class com.google.protobuf.GeneratedMessageV3
public SpeculativeDecodingSpec getDefaultInstanceForType()
getDefaultInstanceForType in interface com.google.protobuf.MessageLiteOrBuilder
getDefaultInstanceForType in interface com.google.protobuf.MessageOrBuilder

Copyright © 2025 Google LLC. All rights reserved.