diff --git a/AiPlatform/metadata/V1/Endpoint.php b/AiPlatform/metadata/V1/Endpoint.php index cbcb49763cfa..309d31b475c1 100644 Binary files a/AiPlatform/metadata/V1/Endpoint.php and b/AiPlatform/metadata/V1/Endpoint.php differ diff --git a/AiPlatform/src/V1/DeployedModel.php b/AiPlatform/src/V1/DeployedModel.php index 3f33119f03f8..18123cd20d99 100644 --- a/AiPlatform/src/V1/DeployedModel.php +++ b/AiPlatform/src/V1/DeployedModel.php @@ -149,6 +149,12 @@ class DeployedModel extends \Google\Protobuf\Internal\Message * Generated from protobuf field map system_labels = 28; */ private $system_labels; + /** + * Optional. Spec for configuring speculative decoding. + * + * Generated from protobuf field .google.cloud.aiplatform.v1.SpeculativeDecodingSpec speculative_decoding_spec = 30 [(.google.api.field_behavior) = OPTIONAL]; + */ + protected $speculative_decoding_spec = null; protected $prediction_resources; /** @@ -245,6 +251,8 @@ class DeployedModel extends \Google\Protobuf\Internal\Message * @type array|\Google\Protobuf\Internal\MapField $system_labels * System labels to apply to Model Garden deployments. * System labels are managed by Google for internal use only. + * @type \Google\Cloud\AIPlatform\V1\SpeculativeDecodingSpec $speculative_decoding_spec + * Optional. Spec for configuring speculative decoding. * } */ public function __construct($data = NULL) { @@ -867,6 +875,42 @@ public function setSystemLabels($var) return $this; } + /** + * Optional. Spec for configuring speculative decoding. 
+ * + * Generated from protobuf field .google.cloud.aiplatform.v1.SpeculativeDecodingSpec speculative_decoding_spec = 30 [(.google.api.field_behavior) = OPTIONAL]; + * @return \Google\Cloud\AIPlatform\V1\SpeculativeDecodingSpec|null + */ + public function getSpeculativeDecodingSpec() + { + return $this->speculative_decoding_spec; + } + + public function hasSpeculativeDecodingSpec() + { + return isset($this->speculative_decoding_spec); + } + + public function clearSpeculativeDecodingSpec() + { + unset($this->speculative_decoding_spec); + } + + /** + * Optional. Spec for configuring speculative decoding. + * + * Generated from protobuf field .google.cloud.aiplatform.v1.SpeculativeDecodingSpec speculative_decoding_spec = 30 [(.google.api.field_behavior) = OPTIONAL]; + * @param \Google\Cloud\AIPlatform\V1\SpeculativeDecodingSpec $var + * @return $this + */ + public function setSpeculativeDecodingSpec($var) + { + GPBUtil::checkMessage($var, \Google\Cloud\AIPlatform\V1\SpeculativeDecodingSpec::class); + $this->speculative_decoding_spec = $var; + + return $this; + } + /** * @return string */ diff --git a/AiPlatform/src/V1/SpeculativeDecodingSpec.php b/AiPlatform/src/V1/SpeculativeDecodingSpec.php new file mode 100644 index 000000000000..5dbb14c34336 --- /dev/null +++ b/AiPlatform/src/V1/SpeculativeDecodingSpec.php @@ -0,0 +1,142 @@ +google.cloud.aiplatform.v1.SpeculativeDecodingSpec + */ +class SpeculativeDecodingSpec extends \Google\Protobuf\Internal\Message +{ + /** + * The number of speculative tokens to generate at each step. + * + * Generated from protobuf field int32 speculative_token_count = 1; + */ + protected $speculative_token_count = 0; + protected $speculation; + + /** + * Constructor. + * + * @param array $data { + * Optional. Data for populating the Message object. + * + * @type \Google\Cloud\AIPlatform\V1\SpeculativeDecodingSpec\DraftModelSpeculation $draft_model_speculation + * Draft model speculation. 
+ * @type \Google\Cloud\AIPlatform\V1\SpeculativeDecodingSpec\NgramSpeculation $ngram_speculation + * N-Gram speculation. + * @type int $speculative_token_count + * The number of speculative tokens to generate at each step. + * } + */ + public function __construct($data = NULL) { + \GPBMetadata\Google\Cloud\Aiplatform\V1\Endpoint::initOnce(); + parent::__construct($data); + } + + /** + * Draft model speculation. + * + * Generated from protobuf field .google.cloud.aiplatform.v1.SpeculativeDecodingSpec.DraftModelSpeculation draft_model_speculation = 2; + * @return \Google\Cloud\AIPlatform\V1\SpeculativeDecodingSpec\DraftModelSpeculation|null + */ + public function getDraftModelSpeculation() + { + return $this->readOneof(2); + } + + public function hasDraftModelSpeculation() + { + return $this->hasOneof(2); + } + + /** + * Draft model speculation. + * + * Generated from protobuf field .google.cloud.aiplatform.v1.SpeculativeDecodingSpec.DraftModelSpeculation draft_model_speculation = 2; + * @param \Google\Cloud\AIPlatform\V1\SpeculativeDecodingSpec\DraftModelSpeculation $var + * @return $this + */ + public function setDraftModelSpeculation($var) + { + GPBUtil::checkMessage($var, \Google\Cloud\AIPlatform\V1\SpeculativeDecodingSpec\DraftModelSpeculation::class); + $this->writeOneof(2, $var); + + return $this; + } + + /** + * N-Gram speculation. + * + * Generated from protobuf field .google.cloud.aiplatform.v1.SpeculativeDecodingSpec.NgramSpeculation ngram_speculation = 3; + * @return \Google\Cloud\AIPlatform\V1\SpeculativeDecodingSpec\NgramSpeculation|null + */ + public function getNgramSpeculation() + { + return $this->readOneof(3); + } + + public function hasNgramSpeculation() + { + return $this->hasOneof(3); + } + + /** + * N-Gram speculation. 
+ * + * Generated from protobuf field .google.cloud.aiplatform.v1.SpeculativeDecodingSpec.NgramSpeculation ngram_speculation = 3; + * @param \Google\Cloud\AIPlatform\V1\SpeculativeDecodingSpec\NgramSpeculation $var + * @return $this + */ + public function setNgramSpeculation($var) + { + GPBUtil::checkMessage($var, \Google\Cloud\AIPlatform\V1\SpeculativeDecodingSpec\NgramSpeculation::class); + $this->writeOneof(3, $var); + + return $this; + } + + /** + * The number of speculative tokens to generate at each step. + * + * Generated from protobuf field int32 speculative_token_count = 1; + * @return int + */ + public function getSpeculativeTokenCount() + { + return $this->speculative_token_count; + } + + /** + * The number of speculative tokens to generate at each step. + * + * Generated from protobuf field int32 speculative_token_count = 1; + * @param int $var + * @return $this + */ + public function setSpeculativeTokenCount($var) + { + GPBUtil::checkInt32($var); + $this->speculative_token_count = $var; + + return $this; + } + + /** + * @return string Value reported by whichOneof("speculation") for the "speculation" oneof. + */ + public function getSpeculation() + { + return $this->whichOneof("speculation"); + } + +} + diff --git a/AiPlatform/src/V1/SpeculativeDecodingSpec/DraftModelSpeculation.php b/AiPlatform/src/V1/SpeculativeDecodingSpec/DraftModelSpeculation.php new file mode 100644 index 000000000000..8096e48ea4dd --- /dev/null +++ b/AiPlatform/src/V1/SpeculativeDecodingSpec/DraftModelSpeculation.php @@ -0,0 +1,69 @@ +google.cloud.aiplatform.v1.SpeculativeDecodingSpec.DraftModelSpeculation + */ +class DraftModelSpeculation extends \Google\Protobuf\Internal\Message +{ + /** + * Required. The resource name of the draft model. + * + * Generated from protobuf field string draft_model = 1 [(.google.api.field_behavior) = REQUIRED, (.google.api.resource_reference) = { + */ + protected $draft_model = ''; + + /** + * Constructor. + * + * @param array $data { + * Optional. Data for populating the Message object. 
+ * + * @type string $draft_model + * Required. The resource name of the draft model. + * } + */ + public function __construct($data = NULL) { + \GPBMetadata\Google\Cloud\Aiplatform\V1\Endpoint::initOnce(); + parent::__construct($data); + } + + /** + * Required. The resource name of the draft model. + * + * Generated from protobuf field string draft_model = 1 [(.google.api.field_behavior) = REQUIRED, (.google.api.resource_reference) = { + * @return string + */ + public function getDraftModel() + { + return $this->draft_model; + } + + /** + * Required. The resource name of the draft model. + * + * Generated from protobuf field string draft_model = 1 [(.google.api.field_behavior) = REQUIRED, (.google.api.resource_reference) = { + * @param string $var + * @return $this + */ + public function setDraftModel($var) + { + GPBUtil::checkString($var, True); + $this->draft_model = $var; + + return $this; + } + +} + + diff --git a/AiPlatform/src/V1/SpeculativeDecodingSpec/NgramSpeculation.php b/AiPlatform/src/V1/SpeculativeDecodingSpec/NgramSpeculation.php new file mode 100644 index 000000000000..7fd31b4bfefb --- /dev/null +++ b/AiPlatform/src/V1/SpeculativeDecodingSpec/NgramSpeculation.php @@ -0,0 +1,82 @@ +google.cloud.aiplatform.v1.SpeculativeDecodingSpec.NgramSpeculation + */ +class NgramSpeculation extends \Google\Protobuf\Internal\Message +{ + /** + * The number of last N input tokens used as ngram to search/match + * against the previous prompt sequence. + * This is equal to the N in N-Gram. + * The default value is 3 if not specified. + * + * Generated from protobuf field int32 ngram_size = 1; + */ + protected $ngram_size = 0; + + /** + * Constructor. + * + * @param array $data { + * Optional. Data for populating the Message object. + * + * @type int $ngram_size + * The number of last N input tokens used as ngram to search/match + * against the previous prompt sequence. + * This is equal to the N in N-Gram. + * The default value is 3 if not specified. 
+ * } + */ + public function __construct($data = NULL) { + \GPBMetadata\Google\Cloud\Aiplatform\V1\Endpoint::initOnce(); + parent::__construct($data); + } + + /** + * The number of last N input tokens used as ngram to search/match + * against the previous prompt sequence. + * This is equal to the N in N-Gram. + * The default value is 3 if not specified. + * + * Generated from protobuf field int32 ngram_size = 1; + * @return int + */ + public function getNgramSize() + { + return $this->ngram_size; + } + + /** + * The number of last N input tokens used as ngram to search/match + * against the previous prompt sequence. + * This is equal to the N in N-Gram. + * The default value is 3 if not specified. + * + * Generated from protobuf field int32 ngram_size = 1; + * @param int $var + * @return $this + */ + public function setNgramSize($var) + { + GPBUtil::checkInt32($var); + $this->ngram_size = $var; + + return $this; + } + +} + +