Skip to content

Commit 7844b94

Browse files
zygiert1990michal.zyga
and
michal.zyga
authored
add Batch API, extend chat completion request body & response (#285)
Co-authored-by: michal.zyga <michal.zyga@softwaremill.com>
1 parent 57419ad commit 7844b94

25 files changed

+1083
-71
lines changed

core/src/main/scala/sttp/openai/OpenAI.scala

+89-3
Original file line numberDiff line numberDiff line change
@@ -17,14 +17,14 @@ import sttp.openai.requests.audio.AudioResponseData.AudioResponse
1717
import sttp.openai.requests.audio.RecognitionModel
1818
import sttp.openai.requests.audio.transcriptions.TranscriptionConfig
1919
import sttp.openai.requests.audio.translations.TranslationConfig
20+
import sttp.openai.requests.batch.{QueryParameters => _, _}
2021
import sttp.openai.requests.completions.CompletionsRequestBody.CompletionsBody
2122
import sttp.openai.requests.completions.CompletionsResponseData.CompletionsResponse
2223
import sttp.openai.requests.completions.chat.ChatRequestBody.ChatBody
2324
import sttp.openai.requests.completions.chat.ChatRequestResponseData.ChatResponse
2425
import sttp.openai.requests.embeddings.EmbeddingsRequestBody.EmbeddingsBody
2526
import sttp.openai.requests.embeddings.EmbeddingsResponseBody.EmbeddingResponse
2627
import sttp.openai.requests.files.FilesResponseData._
27-
import sttp.openai.requests.finetuning
2828
import sttp.openai.requests.finetuning._
2929
import sttp.openai.requests.images.ImageResponseData.ImageResponse
3030
import sttp.openai.requests.images.creation.ImageCreationRequestBody.ImageCreationBody
@@ -37,7 +37,7 @@ import sttp.openai.requests.threads.QueryParameters
3737
import sttp.openai.requests.threads.ThreadsRequestBody.CreateThreadBody
3838
import sttp.openai.requests.threads.ThreadsResponseData.{DeleteThreadResponse, ThreadData}
3939
import sttp.openai.requests.threads.messages.ThreadMessagesRequestBody.CreateMessage
40-
import sttp.openai.requests.threads.messages.ThreadMessagesResponseData.{ListMessagesResponse, MessageData}
40+
import sttp.openai.requests.threads.messages.ThreadMessagesResponseData.{DeleteMessageResponse, ListMessagesResponse, MessageData}
4141
import sttp.openai.requests.threads.runs.ThreadRunsRequestBody._
4242
import sttp.openai.requests.threads.runs.ThreadRunsResponseData.{ListRunStepsResponse, ListRunsResponse, RunData, RunStepData}
4343
import sttp.openai.requests.vectorstore.VectorStoreRequestBody.{CreateVectorStoreBody, ModifyVectorStoreBody}
@@ -48,6 +48,7 @@ import sttp.openai.requests.vectorstore.file.VectorStoreFileResponseData.{
4848
ListVectorStoreFilesResponse,
4949
VectorStoreFile
5050
}
51+
import sttp.openai.requests.{batch, finetuning}
5152

5253
import java.io.{File, InputStream}
5354
import java.nio.file.Paths
@@ -463,7 +464,8 @@ class OpenAI(authToken: String, baseUri: Uri = OpenAIUris.OpenAIBaseUri) {
463464
Some(multipart("model", model.value)),
464465
prompt.map(multipart("prompt", _)),
465466
responseFormat.map(format => multipart("response_format", format)),
466-
temperature.map(multipart("temperature", _))
467+
temperature.map(multipart("temperature", _)),
468+
language.map(multipart("language", _))
467469
).flatten
468470
}
469471
.response(asJson_parseErrors[AudioResponse])
@@ -767,6 +769,24 @@ class OpenAI(authToken: String, baseUri: Uri = OpenAIUris.OpenAIBaseUri) {
767769
.body(metadata)
768770
.response(asJson_parseErrors[MessageData])
769771

772+
/** Deletes a message.
773+
*
774+
* [[https://platform.openai.com/docs/api-reference/messages/deleteMessage]]
775+
*
776+
* @param threadId
777+
* The ID of the thread to which this message belongs.
778+
*
779+
* @param messageId
780+
* The ID of the message to delete.
781+
*
782+
* @return
783+
* Deletion status
784+
*/
785+
def deleteMessage(threadId: String, messageId: String): Request[Either[OpenAIException, DeleteMessageResponse]] =
786+
betaOpenAIAuthRequest
787+
.delete(openAIUris.threadMessage(threadId, messageId))
788+
.response(asJson_parseErrors[DeleteMessageResponse])
789+
770790
/** Create an assistant with a model and instructions.
771791
*
772792
* [[https://platform.openai.com/docs/api-reference/assistants/createAssistant]]
@@ -1113,6 +1133,68 @@ class OpenAI(authToken: String, baseUri: Uri = OpenAIUris.OpenAIBaseUri) {
11131133
.delete(openAIUris.vectorStoreFile(vectorStoreId, fileId))
11141134
.response(asJson_parseErrors[DeleteVectorStoreFileResponse])
11151135

1136+
/** Creates and executes a batch from an uploaded file of requests
1137+
*
1138+
* [[https://platform.openai.com/docs/api-reference/batch/create]]
1139+
*
1140+
* @param createBatchRequest
1141+
* Request body that will be used to create a batch.
1142+
* @return
1143+
* The created Batch object.
1144+
*/
1145+
def createBatch(createBatchRequest: BatchRequestBody): Request[Either[OpenAIException, BatchResponse]] =
1146+
openAIAuthRequest
1147+
.post(openAIUris.Batches)
1148+
.body(createBatchRequest)
1149+
.response(asJson_parseErrors[BatchResponse])
1150+
1151+
/** Retrieves a batch.
1152+
*
1153+
* [[https://platform.openai.com/docs/api-reference/batch/retrieve]]
1154+
*
1155+
* @param batchId
1156+
* The ID of the batch to retrieve.
1157+
* @return
1158+
* The Batch object matching the specified ID.
1159+
*/
1160+
def retrieveBatch(batchId: String): Request[Either[OpenAIException, BatchResponse]] =
1161+
openAIAuthRequest
1162+
.get(openAIUris.batch(batchId))
1163+
.response(asJson_parseErrors[BatchResponse])
1164+
1165+
/** Cancels an in-progress batch. The batch will be in status cancelling for up to 10 minutes, before changing to cancelled, where it will
1166+
* have partial results (if any) available in the output file.
1167+
*
1168+
* [[https://platform.openai.com/docs/api-reference/batch/cancel]]
1169+
*
1170+
* @param batchId
1171+
* The ID of the batch to cancel.
1172+
* @return
1173+
* The Batch object matching the specified ID.
1174+
*/
1175+
def cancelBatch(batchId: String): Request[Either[OpenAIException, BatchResponse]] =
1176+
openAIAuthRequest
1177+
.post(openAIUris.cancelBatch(batchId))
1178+
.response(asJson_parseErrors[BatchResponse])
1179+
1180+
/** List your organization's batches.
1181+
*
1182+
* [[https://platform.openai.com/docs/api-reference/batch/list]]
1183+
*
1184+
* @return
1185+
* A list of paginated Batch objects.
1186+
*/
1187+
def listBatches(
1188+
queryParameters: batch.QueryParameters = batch.QueryParameters.empty
1189+
): Request[Either[OpenAIException, ListBatchResponse]] = {
1190+
val uri = openAIUris.Batches
1191+
.withParams(queryParameters.toMap)
1192+
1193+
openAIAuthRequest
1194+
.get(uri)
1195+
.response(asJson_parseErrors[ListBatchResponse])
1196+
}
1197+
11161198
protected val openAIAuthRequest: PartialRequest[Either[String, String]] = basicRequest.auth
11171199
.bearer(authToken)
11181200

@@ -1133,6 +1215,7 @@ private class OpenAIUris(val baseUri: Uri) {
11331215
val Models: Uri = uri"$baseUri/models"
11341216
val Moderations: Uri = uri"$baseUri/moderations"
11351217
val FineTuningJobs: Uri = uri"$baseUri/fine_tuning/jobs"
1218+
val Batches: Uri = uri"$baseUri/batches"
11361219
val Transcriptions: Uri = audioBase.addPath("transcriptions")
11371220
val Translations: Uri = audioBase.addPath("translations")
11381221
val VariationsImage: Uri = imageBase.addPath("variations")
@@ -1147,6 +1230,9 @@ private class OpenAIUris(val baseUri: Uri) {
11471230
def fineTuningJobCheckpoints(fineTuningJobId: String): Uri = fineTuningJob(fineTuningJobId).addPath("checkpoints")
11481231
def cancelFineTuningJob(fineTuningJobId: String): Uri = fineTuningJob(fineTuningJobId).addPath("cancel")
11491232

1233+
def batch(batchId: String): Uri = Batches.addPath(batchId)
1234+
def cancelBatch(batchId: String): Uri = batch(batchId).addPath("cancel")
1235+
11501236
def file(fileId: String): Uri = Files.addPath(fileId)
11511237
def fileContent(fileId: String): Uri = Files.addPath(fileId, "content")
11521238
def model(modelId: String): Uri = Models.addPath(modelId)

core/src/main/scala/sttp/openai/OpenAISyncClient.scala

+66-2
Original file line numberDiff line numberDiff line change
@@ -9,14 +9,14 @@ import sttp.openai.requests.audio.AudioResponseData.AudioResponse
99
import sttp.openai.requests.audio.RecognitionModel
1010
import sttp.openai.requests.audio.transcriptions.TranscriptionConfig
1111
import sttp.openai.requests.audio.translations.TranslationConfig
12+
import sttp.openai.requests.batch.{BatchRequestBody, BatchResponse, ListBatchResponse}
1213
import sttp.openai.requests.completions.CompletionsRequestBody.CompletionsBody
1314
import sttp.openai.requests.completions.CompletionsResponseData.CompletionsResponse
1415
import sttp.openai.requests.completions.chat.ChatRequestBody.ChatBody
1516
import sttp.openai.requests.completions.chat.ChatRequestResponseData.ChatResponse
1617
import sttp.openai.requests.embeddings.EmbeddingsRequestBody.EmbeddingsBody
1718
import sttp.openai.requests.embeddings.EmbeddingsResponseBody.EmbeddingResponse
1819
import sttp.openai.requests.files.FilesResponseData.{DeletedFileData, FileData, FilesResponse}
19-
import sttp.openai.requests.finetuning
2020
import sttp.openai.requests.finetuning._
2121
import sttp.openai.requests.images.ImageResponseData.ImageResponse
2222
import sttp.openai.requests.images.creation.ImageCreationRequestBody.ImageCreationBody
@@ -29,7 +29,7 @@ import sttp.openai.requests.threads.QueryParameters
2929
import sttp.openai.requests.threads.ThreadsRequestBody.CreateThreadBody
3030
import sttp.openai.requests.threads.ThreadsResponseData.{DeleteThreadResponse, ThreadData}
3131
import sttp.openai.requests.threads.messages.ThreadMessagesRequestBody.CreateMessage
32-
import sttp.openai.requests.threads.messages.ThreadMessagesResponseData.{ListMessagesResponse, MessageData}
32+
import sttp.openai.requests.threads.messages.ThreadMessagesResponseData.{DeleteMessageResponse, ListMessagesResponse, MessageData}
3333
import sttp.openai.requests.threads.runs.ThreadRunsRequestBody.{CreateRun, CreateThreadAndRun, ToolOutput}
3434
import sttp.openai.requests.threads.runs.ThreadRunsResponseData.{ListRunStepsResponse, ListRunsResponse, RunData, RunStepData}
3535
import sttp.openai.requests.vectorstore.VectorStoreRequestBody.{CreateVectorStoreBody, ModifyVectorStoreBody}
@@ -40,6 +40,7 @@ import sttp.openai.requests.vectorstore.file.VectorStoreFileResponseData.{
4040
ListVectorStoreFilesResponse,
4141
VectorStoreFile
4242
}
43+
import sttp.openai.requests.{batch, finetuning}
4344

4445
import java.io.File
4546

@@ -517,6 +518,22 @@ class OpenAISyncClient private (
517518
def modifyMessage(threadId: String, messageId: String, metadata: Map[String, String]): MessageData =
518519
sendOrThrow(openAI.modifyMessage(threadId, messageId, metadata))
519520

521+
/** Deletes a message.
522+
*
523+
* [[https://platform.openai.com/docs/api-reference/messages/deleteMessage]]
524+
*
525+
* @param threadId
526+
* The ID of the thread to which this message belongs.
527+
*
528+
* @param messageId
529+
* The ID of the message to delete.
530+
*
531+
* @return
532+
* Deletion status
533+
*/
534+
def deleteMessage(threadId: String, messageId: String): DeleteMessageResponse =
535+
sendOrThrow(openAI.deleteMessage(threadId, messageId))
536+
520537
/** Create an assistant with a model and instructions.
521538
*
522539
* [[https://platform.openai.com/docs/api-reference/assistants/createAssistant]]
@@ -798,6 +815,53 @@ class OpenAISyncClient private (
798815
def deleteVectorStoreFile(vectorStoreId: String, fileId: String): DeleteVectorStoreFileResponse =
799816
sendOrThrow(openAI.deleteVectorStoreFile(vectorStoreId, fileId))
800817

818+
/** Creates and executes a batch from an uploaded file of requests
819+
*
820+
* [[https://platform.openai.com/docs/api-reference/batch/create]]
821+
*
822+
* @param createBatchRequest
823+
* Request body that will be used to create a batch.
824+
* @return
825+
* The created Batch object.
826+
*/
827+
def createBatch(createBatchRequest: BatchRequestBody): BatchResponse =
828+
sendOrThrow(openAI.createBatch(createBatchRequest))
829+
830+
/** Retrieves a batch.
831+
*
832+
* [[https://platform.openai.com/docs/api-reference/batch/retrieve]]
833+
*
834+
* @param batchId
835+
* The ID of the batch to retrieve.
836+
* @return
837+
* The Batch object matching the specified ID.
838+
*/
839+
def retrieveBatch(batchId: String): BatchResponse =
840+
sendOrThrow(openAI.retrieveBatch(batchId))
841+
842+
/** Cancels an in-progress batch. The batch will be in status cancelling for up to 10 minutes, before changing to cancelled, where it will
843+
* have partial results (if any) available in the output file.
844+
*
845+
* [[https://platform.openai.com/docs/api-reference/batch/cancel]]
846+
*
847+
* @param batchId
848+
* The ID of the batch to cancel.
849+
* @return
850+
* The Batch object matching the specified ID.
851+
*/
852+
def cancelBatch(batchId: String): BatchResponse =
853+
sendOrThrow(openAI.cancelBatch(batchId))
854+
855+
/** List your organization's batches.
856+
*
857+
* [[https://platform.openai.com/docs/api-reference/batch/list]]
858+
*
859+
* @return
860+
* A list of paginated Batch objects.
861+
*/
862+
def listBatches(queryParameters: batch.QueryParameters = batch.QueryParameters.empty): ListBatchResponse =
863+
sendOrThrow(openAI.listBatches(queryParameters))
864+
801865
/** Closes and releases resources of http client if was not provided explicitly, otherwise works no-op. */
802866
def close(): Unit = if (closeClient) backend.close() else ()
803867

core/src/main/scala/sttp/openai/requests/assistants/AssistantsRequestBody.scala

+47-12
Original file line numberDiff line numberDiff line change
@@ -8,27 +8,31 @@ object AssistantsRequestBody {
88
/** @param model
99
* ID of the model to use. You can use the List models API to see all of your available models, or see our Model overview for
1010
* descriptions of them.
11-
*
1211
* @param name
1312
* The name of the assistant. The maximum length is 256 characters.
14-
*
1513
* @param description
1614
* The description of the assistant. The maximum length is 512 characters.
17-
*
1815
* @param instructions
1916
* The system instructions that the assistant uses. The maximum length is 32768 characters.
20-
*
17+
* @param reasoningEffort
18+
* o1 and o3-mini models only. Constrains effort on reasoning for reasoning models. Currently supported values are low, medium, and
19+
* high. Reducing reasoning effort can result in faster responses and fewer tokens used on reasoning in a response.
2120
* @param tools
2221
* A list of tools enabled on the assistant. There can be a maximum of 128 tools per assistant. Tools can be of types code_interpreter,
2322
* file_search, or function.
24-
*
2523
* @param toolResources
2624
* A set of resources that are used by the assistant's tools. The resources are specific to the type of tool. For example, the
2725
* code_interpreter tool requires a list of file IDs, while the file_search tool requires a list of vector store IDs.
28-
*
2926
* @param metadata
3027
* Set of 16 key-value pairs that can be attached to an object. This can be useful for storing additional information about the object
3128
* in a structured format. Keys can be a maximum of 64 characters long and values can be a maximum of 512 characters long.
29+
* @param temperature
30+
* What sampling temperature to use, between 0 and 2. Higher values like 0.8 will make the output more random, while lower values like
31+
* 0.2 will make it more focused and deterministic.
32+
* @param topP
33+
* An alternative to sampling with temperature, called nucleus sampling, where the model considers the results of the tokens with top_p
34+
* probability mass. So 0.1 means only the tokens comprising the top 10% probability mass are considered. We generally recommend
35+
* altering this or temperature but not both.
3236
*
3337
* For more information please visit: [[https://platform.openai.com/docs/api-reference/assistants/createAssistant]]
3438
*/
@@ -37,9 +41,12 @@ object AssistantsRequestBody {
3741
name: Option[String] = None,
3842
description: Option[String] = None,
3943
instructions: Option[String] = None,
44+
reasoningEffort: Option[ReasoningEffort] = None,
4045
tools: Seq[Tool] = Seq.empty,
4146
toolResources: Option[ToolResources] = None,
42-
metadata: Option[Map[String, String]] = None
47+
metadata: Option[Map[String, String]] = None,
48+
temperature: Option[Float] = None,
49+
topP: Option[Float] = None
4350
)
4451
object CreateAssistantBody {
4552
implicit val createAssistantBodyW: SnakePickle.Writer[CreateAssistantBody] = SnakePickle.macroW[CreateAssistantBody]
@@ -48,26 +55,33 @@ object AssistantsRequestBody {
4855
/** @param model
4956
* ID of the model to use. You can use the List models API to see all of your available models, or see our Model overview for
5057
* descriptions of them.
51-
*
5258
* @param name
5359
* The name of the assistant. The maximum length is 256 characters.
54-
*
5560
* @param description
5661
* The description of the assistant. The maximum length is 512 characters.
57-
*
5862
* @param instructions
5963
* The system instructions that the assistant uses. The maximum length is 32768 characters.
64+
* @param reasoningEffort
65+
* o1 and o3-mini models only
6066
*
67+
* Constrains effort on reasoning for reasoning models. Currently supported values are low, medium, and high. Reducing reasoning effort
68+
* can result in faster responses and fewer tokens used on reasoning in a response.
6169
* @param tools
6270
* A list of tools enabled on the assistant. There can be a maximum of 128 tools per assistant. Tools can be of types code_interpreter,
6371
* file_search, or function.
64-
*
6572
* @param toolResources
6673
* A set of resources that are used by the assistant's tools. The resources are specific to the type of tool. For example, the
6774
* code_interpreter tool requires a list of file IDs, while the file_search tool requires a list of vector store IDs.
6875
* @param metadata
6976
* Set of 16 key-value pairs that can be attached to an object. This can be useful for storing additional information about the object
7077
* in a structured format. Keys can be a maximum of 64 characters long and values can be a maximum of 512 characters long.
78+
* @param temperature
79+
* What sampling temperature to use, between 0 and 2. Higher values like 0.8 will make the output more random, while lower values like
80+
* 0.2 will make it more focused and deterministic.
81+
* @param topP
82+
* An alternative to sampling with temperature, called nucleus sampling, where the model considers the results of the tokens with top_p
83+
* probability mass. So 0.1 means only the tokens comprising the top 10% probability mass are considered. We generally recommend
84+
* altering this or temperature but not both.
7185
*
7286
* For more information please visit: [[https://platform.openai.com/docs/api-reference/assistants/modifyAssistant]]
7387
*/
@@ -76,12 +90,33 @@ object AssistantsRequestBody {
7690
name: Option[String] = None,
7791
description: Option[String] = None,
7892
instructions: Option[String] = None,
93+
reasoningEffort: Option[ReasoningEffort] = None,
7994
tools: Seq[Tool] = Seq.empty,
8095
toolResources: Option[ToolResources] = None,
81-
metadata: Map[String, String] = Map.empty
96+
metadata: Map[String, String] = Map.empty,
97+
temperature: Option[Float] = None,
98+
topP: Option[Float] = None
8299
)
83100

84101
object ModifyAssistantBody {
85102
implicit val modifyAssistantBodyW: SnakePickle.Writer[ModifyAssistantBody] = SnakePickle.macroW[ModifyAssistantBody]
86103
}
87104
}
105+
106+
sealed abstract class ReasoningEffort(val value: String)
107+
108+
object ReasoningEffort {
109+
110+
implicit val reasoningEffortW: SnakePickle.Writer[ReasoningEffort] = SnakePickle
111+
.writer[ujson.Value]
112+
.comap[ReasoningEffort](reasoningEffort => SnakePickle.writeJs(reasoningEffort.value))
113+
114+
case object Low extends ReasoningEffort("low")
115+
116+
case object Medium extends ReasoningEffort("medium")
117+
118+
case object High extends ReasoningEffort("high")
119+
120+
case class CustomReasoningEffort(customReasoningEffort: String) extends ReasoningEffort(customReasoningEffort)
121+
122+
}

0 commit comments

Comments
 (0)