Fixing missing `object` field for regular completions.

This commit is contained in:
Nicolas Patry 2024-07-03 10:40:22 +00:00
parent 571530dd9a
commit 2bbb7fa4b2
No known key found for this signature in database
GPG Key ID: B154A218C20EBBCA
3 changed files with 118 additions and 20 deletions

View File

@ -946,6 +946,38 @@
} }
} }
}, },
"Chunk": {
"type": "object",
"required": [
"id",
"created",
"choices",
"model",
"system_fingerprint"
],
"properties": {
"choices": {
"type": "array",
"items": {
"$ref": "#/components/schemas/CompletionComplete"
}
},
"created": {
"type": "integer",
"format": "int64",
"minimum": 0
},
"id": {
"type": "string"
},
"model": {
"type": "string"
},
"system_fingerprint": {
"type": "string"
}
}
},
"CompatGenerateRequest": { "CompatGenerateRequest": {
"type": "object", "type": "object",
"required": [ "required": [
@ -965,6 +997,55 @@
} }
} }
}, },
"Completion": {
"oneOf": [
{
"allOf": [
{
"$ref": "#/components/schemas/Chunk"
},
{
"type": "object",
"required": [
"object"
],
"properties": {
"object": {
"type": "string",
"enum": [
"text_completion"
]
}
}
}
]
},
{
"allOf": [
{
"$ref": "#/components/schemas/CompletionFinal"
},
{
"type": "object",
"required": [
"object"
],
"properties": {
"object": {
"type": "string",
"enum": [
"text_completion"
]
}
}
}
]
}
],
"discriminator": {
"propertyName": "object"
}
},
"CompletionComplete": { "CompletionComplete": {
"type": "object", "type": "object",
"required": [ "required": [
@ -994,14 +1075,15 @@
} }
} }
}, },
"CompletionCompleteChunk": { "CompletionFinal": {
"type": "object", "type": "object",
"required": [ "required": [
"id", "id",
"created", "created",
"choices",
"model", "model",
"system_fingerprint" "system_fingerprint",
"choices",
"usage"
], ],
"properties": { "properties": {
"choices": { "choices": {
@ -1013,16 +1095,21 @@
"created": { "created": {
"type": "integer", "type": "integer",
"format": "int64", "format": "int64",
"example": "1706270835",
"minimum": 0 "minimum": 0
}, },
"id": { "id": {
"type": "string" "type": "string"
}, },
"model": { "model": {
"type": "string" "type": "string",
"example": "mistralai/Mistral-7B-Instruct-v0.2"
}, },
"system_fingerprint": { "system_fingerprint": {
"type": "string" "type": "string"
},
"usage": {
"$ref": "#/components/schemas/Usage"
} }
} }
}, },

View File

@ -433,8 +433,17 @@ pub struct CompletionRequest {
pub stop: Option<Vec<String>>, pub stop: Option<Vec<String>>,
} }
#[derive(Clone, Serialize, ToSchema)]
#[serde(tag = "object")]
enum Completion {
#[serde(rename = "text_completion")]
Chunk(Chunk),
#[serde(rename = "text_completion")]
Final(CompletionFinal),
}
#[derive(Clone, Deserialize, Serialize, ToSchema, Default)] #[derive(Clone, Deserialize, Serialize, ToSchema, Default)]
pub(crate) struct Completion { pub(crate) struct CompletionFinal {
pub id: String, pub id: String,
#[schema(example = "1706270835")] #[schema(example = "1706270835")]
pub created: u64, pub created: u64,
@ -453,6 +462,15 @@ pub(crate) struct CompletionComplete {
pub finish_reason: String, pub finish_reason: String,
} }
#[derive(Clone, Deserialize, Serialize, ToSchema)]
pub(crate) struct Chunk {
pub id: String,
pub created: u64,
pub choices: Vec<CompletionComplete>,
pub model: String,
pub system_fingerprint: String,
}
#[derive(Clone, Deserialize, Serialize, ToSchema)] #[derive(Clone, Deserialize, Serialize, ToSchema)]
pub(crate) struct ChatCompletion { pub(crate) struct ChatCompletion {
pub id: String, pub id: String,
@ -614,15 +632,6 @@ impl ChatCompletion {
} }
} }
} }
#[derive(Clone, Deserialize, Serialize, ToSchema)]
pub(crate) struct CompletionCompleteChunk {
pub id: String,
pub created: u64,
pub choices: Vec<CompletionComplete>,
pub model: String,
pub system_fingerprint: String,
}
#[derive(Clone, Serialize, ToSchema)] #[derive(Clone, Serialize, ToSchema)]
pub(crate) struct ChatCompletionChunk { pub(crate) struct ChatCompletionChunk {
pub id: String, pub id: String,

View File

@ -19,7 +19,7 @@ use crate::{
use crate::{ use crate::{
ChatCompletion, ChatCompletionChoice, ChatCompletionChunk, ChatCompletionComplete, ChatCompletion, ChatCompletionChoice, ChatCompletionChunk, ChatCompletionComplete,
ChatCompletionDelta, ChatCompletionLogprob, ChatCompletionLogprobs, ChatCompletionTopLogprob, ChatCompletionDelta, ChatCompletionLogprob, ChatCompletionLogprobs, ChatCompletionTopLogprob,
ChatRequest, CompatGenerateRequest, Completion, CompletionComplete, CompletionCompleteChunk, ChatRequest, Chunk, CompatGenerateRequest, Completion, CompletionComplete, CompletionFinal,
CompletionRequest, CompletionType, DeltaToolCall, Function, Tool, VertexRequest, CompletionRequest, CompletionType, DeltaToolCall, Function, Tool, VertexRequest,
VertexResponse, VertexResponse,
}; };
@ -705,7 +705,7 @@ async fn completions(
.as_secs(); .as_secs();
event event
.json_data(CompletionCompleteChunk { .json_data(Completion::Chunk(Chunk {
id: "".to_string(), id: "".to_string(),
created: current_time, created: current_time,
@ -718,7 +718,7 @@ async fn completions(
model: model_id.clone(), model: model_id.clone(),
system_fingerprint: system_fingerprint.clone(), system_fingerprint: system_fingerprint.clone(),
}) }))
.unwrap_or_else(|_e| Event::default()) .unwrap_or_else(|_e| Event::default())
}; };
@ -931,7 +931,7 @@ async fn completions(
.collect::<Result<Vec<_>, _>>() .collect::<Result<Vec<_>, _>>()
.map_err(|(status, Json(err))| (status, Json(err)))?; .map_err(|(status, Json(err))| (status, Json(err)))?;
let response = Completion { let response = Completion::Final(CompletionFinal {
id: "".to_string(), id: "".to_string(),
created: current_time, created: current_time,
model: info.model_id.clone(), model: info.model_id.clone(),
@ -946,7 +946,7 @@ async fn completions(
completion_tokens, completion_tokens,
total_tokens, total_tokens,
}, },
}; });
// headers similar to `generate` but aggregated // headers similar to `generate` but aggregated
let mut headers = HeaderMap::new(); let mut headers = HeaderMap::new();
@ -1464,7 +1464,9 @@ pub async fn run(
ChatCompletion, ChatCompletion,
CompletionRequest, CompletionRequest,
CompletionComplete, CompletionComplete,
CompletionCompleteChunk, Chunk,
Completion,
CompletionFinal,
GenerateParameters, GenerateParameters,
PrefillToken, PrefillToken,
Token, Token,