OpenAI APIs · Schema
TranscriptionResponse
Artificial Intelligence · Embeddings · Image Generation · Language Models · Speech
Properties
| Name | Type | Description |
|---|---|---|
| text | string | The transcribed text |
| task | string | The task performed (transcribe) |
| language | string | The detected or specified language |
| duration | number | The duration of the audio in seconds |
| words | array | Word-level timestamps (when requested) |
| segments | array | Segment-level timestamps (when requested) |
JSON Schema
{
"$schema": "https://json-schema.org/draft/2020-12/schema",
"$id": "#/components/schemas/TranscriptionResponse",
"title": "TranscriptionResponse",
"type": "object",
"properties": {
"text": {
"type": "string",
"description": "The transcribed text"
},
"task": {
"type": "string",
"description": "The task performed (transcribe)"
},
"language": {
"type": "string",
"description": "The detected or specified language"
},
"duration": {
"type": "number",
"description": "The duration of the audio in seconds"
},
"words": {
"type": "array",
"items": {
"type": "object",
"properties": {
"word": {
"type": "string"
},
"start": {
"type": "number"
},
"end": {
"type": "number"
}
}
},
"description": "Word-level timestamps (when requested)"
},
"segments": {
"type": "array",
"items": {
"type": "object",
"properties": {
"id": {
"type": "integer"
},
"start": {
"type": "number"
},
"end": {
"type": "number"
},
"text": {
"type": "string"
}
}
},
"description": "Segment-level timestamps (when requested)"
}
}
}