Blog Post
A New Chapter for Realtime AI: Reasoning, Translation, and Real-Time Transcription
The new models are not available in our subscription, and there is no indication anywhere of how to request them or whom to contact. Why does MS do this for every Foundry release? You guys are making it really hard to love Foundry.
% az cognitiveservices account list-models \
--resource-group AIFOUNDRY-REALTIME \
--name XXXX \
-o json | jq '.[] | select((.name // "") | contains("gpt-realtime"))'
{
"baseModel": null,
"callRateLimit": null,
"capabilities": {
"assistants": "false",
"chatCompletion": "false",
"completion": "false",
"realtime": "true"
},
"deprecation": {
"fineTune": null,
"inference": "2027-02-28T00:00:00Z"
},
"finetuneCapabilities": null,
"format": "OpenAI",
"isDefaultVersion": false,
"lifecycleStatus": "GenerallyAvailable",
"maxCapacity": 3,
"name": "gpt-realtime",
"skus": [
{
"capacity": {
"default": 100,
"maximum": 30000,
"minimum": null,
"step": null
},
"deprecationDate": "2027-02-28T00:00:00+00:00",
"name": "GlobalStandard",
"rateLimits": [
{
"count": 20.0,
"key": "request",
"renewalPeriod": 60.0,
"rules": null
},
{
"count": 10000.0,
"key": "token",
"renewalPeriod": 60.0,
"rules": null
}
],
"usageName": "OpenAI.GlobalStandard.gpt-realtime"
}
],
"source": null,
"systemData": {
"createdAt": "2025-08-28T00:00:00+00:00",
"createdBy": "Microsoft",
"createdByType": "Application",
"lastModifiedAt": "2025-08-28T00:00:00+00:00",
"lastModifiedBy": "Microsoft",
"lastModifiedByType": "Application"
},
"version": "2025-08-28"
}
{
"baseModel": null,
"callRateLimit": null,
"capabilities": {
"assistants": "false",
"chatCompletion": "false",
"completion": "false",
"realtime": "true"
},
"deprecation": {
"fineTune": null,
"inference": "2027-04-07T00:00:00Z"
},
"finetuneCapabilities": null,
"format": "OpenAI",
"isDefaultVersion": false,
"lifecycleStatus": "GenerallyAvailable",
"maxCapacity": 3,
"name": "gpt-realtime-mini",
"skus": [
{
"capacity": {
"default": 100,
"maximum": 30000,
"minimum": null,
"step": null
},
"deprecationDate": "2027-04-07T00:00:00+00:00",
"name": "GlobalStandard",
"rateLimits": [
{
"count": 10.0,
"key": "request",
"renewalPeriod": 60.0,
"rules": null
},
{
"count": 5000.0,
"key": "token",
"renewalPeriod": 60.0,
"rules": null
}
],
"usageName": "OpenAI.GlobalStandard.gpt-realtime-mini"
}
],
"source": null,
"systemData": {
"createdAt": "2025-10-06T00:00:00+00:00",
"createdBy": "Microsoft",
"createdByType": "Application",
"lastModifiedAt": "2025-10-06T00:00:00+00:00",
"lastModifiedBy": "Microsoft",
"lastModifiedByType": "Application"
},
"version": "2025-10-06"
}
{
"baseModel": null,
"callRateLimit": null,
"capabilities": {
"assistants": "false",
"chatCompletion": "false",
"completion": "false",
"realtime": "true"
},
"deprecation": {
"fineTune": null,
"inference": "2026-12-15T00:00:00Z"
},
"finetuneCapabilities": null,
"format": "OpenAI",
"isDefaultVersion": true,
"lifecycleStatus": "GenerallyAvailable",
"maxCapacity": 3,
"name": "gpt-realtime-mini",
"skus": [
{
"capacity": {
"default": 100,
"maximum": 30000,
"minimum": null,
"step": null
},
"deprecationDate": "2026-12-15T00:00:00+00:00",
"name": "GlobalStandard",
"rateLimits": [
{
"count": 3.0,
"key": "request",
"renewalPeriod": 60.0,
"rules": null
},
{
"count": 10000.0,
"key": "token",
"renewalPeriod": 60.0,
"rules": null
}
],
"usageName": "OpenAI.GlobalStandard.gpt-realtime-mini"
}
],
"source": null,
"systemData": {
"createdAt": "2025-12-11T00:00:00+00:00",
"createdBy": "Microsoft",
"createdByType": "Application",
"lastModifiedAt": "2025-12-11T00:00:00+00:00",
"lastModifiedBy": "Microsoft",
"lastModifiedByType": "Application"
},
"version": "2025-12-15"
}
{
"baseModel": null,
"callRateLimit": null,
"capabilities": {
"assistants": "false",
"chatCompletion": "false",
"completion": "false",
"realtime": "true"
},
"deprecation": {
"fineTune": null,
"inference": "2027-02-23T00:00:00Z"
},
"finetuneCapabilities": null,
"format": "OpenAI",
"isDefaultVersion": false,
"lifecycleStatus": "GenerallyAvailable",
"maxCapacity": 3,
"name": "gpt-realtime-1.5",
"skus": [
{
"capacity": {
"default": 100,
"maximum": 30000,
"minimum": null,
"step": null
},
"deprecationDate": "2027-02-23T00:00:00+00:00",
"name": "GlobalStandard",
"rateLimits": [
{
"count": 20.0,
"key": "request",
"renewalPeriod": 60.0,
"rules": null
},
{
"count": 10000.0,
"key": "token",
"renewalPeriod": 60.0,
"rules": null
}
],
"usageName": "OpenAI.GlobalStandard.gpt-realtime-1.5"
}
],
"source": null,
"systemData": {
"createdAt": "2026-02-23T00:00:00+00:00",
"createdBy": "Microsoft",
"createdByType": "Application",
"lastModifiedAt": "2026-02-23T00:00:00+00:00",
"lastModifiedBy": "Microsoft",
"lastModifiedByType": "Application"
},
"version": "2026-02-23"
}