That is because I believe the blog was pulled, so you were seeing a cached version that is no longer
That is because I believe the blog was pulled, so you were seeing a cached version that is no longer there.

refusal on the Anthropic API to be successful. https://docs.anthropic.com/en/docs/test-and-evaluate/strengthen-guardrails/handle-streaming-refusals#implementation-guide


error while building embeddings during the sync.
Have you set up "Authenticated Gateway" on the settings page?
yes
and passed the token in the cf-aig-authorization header as a bearer token?
no. I found no place for that.
refusal
models/gemini-2.5-flash-lite is not found for API version v1, or is not supported for generateContent. Call ListModels to see the list of available models and their supported methods.
curl -X POST https://gateway.ai.cloudflare.com/v1/<cloudflare-account-id>/<gateway-name>/groq/audio/transcriptions \
-H "Content-Type: multipart/form-data" \
-H "Authorization: Bearer <token>" \
-F "model=whisper-large-v3-turbo" \
-F "file=@/path/to/audio.mp3"
{"error":{"message":"could not process file - is it a valid media file?","type":"invalid_request_error"}}
error
{
"error": {
"message": "You didn't provide an API key. You need to provide your API key in an Authorization header using Bearer auth (i.e. Authorization: Bearer YOUR_KEY), or as the password field (with blank username) if you're accessing the API from your browser and are prompted for a username and password. You can obtain an API key from https://platform.openai.com/account/api-keys.",
"type": "invalid_request_error",
"param": null,
"code": null
}
}
"usage": {
"input_tokens": 0,
"cache_creation_input_tokens": 575,
"cache_read_input_tokens": 106910,
"cache_creation": {
"ephemeral_5m_input_tokens": 575,
"ephemeral_1h_input_tokens": 0
},
"output_tokens": 957,
"service_tier": "standard"
}
{
"id": "msg_01HCDu5LRGeP2o7s2xGmxyx8",
"type": "message",
"role": "assistant",
"model": "claude-opus-4-1-20250805",
"content": "",
"stop_reason": null,
"stop_sequence": null,
"usage": {
"input_tokens": 9,
"cache_creation_input_tokens": 16203,
"cache_read_input_tokens": 0,
"cache_creation": {
"ephemeral_5m_input_tokens": 16203,
"ephemeral_1h_input_tokens": 0
},
"output_tokens": 0
},
"streamed_data": [
{
"nonce": "e8071956",
"type": "message_start",
"message": {
"id": "msg_01HCDu5LRGeP2o7s2xGmxyx8",
"type": "message",
"role": "assistant",
"model": "claude-opus-4-1-20250805",
"content": [],
"stop_reason": null,
"stop_sequence": null,
"usage": {
"input_tokens": 9,
"cache_creation_input_tokens": 16203,
"cache_read_input_tokens": 0,
"cache_creation": {
"ephemeral_5m_input_tokens": 16203,
"ephemeral_1h_input_tokens": 0
},
"output_tokens": 0
}
}
},
{
"type": "message_delta",
"delta": {
"stop_reason": "refusal",
"stop_sequence": null
},
"usage": {
"input_tokens": 9,
"cache_creation_input_tokens": 16203,
"cache_read_input_tokens": 0,
"output_tokens": 0
}
},
{
"nonce": "8aeda459",
"type": "message_stop"
}
]
}
curl -N -X POST https://gateway.ai.cloudflare.com/v1/{account_id}/{gateway_id}/compat/chat/completions \
--header 'Authorization: Bearer {GOOGLE_GENERATIVE_AI_API_KEY}' \
--header 'Content-Type: application/json' \
--header 'Accept: text/event-stream' \
--header 'Cache-Control: no-cache' \
--data '{
"model": "google-ai-studio/gemini-2.0-flash",
"messages": [
{
"role": "user",
"content": "What is Cloudflare?"
}
],
"stream": true,
"temperature": 0.7,
"max_tokens": 1000
}' | while IFS= read -r line; do
echo "[$(date '+%H:%M:%S.%3N')] $line"
done