simple_streaming_kimi-k2_wandb.yaml

 1---
 2version: 2
 3interactions:
 4  - id: 0
 5    request:
 6        proto: HTTP/1.1
 7        proto_major: 1
 8        proto_minor: 1
 9        content_length: 282
10        host: ""
11        body: '{"messages":[{"content":"You are a helpful assistant","role":"system"},{"content":"Say hi in Portuguese","role":"user"}],"model":"moonshotai/kimi-k2-0905","max_tokens":4000,"stream_options":{"include_usage":true},"provider":{"only":["wandb"]},"usage":{"include":true},"stream":true}'
12        headers:
13            Accept:
14              - application/json
15            Content-Type:
16              - application/json
17            User-Agent:
18              - OpenAI/Go 2.3.0
19        url: https://openrouter.ai/api/v1/chat/completions
20        method: POST
21    response:
22        proto: HTTP/2.0
23        proto_major: 2
24        proto_minor: 0
25        content_length: -1
26        body: '{"error":{"message":"Provider returned error","code":429,"metadata":{"raw":"moonshotai/kimi-k2-0905 is temporarily rate-limited upstream. Please retry shortly, or add your own key to accumulate your rate limits: https://openrouter.ai/settings/integrations","provider_name":"WandB"}},"user_id":"user_2zMGmKqlf4zmAvL9snVImB1Z1ZQ"}'
27        headers:
28            Content-Type:
29              - application/json
30        status: 429 Too Many Requests
31        code: 429
32        duration: 641.195667ms
33  - id: 1
34    request:
35        proto: HTTP/1.1
36        proto_major: 1
37        proto_minor: 1
38        content_length: 282
39        host: ""
40        body: '{"messages":[{"content":"You are a helpful assistant","role":"system"},{"content":"Say hi in Portuguese","role":"user"}],"model":"moonshotai/kimi-k2-0905","max_tokens":4000,"stream_options":{"include_usage":true},"provider":{"only":["wandb"]},"usage":{"include":true},"stream":true}'
41        headers:
42            Accept:
43              - application/json
44            Content-Type:
45              - application/json
46            User-Agent:
47              - OpenAI/Go 2.3.0
48        url: https://openrouter.ai/api/v1/chat/completions
49        method: POST
50    response:
51        proto: HTTP/2.0
52        proto_major: 2
53        proto_minor: 0
54        content_length: -1
55        body: |+
56            data: {"id":"gen-1758698629-5CNlN3eN3r4JHgnIsxJp","provider":"WandB","model":"moonshotai/kimi-k2-0905","object":"chat.completion.chunk","created":1758698629,"choices":[{"index":0,"delta":{"role":"assistant","content":""},"finish_reason":null,"native_finish_reason":null,"logprobs":null}]}
57
58            data: {"id":"gen-1758698629-5CNlN3eN3r4JHgnIsxJp","provider":"WandB","model":"moonshotai/kimi-k2-0905","object":"chat.completion.chunk","created":1758698629,"choices":[{"index":0,"delta":{"role":"assistant","content":"Oi"},"finish_reason":null,"native_finish_reason":null,"logprobs":null}]}
59
60            data: {"id":"gen-1758698629-5CNlN3eN3r4JHgnIsxJp","provider":"WandB","model":"moonshotai/kimi-k2-0905","object":"chat.completion.chunk","created":1758698629,"choices":[{"index":0,"delta":{"role":"assistant","content":"!"},"finish_reason":null,"native_finish_reason":null,"logprobs":null}]}
61
62            data: {"id":"gen-1758698629-5CNlN3eN3r4JHgnIsxJp","provider":"WandB","model":"moonshotai/kimi-k2-0905","object":"chat.completion.chunk","created":1758698629,"choices":[{"index":0,"delta":{"role":"assistant","content":""},"finish_reason":"stop","native_finish_reason":"stop","logprobs":null}]}
63
64            data: {"id":"gen-1758698629-5CNlN3eN3r4JHgnIsxJp","provider":"WandB","model":"moonshotai/kimi-k2-0905","object":"chat.completion.chunk","created":1758698629,"choices":[{"index":0,"delta":{"role":"assistant","content":""},"finish_reason":null,"native_finish_reason":null,"logprobs":null}],"usage":{"prompt_tokens":20,"completion_tokens":3,"total_tokens":23,"cost":0.000039,"is_byok":false,"prompt_tokens_details":{"cached_tokens":0,"audio_tokens":0},"cost_details":{"upstream_inference_cost":null,"upstream_inference_prompt_cost":0.000027,"upstream_inference_completions_cost":0.000012},"completion_tokens_details":{"reasoning_tokens":0,"image_tokens":0}}}
65
66            data: [DONE]
67
68        headers:
69            Content-Type:
70              - text/event-stream
71        status: 200 OK
72        code: 200
73        duration: 523.797417ms