Failed to load versions. Head to the versions page to see all versions for this model.
You're looking at a specific version of this model. Jump to the model overview.
zsxkib /kimi-audio-7b-instruct:7500b323
Input
Run this model in Node.js with one line of code:
npm install replicate
Set the REPLICATE_API_TOKEN environment variable:
export REPLICATE_API_TOKEN=<paste-your-token-here>
Find your API token in your account settings.
import Replicate from "replicate";
// Build the API client, authenticating with the token read from the
// REPLICATE_API_TOKEN environment variable.
const { REPLICATE_API_TOKEN: apiToken } = process.env;
const replicate = new Replicate({ auth: apiToken });
Run zsxkib/kimi-audio-7b-instruct using Replicate's API. Check out the model's schema for an overview of inputs and outputs.
// Model reference, pinned to one specific version hash.
const modelRef =
  "zsxkib/kimi-audio-7b-instruct:7500b32387695e89da3d09271850319ba027969f0c714dfc226361609ff29f2b";

// Input values sent to the model for this run.
const input = {
  audio: "https://replicate.delivery/pbxt/MvvJqBrVl5ss7Q8v1ofoqrDevThwTTx2oybmqO6mfkv4NXBd/example_prompt.mp3",
  prompt: "convert audio to text",
  text_top_k: 5,
  audio_top_k: 10,
  output_type: "text",
  return_json: true,
  text_temperature: 0,
  audio_temperature: 0.8,
  text_repetition_penalty: 1,
  audio_repetition_penalty: 1,
  text_repetition_window_size: 16,
  audio_repetition_window_size: 64,
};

// Run the model through the client and print whatever it returns.
const output = await replicate.run(modelRef, { input });
console.log(output);
To learn more, take a look at the guide on getting started with Node.js.
pip install replicate
Set the REPLICATE_API_TOKEN environment variable:
export REPLICATE_API_TOKEN=<paste-your-token-here>
Find your API token in your account settings.
import replicate
Run zsxkib/kimi-audio-7b-instruct using Replicate's API. Check out the model's schema for an overview of inputs and outputs.
# Model reference, pinned to one specific version hash.
model_ref = "zsxkib/kimi-audio-7b-instruct:7500b32387695e89da3d09271850319ba027969f0c714dfc226361609ff29f2b"

# Input values sent to the model for this run.
model_input = {
    "audio": "https://replicate.delivery/pbxt/MvvJqBrVl5ss7Q8v1ofoqrDevThwTTx2oybmqO6mfkv4NXBd/example_prompt.mp3",
    "prompt": "convert audio to text",
    "text_top_k": 5,
    "audio_top_k": 10,
    "output_type": "text",
    "return_json": True,
    "text_temperature": 0,
    "audio_temperature": 0.8,
    "text_repetition_penalty": 1,
    "audio_repetition_penalty": 1,
    "text_repetition_window_size": 16,
    "audio_repetition_window_size": 64,
}

# Run the model through the client and print whatever it returns.
output = replicate.run(model_ref, input=model_input)
print(output)
To learn more, take a look at the guide on getting started with Python.
Set the REPLICATE_API_TOKEN environment variable:
export REPLICATE_API_TOKEN=<paste-your-token-here>
Find your API token in your account settings.
Run zsxkib/kimi-audio-7b-instruct using Replicate's API. Check out the model's schema for an overview of inputs and outputs.
# Create a prediction by POSTing a JSON body to the Replicate predictions endpoint.
# Authenticates with the bearer token read from $REPLICATE_API_TOKEN.
# The JSON body names the model version to run and the input values for it.
# The body is written with ANSI-C quoting ($'...'), so run this in a shell that
# supports that syntax (e.g. bash).
# NOTE(review): "Prefer: wait" presumably asks the API to hold the request open
# until the prediction finishes; confirm against the HTTP API reference.
curl -s -X POST \
-H "Authorization: Bearer $REPLICATE_API_TOKEN" \
-H "Content-Type: application/json" \
-H "Prefer: wait" \
-d $'{
"version": "zsxkib/kimi-audio-7b-instruct:7500b32387695e89da3d09271850319ba027969f0c714dfc226361609ff29f2b",
"input": {
"audio": "https://replicate.delivery/pbxt/MvvJqBrVl5ss7Q8v1ofoqrDevThwTTx2oybmqO6mfkv4NXBd/example_prompt.mp3",
"prompt": "convert audio to text",
"text_top_k": 5,
"audio_top_k": 10,
"output_type": "text",
"return_json": true,
"text_temperature": 0,
"audio_temperature": 0.8,
"text_repetition_penalty": 1,
"audio_repetition_penalty": 1,
"text_repetition_window_size": 16,
"audio_repetition_window_size": 64
}
}' \
https://api.replicate.com/v1/predictions
To learn more, take a look at Replicate's HTTP API reference docs.
Add a payment method to run this model.
By signing in, you agree to our
terms of service and privacy policy
Output
{
"completed_at": "2025-05-01T14:49:35.137147Z",
"created_at": "2025-05-01T14:49:34.483000Z",
"data_removed": false,
"error": null,
"id": "02q9mmga2drmc0cphh9sfv43h4",
"input": {
"audio": "https://replicate.delivery/pbxt/MvvJqBrVl5ss7Q8v1ofoqrDevThwTTx2oybmqO6mfkv4NXBd/example_prompt.mp3",
"prompt": "convert audio to text",
"text_top_k": 5,
"audio_top_k": 10,
"output_type": "text",
"return_json": true,
"text_temperature": 0,
"audio_temperature": 0.8,
"text_repetition_penalty": 1,
"audio_repetition_penalty": 1,
"text_repetition_window_size": 16,
"audio_repetition_window_size": 64
},
"logs": "Generating tokens: 0%| | 0/7444 [00:00<?, ?it/s]\nGenerating tokens: 0%| | 4/7444 [00:00<03:50, 32.32it/s]\nGenerating tokens: 0%| | 8/7444 [00:00<03:40, 33.67it/s]\nGenerating tokens: 0%| | 12/7444 [00:00<03:37, 34.09it/s]\nGenerating tokens: 0%| | 16/7444 [00:00<03:36, 34.32it/s]\nGenerating tokens: 0%| | 16/7444 [00:00<03:51, 32.06it/s]\n>>> output text: Open waits text to dialogue model. You get full control over scripts and voices.\nWritten output to /tmp/output/output.txt",
"metrics": {
"predict_time": 0.647011726,
"total_time": 0.654147
},
"output": {
"json_str": "Open waits text to dialogue model. You get full control over scripts and voices.",
"media_path": null
},
"started_at": "2025-05-01T14:49:34.490135Z",
"status": "succeeded",
"urls": {
"get": "https://api.replicate.com/v1/predictions/02q9mmga2drmc0cphh9sfv43h4",
"cancel": "https://api.replicate.com/v1/predictions/02q9mmga2drmc0cphh9sfv43h4/cancel"
},
"version": "7500b32387695e89da3d09271850319ba027969f0c714dfc226361609ff29f2b"
}
Generating tokens: 0%| | 0/7444 [00:00<?, ?it/s]
Generating tokens: 0%| | 4/7444 [00:00<03:50, 32.32it/s]
Generating tokens: 0%| | 8/7444 [00:00<03:40, 33.67it/s]
Generating tokens: 0%| | 12/7444 [00:00<03:37, 34.09it/s]
Generating tokens: 0%| | 16/7444 [00:00<03:36, 34.32it/s]
Generating tokens: 0%| | 16/7444 [00:00<03:51, 32.06it/s]
>>> output text: Open waits text to dialogue model. You get full control over scripts and voices.
Written output to /tmp/output/output.txt