zsxkib/hailuo-02-with-sound
minimax/hailuo-02 + topazlabs/video-upscale + zsxkib/thinksound
        
          
            
          
          Public
        
      
      
        
          
            
          
          31
            runs
          
        
        
          
            
            
              Run zsxkib/hailuo-02-with-sound with an API
Use one of our client libraries to get started quickly. Clicking on a library will take you to the Playground tab where you can tweak different inputs, see the results, and copy the corresponding code to use in your own project.
            
              
                
              
            
            Input schema
          
          The fields you can use to run this model with an API. If you don't give a value for a field, its default value will be used.
| Field | Type | Default value | Description | 
|---|---|---|---|
| prompt | 
            string
            
           |  | 
            Text prompt for generation
           | 
| first_frame_image | 
            string
            
           |  | 
            First frame image for video generation. The output video will have the same aspect ratio as this image.
           | 
| duration | 
            integer
            
           | 
              6
             | 
            Duration of the video in seconds. 10 seconds is only available for 768p resolution.
           | 
| resolution | 
            string
            
           | 
              1080p
             | 
            Pick between standard 768p, or pro 1080p resolution. The pro model is not just high resolution, it is also higher quality.
           | 
| prompt_optimizer | 
            boolean
            
           | 
              True
             | 
            Use prompt optimizer
           | 
| enable_upscaling | 
            boolean
            
           | 
              True
             | 
            Enable video upscaling (disable for faster processing)
           | 
| target_resolution | 
            string
            
           | 
              1080p
             | 
            Target resolution for upscaling (one of: 1080p, 2k, 4k)
           | 
| target_fps | 
            integer
            
           | 
              60
             Min: 15 Max: 120 | 
            Target FPS (choose from 15fps to 120fps)
           | 
| enable_sound | 
            boolean
            
           | 
              True
             | 
            Enable AI-generated sound (disable for silent video)
           | 
| context_hint | 
            string
            
           |  | 
            Optional context hint to help with challenging videos (e.g., 'fireworks video', 'cat playing', 'machinery sounds')
           | 
{
  "type": "object",
  "title": "Input",
  "required": [
    "prompt"
  ],
  "properties": {
    "prompt": {
      "type": "string",
      "title": "Prompt",
      "x-order": 0,
      "description": "Text prompt for generation"
    },
    "duration": {
      "enum": [
        6,
        10
      ],
      "type": "integer",
      "title": "duration",
      "description": "Duration of the video in seconds. 10 seconds is only available for 768p resolution.",
      "default": 6,
      "x-order": 2
    },
    "resolution": {
      "enum": [
        "768p",
        "1080p"
      ],
      "type": "string",
      "title": "resolution",
      "description": "Pick between standard 768p, or pro 1080p resolution. The pro model is not just high resolution, it is also higher quality.",
      "default": "1080p",
      "x-order": 3
    },
    "target_fps": {
      "type": "integer",
      "title": "Target Fps",
      "default": 60,
      "maximum": 120,
      "minimum": 15,
      "x-order": 7,
      "description": "Target FPS (choose from 15fps to 120fps)"
    },
    "context_hint": {
      "type": "string",
      "title": "Context Hint",
      "default": "",
      "x-order": 9,
      "description": "Optional context hint to help with challenging videos (e.g., 'fireworks video', 'cat playing', 'machinery sounds')"
    },
    "enable_sound": {
      "type": "boolean",
      "title": "Enable Sound",
      "default": true,
      "x-order": 8,
      "description": "Enable AI-generated sound (disable for silent video)"
    },
    "enable_upscaling": {
      "type": "boolean",
      "title": "Enable Upscaling",
      "default": true,
      "x-order": 5,
      "description": "Enable video upscaling (disable for faster processing)"
    },
    "prompt_optimizer": {
      "type": "boolean",
      "title": "Prompt Optimizer",
      "default": true,
      "x-order": 4,
      "description": "Use prompt optimizer"
    },
    "first_frame_image": {
      "type": "string",
      "title": "First Frame Image",
      "x-order": 1,
      "description": "First frame image for video generation. The output video will have the same aspect ratio as this image."
    },
    "target_resolution": {
      "enum": [
        "1080p",
        "2k",
        "4k"
      ],
      "type": "string",
      "title": "target_resolution",
      "description": "Target resolution for upscaling",
      "default": "1080p",
      "x-order": 6
    }
  }
}
            
              
                
              
            
            Output schema
          
        The shape of the response you’ll get when you run this model with an API.
              Schema
            
            {
  "type": "string",
  "title": "Output",
  "format": "uri"
}
                  Example API response
                
                View prediction
              "https://replicate.delivery/xezq/0esQGkn8TRVVLqNLT9pY9zd6AfOfEk6hS5yqJ95loiXBh9DqA/tmp7hbwh_bw.mp4"