archcollege/voice | API reference

Public

49 runs

Run archcollege/voice with an API

Use one of our client libraries to get started quickly. Clicking on a library will take you to the Playground tab where you can tweak different inputs, see the results, and copy the corresponding code to use in your own project.

Input schema

The fields you can use to run this model with an API. If you don't give a value for a field, its default value will be used.

Field	Type	Default value	Description
train_audio	string		请输入要训练的声音文件.建议10-20分钟
total_epoch	integer	20	总训练轮数
if_f0_3	boolean	False	模型是否带音高指导(唱歌一定要, 语音可以不要)
f0method8	string	harvest	选择音高提取算法:输入歌声可用pm提速,高质量语音但CPU差可用dio提速,harvest质量更好但慢,rmvpe效果最好且微吃CPU/GPU
if_cache_gpu17	boolean	False	是否缓存所有训练集至显存. 10min以下小数据可缓存以加速训练, 大数据缓存会炸显存也加不了多少速
audio_pth	string		(推理音频用)请输入训练好的声音模型
audio	string		(推理音频用)请输入需要合成的声音源文件

{
  "type": "object",
  "title": "Input",
  "properties": {
    "audio": {
      "type": "string",
      "title": "Audio",
      "format": "uri",
      "x-order": 6,
      "description": "(\u63a8\u7406\u97f3\u9891\u7528)\u8bf7\u8f93\u5165\u9700\u8981\u5408\u6210\u7684\u58f0\u97f3\u6e90\u6587\u4ef6"
    },
    "if_f0_3": {
      "type": "boolean",
      "title": "If F0 3",
      "default": false,
      "x-order": 2,
      "description": "\u6a21\u578b\u662f\u5426\u5e26\u97f3\u9ad8\u6307\u5bfc(\u5531\u6b4c\u4e00\u5b9a\u8981, \u8bed\u97f3\u53ef\u4ee5\u4e0d\u8981)"
    },
    "audio_pth": {
      "type": "string",
      "title": "Audio Pth",
      "format": "uri",
      "x-order": 5,
      "description": "(\u63a8\u7406\u97f3\u9891\u7528)\u8bf7\u8f93\u5165\u8bad\u7ec3\u597d\u7684\u58f0\u97f3\u6a21\u578b"
    },
    "f0method8": {
      "enum": [
        "pm",
        "harvest",
        "dio",
        "rmvpe",
        "rmvpe_gpu"
      ],
      "type": "string",
      "title": "f0method8",
      "description": "\u9009\u62e9\u97f3\u9ad8\u63d0\u53d6\u7b97\u6cd5:\u8f93\u5165\u6b4c\u58f0\u53ef\u7528pm\u63d0\u901f,\u9ad8\u8d28\u91cf\u8bed\u97f3\u4f46CPU\u5dee\u53ef\u7528dio\u63d0\u901f,harvest\u8d28\u91cf\u66f4\u597d\u4f46\u6162,rmvpe\u6548\u679c\u6700\u597d\u4e14\u5fae\u5403CPU/GPU",
      "default": "harvest",
      "x-order": 3
    },
    "total_epoch": {
      "type": "integer",
      "title": "Total Epoch",
      "default": 20,
      "x-order": 1,
      "description": "\u603b\u8bad\u7ec3\u8f6e\u6570"
    },
    "train_audio": {
      "type": "string",
      "title": "Train Audio",
      "format": "uri",
      "x-order": 0,
      "description": "\u8bf7\u8f93\u5165\u8981\u8bad\u7ec3\u7684\u58f0\u97f3\u6587\u4ef6.\u5efa\u8bae10-20\u5206\u949f"
    },
    "if_cache_gpu17": {
      "type": "boolean",
      "title": "If Cache Gpu17",
      "default": false,
      "x-order": 4,
      "description": "\u662f\u5426\u7f13\u5b58\u6240\u6709\u8bad\u7ec3\u96c6\u81f3\u663e\u5b58. 10min\u4ee5\u4e0b\u5c0f\u6570\u636e\u53ef\u7f13\u5b58\u4ee5\u52a0\u901f\u8bad\u7ec3, \u5927\u6570\u636e\u7f13\u5b58\u4f1a\u70b8\u663e\u5b58\u4e5f\u52a0\u4e0d\u4e86\u591a\u5c11\u901f"
    }
  }
}

Output schema

The shape of the response you’ll get when you run this model with an API.

Schema

{
  "type": "string",
  "title": "Output",
  "format": "uri"
}