# config.pbtxt (1.1 KB)
  # Triton Inference Server model configuration for the "token2wav" model,
  # served through the Python backend.
  #
  # Tokens of the form ${...} are template placeholders. They are not valid
  # protobuf text on their own and must be replaced with concrete values
  # before Triton loads this file.

  name: "token2wav"
  backend: "python"

  # When this resolves to a value > 0, Triton treats the first dimension of
  # every tensor as the batch dimension and the `dims` below describe a single
  # request without it.
  max_batch_size: ${triton_max_batch_size}

  dynamic_batching {
    # Upper bound on how long a request may wait in the queue for batch-mates.
    max_queue_delay_microseconds: ${max_queue_delay_microseconds}
    # 100 priority levels are enabled; a request that does not specify one is
    # assigned level 100. In Triton level 1 is the highest priority, so
    # unprioritized requests run at the lowest priority.
    priority_levels: 100
    default_priority_level: 100
  }

  # Free-form key/value settings passed through to the backend.
  parameters [
    {
      key: "model_dir"
      value: { string_value: "${model_dir}" }
    }
  ]

  # Only "target_speech_tokens" is mandatory; every other input is marked
  # `optional: true` and may be omitted from a request.
  input [
    {
      name: "target_speech_tokens"
      data_type: TYPE_INT32
      dims: [ -1 ]
    },
    {
      name: "prompt_speech_tokens"
      data_type: TYPE_INT32
      dims: [ -1 ]
      optional: true
    },
    {
      # Variable-length sequence of 80-wide vectors.
      # NOTE(review): 80 presumably is the mel-bin count (it matches the first
      # dim of the "mel" output) - confirm against the model code.
      name: "prompt_speech_feat"
      data_type: TYPE_FP16
      dims: [ -1, 80 ]
      optional: true
    },
    {
      name: "prompt_spk_embedding"
      data_type: TYPE_FP16
      dims: [ -1 ]
      optional: true
    },
    {
      # Clients send shape [1] per request; the empty reshape strips that
      # dimension so the backend receives one scalar per batch entry.
      name: "token_offset"
      data_type: TYPE_INT32
      dims: [ 1 ]
      reshape: { shape: [ ] }
      optional: true
    },
    {
      # Same [1] -> scalar reshape as "token_offset".
      name: "finalize"
      data_type: TYPE_BOOL
      dims: [ 1 ]
      reshape: { shape: [ ] }
      optional: true
    }
  ]

  output [
    {
      # 80 rows by a variable number of columns.
      name: "mel"
      data_type: TYPE_FP32
      dims: [ 80, -1 ]
    }
  ]

  # A single model instance, pinned to GPU 0.
  instance_group [
    {
      count: 1
      kind: KIND_GPU
      gpus: [ 0 ]
    }
  ]