config.pbtxt 1.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263
  # Copyright (c) 2025, NVIDIA CORPORATION.  All rights reserved.
  #
  # Licensed under the Apache License, Version 2.0 (the "License");
  # you may not use this file except in compliance with the License.
  # You may obtain a copy of the License at
  #
  #     http://www.apache.org/licenses/LICENSE-2.0
  #
  # Unless required by applicable law or agreed to in writing, software
  # distributed under the License is distributed on an "AS IS" BASIS,
  # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  # See the License for the specific language governing permissions and
  # limitations under the License.
  # Model identity: registered under the name "token2wav" and served through
  # the "python" backend.
  name: "token2wav"
  backend: "python"

  # Upper bound on the batch size. ${triton_max_batch_size} is a placeholder,
  # not a literal value — presumably substituted by a templating step before
  # this file is loaded (TODO confirm which script fills it in).
  max_batch_size: ${triton_max_batch_size}
  # Dynamic batching settings. The only field set here is the maximum queue
  # delay, expressed in microseconds. Its value is a ${...} placeholder —
  # presumably substituted by a templating step before use (TODO confirm).
  dynamic_batching {
    max_queue_delay_microseconds: ${max_queue_delay_microseconds}
  }
  # Custom model parameters. One entry is declared: key "model_dir", whose
  # string_value is the ${model_dir} placeholder (presumably replaced with a
  # real path by a templating step — TODO confirm).
  parameters: {
    key: "model_dir"
    value: { string_value: "${model_dir}" }
  }
  # Input tensors. Each entry declares a tensor name, element type and shape.
  # A dimension of -1 is Triton's marker for a variable-size axis.
  # NOTE(review): when max_batch_size resolves to a value above 0, Triton
  # treats these dims as per-request shapes without the batch axis — confirm
  # against the value substituted for ${triton_max_batch_size}.
  input [
    {
      # INT32, one variable-length axis.
      name: "target_speech_tokens"
      data_type: TYPE_INT32
      dims: [ -1 ]
    },
    {
      # INT32, one variable-length axis.
      name: "prompt_speech_tokens"
      data_type: TYPE_INT32
      dims: [ -1 ]
    },
    {
      # FP16, two axes: variable-length first axis, second axis fixed at 80
      # (presumably the number of feature bins per frame — TODO confirm).
      name: "prompt_speech_feat"
      data_type: TYPE_FP16
      dims: [ -1, 80 ]
    },
    {
      # FP16, one variable-length axis.
      name: "prompt_spk_embedding"
      data_type: TYPE_FP16
      dims: [ -1 ]
    }
  ]
  # Output tensors. A single tensor named "waveform" is declared: FP32 with
  # one variable-length axis (-1 is Triton's marker for a variable-size axis).
  output [
    {
      name: "waveform"
      data_type: TYPE_FP32
      dims: [ -1 ]
    }
  ]
  # Instance placement: a single group requesting one instance of the model
  # with kind KIND_CPU.
  instance_group [
    {
      count: 1
      kind: KIND_CPU
    }
  ]