14
14
15
15
def _parse_bool(value):
    """Convert a command-line token into a real boolean.

    ``type=bool`` must not be used with argparse: it calls ``bool()`` on the
    raw string, so every non-empty value (including ``"False"`` and ``"0"``)
    becomes ``True``.  This converter interprets the usual spellings instead.

    Args:
        value: The raw option value (a string), or an actual ``bool``.

    Returns:
        ``True`` for true/t/yes/y/1/on, ``False`` for false/f/no/n/0/off
        (case-insensitive).  An empty string maps to ``False``, which is
        what ``bool("")`` returned before.

    Raises:
        argparse.ArgumentTypeError: If the value is not a recognised
            boolean spelling; argparse reports this as a usage error.
    """
    if isinstance(value, bool):
        return value
    token = value.strip().lower()
    if token in ("true", "t", "yes", "y", "1", "on"):
        return True
    if token in ("false", "f", "no", "n", "0", "off", ""):
        return False
    raise argparse.ArgumentTypeError("expected a boolean value, got %r" % (value,))


def parse_arguments():
    """Build the command-line parser for the ChatTTS HTTP client and parse argv.

    Boolean options take an explicit value (for example ``--stream true`` or
    ``--skip_refine_text false``); see ``_parse_bool`` for accepted spellings.

    Returns:
        argparse.Namespace: The parsed options.  ``text`` is a list of one or
        more strings; ``text``, ``audio_seed`` and ``text_seed`` are required.
    """
    parser = argparse.ArgumentParser(description="HTTP client for ChatTTS service")
    parser.add_argument(
        "--text", type=str, nargs="+", required=True, help="Text to synthesize"
    )
    parser.add_argument(
        "--audio_seed", type=int, required=True, help="Audio generation seed"
    )
    parser.add_argument(
        "--text_seed", type=int, required=True, help="Text generation seed"
    )
    parser.add_argument(
        "--stream", type=_parse_bool, default=False, help="Enable/disable streaming"
    )
    parser.add_argument("--lang", type=str, default=None, help="Language code for text")
    parser.add_argument(
        "--skip_refine_text",
        type=_parse_bool,
        default=True,
        help="Skip text refinement",
    )
    parser.add_argument(
        "--refine_text_only",
        type=_parse_bool,
        default=False,
        help="Only refine text",
    )
    parser.add_argument(
        "--use_decoder",
        type=_parse_bool,
        default=True,
        help="Use decoder during inference",
    )
    parser.add_argument(
        "--do_text_normalization",
        type=_parse_bool,
        default=True,
        help="Enable text normalization",
    )
    parser.add_argument(
        "--do_homophone_replacement",
        type=_parse_bool,
        default=False,
        help="Enable homophone replacement",
    )
    parser.add_argument(
        "--tgt",
        type=str,
        default="./output",
        help="Target directory to save output files",
    )
    parser.add_argument(
        "--filename",
        type=str,
        default="test.mp3",
        help="File name for the saved output",
    )

    # Refinement text parameters
    parser.add_argument(
        "--refine_prompt", type=str, default="", help="Prompt for text refinement"
    )
    parser.add_argument(
        "--refine_top_P",
        type=float,
        default=0.7,
        help="Top P value for text refinement",
    )
    parser.add_argument(
        "--refine_top_K", type=int, default=20, help="Top K value for text refinement"
    )
    parser.add_argument(
        "--refine_temperature",
        type=float,
        default=0.7,
        help="Temperature for text refinement",
    )
    parser.add_argument(
        "--refine_repetition_penalty",
        type=float,
        default=1.0,
        help="Repetition penalty for text refinement",
    )
    parser.add_argument(
        "--refine_max_new_token",
        type=int,
        default=384,
        help="Max new tokens for text refinement",
    )
    parser.add_argument(
        "--refine_min_new_token",
        type=int,
        default=0,
        help="Min new tokens for text refinement",
    )
    parser.add_argument(
        "--refine_show_tqdm",
        type=_parse_bool,
        default=True,
        help="Show progress bar for text refinement",
    )
    parser.add_argument(
        "--refine_ensure_non_empty",
        type=_parse_bool,
        default=True,
        help="Ensure non-empty output",
    )
    parser.add_argument(
        "--refine_stream_batch",
        type=int,
        default=24,
        help="Stream batch size for refinement",
    )

    # Infer code parameters
    parser.add_argument(
        "--infer_prompt", type=str, default="[speed_5]", help="Prompt for inference"
    )
    parser.add_argument(
        "--infer_top_P", type=float, default=0.1, help="Top P value for inference"
    )
    parser.add_argument(
        "--infer_top_K", type=int, default=20, help="Top K value for inference"
    )
    parser.add_argument(
        "--infer_temperature",
        type=float,
        default=0.3,
        help="Temperature for inference",
    )
    parser.add_argument(
        "--infer_repetition_penalty",
        type=float,
        default=1.05,
        help="Repetition penalty for inference",
    )
    parser.add_argument(
        "--infer_max_new_token",
        type=int,
        default=2048,
        help="Max new tokens for inference",
    )
    parser.add_argument(
        "--infer_min_new_token",
        type=int,
        default=0,
        help="Min new tokens for inference",
    )
    parser.add_argument(
        "--infer_show_tqdm",
        type=_parse_bool,
        default=True,
        help="Show progress bar for inference",
    )
    parser.add_argument(
        "--infer_ensure_non_empty",
        type=_parse_bool,
        default=True,
        help="Ensure non-empty output",
    )
    # NOTE(review): this option is boolean while --refine_stream_batch is an
    # int batch size; kept as-is for compatibility -- confirm what the
    # service expects for this field.
    parser.add_argument(
        "--infer_stream_batch",
        type=_parse_bool,
        default=True,
        help="Stream batch for inference",
    )
    parser.add_argument(
        "--infer_spk_emb",
        type=str,
        default=None,
        help="Speaker embedding for inference",
    )

    return parser.parse_args()
57
177
58
178
59
-
60
179
def main ():
61
180
args = parse_arguments ()
62
181
@@ -65,7 +184,7 @@ def main():
65
184
"text" : args .text ,
66
185
"stream" : args .stream ,
67
186
"lang" : args .lang ,
68
- "filename" :args .filename ,
187
+ "filename" : args .filename ,
69
188
"skip_refine_text" : args .skip_refine_text ,
70
189
"refine_text_only" : args .refine_text_only ,
71
190
"use_decoder" : args .use_decoder ,
0 commit comments