Aditya02 commited on
Commit
91fc676
·
verified ·
1 Parent(s): 1eaa937

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +73 -35
  2. LICENSE +395 -0
  3. NumberToText.py +96 -0
  4. README.md +115 -0
  5. api.py +63 -0
  6. app.py +179 -0
  7. assamese_latest/female/model/config.yaml +319 -0
  8. assamese_latest/female/model/energy_stats.npz +3 -0
  9. assamese_latest/female/model/feats_stats.npz +3 -0
  10. assamese_latest/female/model/model.pth +3 -0
  11. assamese_latest/female/model/pitch_stats.npz +3 -0
  12. assamese_latest/male/model/config.yaml +315 -0
  13. assamese_latest/male/model/energy_stats.npz +3 -0
  14. assamese_latest/male/model/feats_stats.npz +3 -0
  15. assamese_latest/male/model/feats_type +1 -0
  16. assamese_latest/male/model/model.pth +3 -0
  17. assamese_latest/male/model/pitch_stats.npz +3 -0
  18. bengali_latest/male/model/config.yaml +315 -0
  19. bengali_latest/male/model/energy_stats.npz +3 -0
  20. bengali_latest/male/model/feats_stats.npz +3 -0
  21. bengali_latest/male/model/model.pth +3 -0
  22. bengali_latest/male/model/pitch_stats.npz +3 -0
  23. bodo_latest/female/model/config.yaml +319 -0
  24. bodo_latest/female/model/energy_stats.npz +3 -0
  25. bodo_latest/female/model/feats_stats.npz +3 -0
  26. bodo_latest/female/model/feats_type +1 -0
  27. bodo_latest/female/model/model.pth +3 -0
  28. bodo_latest/female/model/pitch_stats.npz +3 -0
  29. bodo_latest/male/model/config.yaml +319 -0
  30. bodo_latest/male/model/energy_stats.npz +3 -0
  31. bodo_latest/male/model/feats_stats.npz +3 -0
  32. bodo_latest/male/model/feats_type +1 -0
  33. bodo_latest/male/model/model.pth +3 -0
  34. bodo_latest/male/model/pitch_stats.npz +3 -0
  35. charmap/Text_Cleaning.ipynb +332 -0
  36. charmap/Text_Cleaning.py +76 -0
  37. charmap/charmap_Bengali.txt +62 -0
  38. charmap/charmap_Hindi.txt +81 -0
  39. charmap/charmap_Hindi.xlsx +0 -0
  40. charmap/charmap_Malayalam.txt +81 -0
  41. charmap/charmap_Malayalam.xlsx +0 -0
  42. charmap/charmap_Marathi.txt +81 -0
  43. charmap/charmap_Marathi.xlsx +0 -0
  44. charmap/charmap_Tamil.disabled +76 -0
  45. charmap/charmap_Tamil.xlsx +0 -0
  46. charmap/charmap_Telugu.txt +81 -0
  47. charmap/charmap_Telugu.xlsx +0 -0
  48. dogri_latest/female/model/config.yaml +320 -0
  49. dogri_latest/female/model/energy_stats.npz +3 -0
  50. dogri_latest/female/model/feats_stats.npz +3 -0
.gitattributes CHANGED
@@ -1,35 +1,73 @@
1
- *.7z filter=lfs diff=lfs merge=lfs -text
2
- *.arrow filter=lfs diff=lfs merge=lfs -text
3
- *.bin filter=lfs diff=lfs merge=lfs -text
4
- *.bz2 filter=lfs diff=lfs merge=lfs -text
5
- *.ckpt filter=lfs diff=lfs merge=lfs -text
6
- *.ftz filter=lfs diff=lfs merge=lfs -text
7
- *.gz filter=lfs diff=lfs merge=lfs -text
8
- *.h5 filter=lfs diff=lfs merge=lfs -text
9
- *.joblib filter=lfs diff=lfs merge=lfs -text
10
- *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
- *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
- *.model filter=lfs diff=lfs merge=lfs -text
13
- *.msgpack filter=lfs diff=lfs merge=lfs -text
14
- *.npy filter=lfs diff=lfs merge=lfs -text
15
- *.npz filter=lfs diff=lfs merge=lfs -text
16
- *.onnx filter=lfs diff=lfs merge=lfs -text
17
- *.ot filter=lfs diff=lfs merge=lfs -text
18
- *.parquet filter=lfs diff=lfs merge=lfs -text
19
- *.pb filter=lfs diff=lfs merge=lfs -text
20
- *.pickle filter=lfs diff=lfs merge=lfs -text
21
- *.pkl filter=lfs diff=lfs merge=lfs -text
22
- *.pt filter=lfs diff=lfs merge=lfs -text
23
- *.pth filter=lfs diff=lfs merge=lfs -text
24
- *.rar filter=lfs diff=lfs merge=lfs -text
25
- *.safetensors filter=lfs diff=lfs merge=lfs -text
26
- saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
- *.tar.* filter=lfs diff=lfs merge=lfs -text
28
- *.tar filter=lfs diff=lfs merge=lfs -text
29
- *.tflite filter=lfs diff=lfs merge=lfs -text
30
- *.tgz filter=lfs diff=lfs merge=lfs -text
31
- *.wasm filter=lfs diff=lfs merge=lfs -text
32
- *.xz filter=lfs diff=lfs merge=lfs -text
33
- *.zip filter=lfs diff=lfs merge=lfs -text
34
- *.zst filter=lfs diff=lfs merge=lfs -text
35
- *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ license.pdf filter=lfs diff=lfs merge=lfs -text
37
+ vocoder/female/assamese_latest/generator filter=lfs diff=lfs merge=lfs -text
38
+ vocoder/female/bengali_latest/generator filter=lfs diff=lfs merge=lfs -text
39
+ vocoder/female/bodo_latest/generator filter=lfs diff=lfs merge=lfs -text
40
+ vocoder/female/dogri_latest/generator filter=lfs diff=lfs merge=lfs -text
41
+ vocoder/female/gujarati_latest/generator filter=lfs diff=lfs merge=lfs -text
42
+ vocoder/female/hindi_latest/generator filter=lfs diff=lfs merge=lfs -text
43
+ vocoder/female/kannada_latest/generator filter=lfs diff=lfs merge=lfs -text
44
+ vocoder/female/konkani_latest/generator filter=lfs diff=lfs merge=lfs -text
45
+ vocoder/female/maithili_latest/generator filter=lfs diff=lfs merge=lfs -text
46
+ vocoder/female/malayalam_latest/generator filter=lfs diff=lfs merge=lfs -text
47
+ vocoder/female/manipuri_latest/generator filter=lfs diff=lfs merge=lfs -text
48
+ vocoder/female/nepali_latest/generator filter=lfs diff=lfs merge=lfs -text
49
+ vocoder/female/punjabi_latest/generator filter=lfs diff=lfs merge=lfs -text
50
+ vocoder/female/rajasthani_latest/generator filter=lfs diff=lfs merge=lfs -text
51
+ vocoder/female/sanskrit_latest/generator filter=lfs diff=lfs merge=lfs -text
52
+ vocoder/female/sindhi_latest/generator filter=lfs diff=lfs merge=lfs -text
53
+ vocoder/female/tamil_latest/generator filter=lfs diff=lfs merge=lfs -text
54
+ vocoder/female/telugu_latest/generator filter=lfs diff=lfs merge=lfs -text
55
+ vocoder/male/assamese_latest/generator filter=lfs diff=lfs merge=lfs -text
56
+ vocoder/male/bengali_latest/generator filter=lfs diff=lfs merge=lfs -text
57
+ vocoder/male/bodo_latest/generator filter=lfs diff=lfs merge=lfs -text
58
+ vocoder/male/dogri_latest/generator filter=lfs diff=lfs merge=lfs -text
59
+ vocoder/male/gujarati_latest/generator filter=lfs diff=lfs merge=lfs -text
60
+ vocoder/male/hindi_latest/generator filter=lfs diff=lfs merge=lfs -text
61
+ vocoder/male/kannada_latest/generator filter=lfs diff=lfs merge=lfs -text
62
+ vocoder/male/konkani_latest/generator filter=lfs diff=lfs merge=lfs -text
63
+ vocoder/male/maithili_latest/generator filter=lfs diff=lfs merge=lfs -text
64
+ vocoder/male/malayalam_latest/generator filter=lfs diff=lfs merge=lfs -text
65
+ vocoder/male/manipuri_latest/generator filter=lfs diff=lfs merge=lfs -text
66
+ vocoder/male/nepali_latest/generator filter=lfs diff=lfs merge=lfs -text
67
+ vocoder/male/punjabi_latest/generator filter=lfs diff=lfs merge=lfs -text
68
+ vocoder/male/rajasthani_latest/generator filter=lfs diff=lfs merge=lfs -text
69
+ vocoder/male/sanskrit_latest/generator filter=lfs diff=lfs merge=lfs -text
70
+ vocoder/male/sindhi_latest/generator filter=lfs diff=lfs merge=lfs -text
71
+ vocoder/male/tamil_latest/generator filter=lfs diff=lfs merge=lfs -text
72
+ vocoder/male/telugu_latest/generator filter=lfs diff=lfs merge=lfs -text
73
+ ssn_parser_new/scripts/tamil_trans_py filter=lfs diff=lfs merge=lfs -text
LICENSE ADDED
@@ -0,0 +1,395 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Attribution 4.0 International
2
+
3
+ =======================================================================
4
+
5
+ Creative Commons Corporation ("Creative Commons") is not a law firm and
6
+ does not provide legal services or legal advice. Distribution of
7
+ Creative Commons public licenses does not create a lawyer-client or
8
+ other relationship. Creative Commons makes its licenses and related
9
+ information available on an "as-is" basis. Creative Commons gives no
10
+ warranties regarding its licenses, any material licensed under their
11
+ terms and conditions, or any related information. Creative Commons
12
+ disclaims all liability for damages resulting from their use to the
13
+ fullest extent possible.
14
+
15
+ Using Creative Commons Public Licenses
16
+
17
+ Creative Commons public licenses provide a standard set of terms and
18
+ conditions that creators and other rights holders may use to share
19
+ original works of authorship and other material subject to copyright
20
+ and certain other rights specified in the public license below. The
21
+ following considerations are for informational purposes only, are not
22
+ exhaustive, and do not form part of our licenses.
23
+
24
+ Considerations for licensors: Our public licenses are
25
+ intended for use by those authorized to give the public
26
+ permission to use material in ways otherwise restricted by
27
+ copyright and certain other rights. Our licenses are
28
+ irrevocable. Licensors should read and understand the terms
29
+ and conditions of the license they choose before applying it.
30
+ Licensors should also secure all rights necessary before
31
+ applying our licenses so that the public can reuse the
32
+ material as expected. Licensors should clearly mark any
33
+ material not subject to the license. This includes other CC-
34
+ licensed material, or material used under an exception or
35
+ limitation to copyright. More considerations for licensors:
36
+ wiki.creativecommons.org/Considerations_for_licensors
37
+
38
+ Considerations for the public: By using one of our public
39
+ licenses, a licensor grants the public permission to use the
40
+ licensed material under specified terms and conditions. If
41
+ the licensor's permission is not necessary for any reason--for
42
+ example, because of any applicable exception or limitation to
43
+ copyright--then that use is not regulated by the license. Our
44
+ licenses grant only permissions under copyright and certain
45
+ other rights that a licensor has authority to grant. Use of
46
+ the licensed material may still be restricted for other
47
+ reasons, including because others have copyright or other
48
+ rights in the material. A licensor may make special requests,
49
+ such as asking that all changes be marked or described.
50
+ Although not required by our licenses, you are encouraged to
51
+ respect those requests where reasonable. More_considerations
52
+ for the public:
53
+ wiki.creativecommons.org/Considerations_for_licensees
54
+
55
+ =======================================================================
56
+
57
+ Creative Commons Attribution 4.0 International Public License
58
+
59
+ By exercising the Licensed Rights (defined below), You accept and agree
60
+ to be bound by the terms and conditions of this Creative Commons
61
+ Attribution 4.0 International Public License ("Public License"). To the
62
+ extent this Public License may be interpreted as a contract, You are
63
+ granted the Licensed Rights in consideration of Your acceptance of
64
+ these terms and conditions, and the Licensor grants You such rights in
65
+ consideration of benefits the Licensor receives from making the
66
+ Licensed Material available under these terms and conditions.
67
+
68
+
69
+ Section 1 -- Definitions.
70
+
71
+ a. Adapted Material means material subject to Copyright and Similar
72
+ Rights that is derived from or based upon the Licensed Material
73
+ and in which the Licensed Material is translated, altered,
74
+ arranged, transformed, or otherwise modified in a manner requiring
75
+ permission under the Copyright and Similar Rights held by the
76
+ Licensor. For purposes of this Public License, where the Licensed
77
+ Material is a musical work, performance, or sound recording,
78
+ Adapted Material is always produced where the Licensed Material is
79
+ synched in timed relation with a moving image.
80
+
81
+ b. Adapter's License means the license You apply to Your Copyright
82
+ and Similar Rights in Your contributions to Adapted Material in
83
+ accordance with the terms and conditions of this Public License.
84
+
85
+ c. Copyright and Similar Rights means copyright and/or similar rights
86
+ closely related to copyright including, without limitation,
87
+ performance, broadcast, sound recording, and Sui Generis Database
88
+ Rights, without regard to how the rights are labeled or
89
+ categorized. For purposes of this Public License, the rights
90
+ specified in Section 2(b)(1)-(2) are not Copyright and Similar
91
+ Rights.
92
+
93
+ d. Effective Technological Measures means those measures that, in the
94
+ absence of proper authority, may not be circumvented under laws
95
+ fulfilling obligations under Article 11 of the WIPO Copyright
96
+ Treaty adopted on December 20, 1996, and/or similar international
97
+ agreements.
98
+
99
+ e. Exceptions and Limitations means fair use, fair dealing, and/or
100
+ any other exception or limitation to Copyright and Similar Rights
101
+ that applies to Your use of the Licensed Material.
102
+
103
+ f. Licensed Material means the artistic or literary work, database,
104
+ or other material to which the Licensor applied this Public
105
+ License.
106
+
107
+ g. Licensed Rights means the rights granted to You subject to the
108
+ terms and conditions of this Public License, which are limited to
109
+ all Copyright and Similar Rights that apply to Your use of the
110
+ Licensed Material and that the Licensor has authority to license.
111
+
112
+ h. Licensor means the individual(s) or entity(ies) granting rights
113
+ under this Public License.
114
+
115
+ i. Share means to provide material to the public by any means or
116
+ process that requires permission under the Licensed Rights, such
117
+ as reproduction, public display, public performance, distribution,
118
+ dissemination, communication, or importation, and to make material
119
+ available to the public including in ways that members of the
120
+ public may access the material from a place and at a time
121
+ individually chosen by them.
122
+
123
+ j. Sui Generis Database Rights means rights other than copyright
124
+ resulting from Directive 96/9/EC of the European Parliament and of
125
+ the Council of 11 March 1996 on the legal protection of databases,
126
+ as amended and/or succeeded, as well as other essentially
127
+ equivalent rights anywhere in the world.
128
+
129
+ k. You means the individual or entity exercising the Licensed Rights
130
+ under this Public License. Your has a corresponding meaning.
131
+
132
+
133
+ Section 2 -- Scope.
134
+
135
+ a. License grant.
136
+
137
+ 1. Subject to the terms and conditions of this Public License,
138
+ the Licensor hereby grants You a worldwide, royalty-free,
139
+ non-sublicensable, non-exclusive, irrevocable license to
140
+ exercise the Licensed Rights in the Licensed Material to:
141
+
142
+ a. reproduce and Share the Licensed Material, in whole or
143
+ in part; and
144
+
145
+ b. produce, reproduce, and Share Adapted Material.
146
+
147
+ 2. Exceptions and Limitations. For the avoidance of doubt, where
148
+ Exceptions and Limitations apply to Your use, this Public
149
+ License does not apply, and You do not need to comply with
150
+ its terms and conditions.
151
+
152
+ 3. Term. The term of this Public License is specified in Section
153
+ 6(a).
154
+
155
+ 4. Media and formats; technical modifications allowed. The
156
+ Licensor authorizes You to exercise the Licensed Rights in
157
+ all media and formats whether now known or hereafter created,
158
+ and to make technical modifications necessary to do so. The
159
+ Licensor waives and/or agrees not to assert any right or
160
+ authority to forbid You from making technical modifications
161
+ necessary to exercise the Licensed Rights, including
162
+ technical modifications necessary to circumvent Effective
163
+ Technological Measures. For purposes of this Public License,
164
+ simply making modifications authorized by this Section 2(a)
165
+ (4) never produces Adapted Material.
166
+
167
+ 5. Downstream recipients.
168
+
169
+ a. Offer from the Licensor -- Licensed Material. Every
170
+ recipient of the Licensed Material automatically
171
+ receives an offer from the Licensor to exercise the
172
+ Licensed Rights under the terms and conditions of this
173
+ Public License.
174
+
175
+ b. No downstream restrictions. You may not offer or impose
176
+ any additional or different terms or conditions on, or
177
+ apply any Effective Technological Measures to, the
178
+ Licensed Material if doing so restricts exercise of the
179
+ Licensed Rights by any recipient of the Licensed
180
+ Material.
181
+
182
+ 6. No endorsement. Nothing in this Public License constitutes or
183
+ may be construed as permission to assert or imply that You
184
+ are, or that Your use of the Licensed Material is, connected
185
+ with, or sponsored, endorsed, or granted official status by,
186
+ the Licensor or others designated to receive attribution as
187
+ provided in Section 3(a)(1)(A)(i).
188
+
189
+ b. Other rights.
190
+
191
+ 1. Moral rights, such as the right of integrity, are not
192
+ licensed under this Public License, nor are publicity,
193
+ privacy, and/or other similar personality rights; however, to
194
+ the extent possible, the Licensor waives and/or agrees not to
195
+ assert any such rights held by the Licensor to the limited
196
+ extent necessary to allow You to exercise the Licensed
197
+ Rights, but not otherwise.
198
+
199
+ 2. Patent and trademark rights are not licensed under this
200
+ Public License.
201
+
202
+ 3. To the extent possible, the Licensor waives any right to
203
+ collect royalties from You for the exercise of the Licensed
204
+ Rights, whether directly or through a collecting society
205
+ under any voluntary or waivable statutory or compulsory
206
+ licensing scheme. In all other cases the Licensor expressly
207
+ reserves any right to collect such royalties.
208
+
209
+
210
+ Section 3 -- License Conditions.
211
+
212
+ Your exercise of the Licensed Rights is expressly made subject to the
213
+ following conditions.
214
+
215
+ a. Attribution.
216
+
217
+ 1. If You Share the Licensed Material (including in modified
218
+ form), You must:
219
+
220
+ a. retain the following if it is supplied by the Licensor
221
+ with the Licensed Material:
222
+
223
+ i. identification of the creator(s) of the Licensed
224
+ Material and any others designated to receive
225
+ attribution, in any reasonable manner requested by
226
+ the Licensor (including by pseudonym if
227
+ designated);
228
+
229
+ ii. a copyright notice;
230
+
231
+ iii. a notice that refers to this Public License;
232
+
233
+ iv. a notice that refers to the disclaimer of
234
+ warranties;
235
+
236
+ v. a URI or hyperlink to the Licensed Material to the
237
+ extent reasonably practicable;
238
+
239
+ b. indicate if You modified the Licensed Material and
240
+ retain an indication of any previous modifications; and
241
+
242
+ c. indicate the Licensed Material is licensed under this
243
+ Public License, and include the text of, or the URI or
244
+ hyperlink to, this Public License.
245
+
246
+ 2. You may satisfy the conditions in Section 3(a)(1) in any
247
+ reasonable manner based on the medium, means, and context in
248
+ which You Share the Licensed Material. For example, it may be
249
+ reasonable to satisfy the conditions by providing a URI or
250
+ hyperlink to a resource that includes the required
251
+ information.
252
+
253
+ 3. If requested by the Licensor, You must remove any of the
254
+ information required by Section 3(a)(1)(A) to the extent
255
+ reasonably practicable.
256
+
257
+ 4. If You Share Adapted Material You produce, the Adapter's
258
+ License You apply must not prevent recipients of the Adapted
259
+ Material from complying with this Public License.
260
+
261
+
262
+ Section 4 -- Sui Generis Database Rights.
263
+
264
+ Where the Licensed Rights include Sui Generis Database Rights that
265
+ apply to Your use of the Licensed Material:
266
+
267
+ a. for the avoidance of doubt, Section 2(a)(1) grants You the right
268
+ to extract, reuse, reproduce, and Share all or a substantial
269
+ portion of the contents of the database;
270
+
271
+ b. if You include all or a substantial portion of the database
272
+ contents in a database in which You have Sui Generis Database
273
+ Rights, then the database in which You have Sui Generis Database
274
+ Rights (but not its individual contents) is Adapted Material; and
275
+
276
+ c. You must comply with the conditions in Section 3(a) if You Share
277
+ all or a substantial portion of the contents of the database.
278
+
279
+ For the avoidance of doubt, this Section 4 supplements and does not
280
+ replace Your obligations under this Public License where the Licensed
281
+ Rights include other Copyright and Similar Rights.
282
+
283
+
284
+ Section 5 -- Disclaimer of Warranties and Limitation of Liability.
285
+
286
+ a. UNLESS OTHERWISE SEPARATELY UNDERTAKEN BY THE LICENSOR, TO THE
287
+ EXTENT POSSIBLE, THE LICENSOR OFFERS THE LICENSED MATERIAL AS-IS
288
+ AND AS-AVAILABLE, AND MAKES NO REPRESENTATIONS OR WARRANTIES OF
289
+ ANY KIND CONCERNING THE LICENSED MATERIAL, WHETHER EXPRESS,
290
+ IMPLIED, STATUTORY, OR OTHER. THIS INCLUDES, WITHOUT LIMITATION,
291
+ WARRANTIES OF TITLE, MERCHANTABILITY, FITNESS FOR A PARTICULAR
292
+ PURPOSE, NON-INFRINGEMENT, ABSENCE OF LATENT OR OTHER DEFECTS,
293
+ ACCURACY, OR THE PRESENCE OR ABSENCE OF ERRORS, WHETHER OR NOT
294
+ KNOWN OR DISCOVERABLE. WHERE DISCLAIMERS OF WARRANTIES ARE NOT
295
+ ALLOWED IN FULL OR IN PART, THIS DISCLAIMER MAY NOT APPLY TO YOU.
296
+
297
+ b. TO THE EXTENT POSSIBLE, IN NO EVENT WILL THE LICENSOR BE LIABLE
298
+ TO YOU ON ANY LEGAL THEORY (INCLUDING, WITHOUT LIMITATION,
299
+ NEGLIGENCE) OR OTHERWISE FOR ANY DIRECT, SPECIAL, INDIRECT,
300
+ INCIDENTAL, CONSEQUENTIAL, PUNITIVE, EXEMPLARY, OR OTHER LOSSES,
301
+ COSTS, EXPENSES, OR DAMAGES ARISING OUT OF THIS PUBLIC LICENSE OR
302
+ USE OF THE LICENSED MATERIAL, EVEN IF THE LICENSOR HAS BEEN
303
+ ADVISED OF THE POSSIBILITY OF SUCH LOSSES, COSTS, EXPENSES, OR
304
+ DAMAGES. WHERE A LIMITATION OF LIABILITY IS NOT ALLOWED IN FULL OR
305
+ IN PART, THIS LIMITATION MAY NOT APPLY TO YOU.
306
+
307
+ c. The disclaimer of warranties and limitation of liability provided
308
+ above shall be interpreted in a manner that, to the extent
309
+ possible, most closely approximates an absolute disclaimer and
310
+ waiver of all liability.
311
+
312
+
313
+ Section 6 -- Term and Termination.
314
+
315
+ a. This Public License applies for the term of the Copyright and
316
+ Similar Rights licensed here. However, if You fail to comply with
317
+ this Public License, then Your rights under this Public License
318
+ terminate automatically.
319
+
320
+ b. Where Your right to use the Licensed Material has terminated under
321
+ Section 6(a), it reinstates:
322
+
323
+ 1. automatically as of the date the violation is cured, provided
324
+ it is cured within 30 days of Your discovery of the
325
+ violation; or
326
+
327
+ 2. upon express reinstatement by the Licensor.
328
+
329
+ For the avoidance of doubt, this Section 6(b) does not affect any
330
+ right the Licensor may have to seek remedies for Your violations
331
+ of this Public License.
332
+
333
+ c. For the avoidance of doubt, the Licensor may also offer the
334
+ Licensed Material under separate terms or conditions or stop
335
+ distributing the Licensed Material at any time; however, doing so
336
+ will not terminate this Public License.
337
+
338
+ d. Sections 1, 5, 6, 7, and 8 survive termination of this Public
339
+ License.
340
+
341
+
342
+ Section 7 -- Other Terms and Conditions.
343
+
344
+ a. The Licensor shall not be bound by any additional or different
345
+ terms or conditions communicated by You unless expressly agreed.
346
+
347
+ b. Any arrangements, understandings, or agreements regarding the
348
+ Licensed Material not stated herein are separate from and
349
+ independent of the terms and conditions of this Public License.
350
+
351
+
352
+ Section 8 -- Interpretation.
353
+
354
+ a. For the avoidance of doubt, this Public License does not, and
355
+ shall not be interpreted to, reduce, limit, restrict, or impose
356
+ conditions on any use of the Licensed Material that could lawfully
357
+ be made without permission under this Public License.
358
+
359
+ b. To the extent possible, if any provision of this Public License is
360
+ deemed unenforceable, it shall be automatically reformed to the
361
+ minimum extent necessary to make it enforceable. If the provision
362
+ cannot be reformed, it shall be severed from this Public License
363
+ without affecting the enforceability of the remaining terms and
364
+ conditions.
365
+
366
+ c. No term or condition of this Public License will be waived and no
367
+ failure to comply consented to unless expressly agreed to by the
368
+ Licensor.
369
+
370
+ d. Nothing in this Public License constitutes or may be interpreted
371
+ as a limitation upon, or waiver of, any privileges and immunities
372
+ that apply to the Licensor or You, including from the legal
373
+ processes of any jurisdiction or authority.
374
+
375
+
376
+ =======================================================================
377
+
378
+ Creative Commons is not a party to its public
379
+ licenses. Notwithstanding, Creative Commons may elect to apply one of
380
+ its public licenses to material it publishes and in those instances
381
+ will be considered the “Licensor.” The text of the Creative Commons
382
+ public licenses is dedicated to the public domain under the CC0 Public
383
+ Domain Dedication. Except for the limited purpose of indicating that
384
+ material is shared under a Creative Commons public license or as
385
+ otherwise permitted by the Creative Commons policies published at
386
+ creativecommons.org/policies, Creative Commons does not authorize the
387
+ use of the trademark "Creative Commons" or any other trademark or logo
388
+ of Creative Commons without its prior written consent including,
389
+ without limitation, in connection with any unauthorized modifications
390
+ to any of its public licenses or any other arrangements,
391
+ understandings, or agreements concerning use of licensed material. For
392
+ the avoidance of doubt, this paragraph does not form part of the
393
+ public licenses.
394
+
395
+ Creative Commons may be contacted at creativecommons.org.
NumberToText.py ADDED
@@ -0,0 +1,96 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ import csv
3
+
4
class NumberDictionary:
    """Spell out numbers as words using per-language CSV lookup tables.

    Every ``<language>.csv`` file in the dictionary directory is read as
    two-column rows ``key,spoken form``. Keys are looked up as decimal
    strings (``"0"``, ``"17"``, ``"100"``, ``"1000"`` ...) plus ``"."`` for
    the word spoken at the decimal point. The loaded tables are stored in
    ``self.lang_num_dictionary`` as ``{language: {key: spoken form}}``.
    """

    def __init__(self, directory_path="numToText"):
        """Load every language table found in *directory_path*.

        Args:
            directory_path: Folder holding the ``<language>.csv`` files.
                Defaults to ``"numToText"`` relative to the working directory.

        Raises:
            OSError: If the folder cannot be listed (propagated from
                ``os.listdir``).
        """
        languages = self.get_filenames_in_folder(directory_path)
        self.lang_num_dictionary = self.load_language_dictionary(directory_path, languages)

    def get_filenames_in_folder(self, folder_path):
        """Return the extension-less names of the ``.csv`` files in *folder_path*.

        Sub-directories and files with any other extension are ignored, so a
        stray ``README`` or ``notes.txt`` no longer yields a truncated name.
        """
        file_list = []
        for filename in os.listdir(folder_path):
            stem, extension = os.path.splitext(filename)
            if extension != ".csv":
                continue
            if os.path.isfile(os.path.join(folder_path, filename)):
                file_list.append(stem)
        return file_list

    def load_language_dictionary(self, directory_path, file_names):
        """Read ``<name>.csv`` for each entry of *file_names* into a mapping.

        Args:
            directory_path: Folder containing the CSV files.
            file_names: File names without the ``.csv`` extension.

        Returns:
            ``{language: {key: spoken form}}``. Names whose file does not
            exist are skipped, as are rows with fewer than two columns.
        """
        lang_num_dictionary = {}

        for file_name in file_names:
            # Kept from the original: the language key is the name with any
            # remaining extension-like suffix removed.
            language = os.path.splitext(file_name)[0]
            file_path = os.path.join(directory_path, f"{file_name}.csv")
            if not os.path.exists(file_path):
                continue

            # ``utf-8-sig`` drops a leading BOM that would otherwise become
            # part of the first key; ``newline=''`` is what the csv module
            # expects from the file object it reads.
            with open(file_path, 'r', encoding='utf-8-sig', newline='') as file:
                language_map = {
                    row[0].strip(): row[1].strip()
                    for row in csv.reader(file)
                    if len(row) >= 2
                }

            lang_num_dictionary[language] = language_map

        return lang_num_dictionary

    def num2text(self, input_str, language):
        """Convert a numeric string into its spoken form in *language*.

        Args:
            input_str: Text such as ``"2000048.145"``. The part before the
                first ``.`` is read as an integer; the digits after it are
                spoken one by one. Any text after a second ``.`` is ignored.
            language: Key of a loaded table in ``self.lang_num_dictionary``.

        Returns:
            The spoken form, or one of the fixed messages
            ``"Language not supported."``,
            ``"Invalid input. Please provide a valid number."`` or
            ``"Number out of range (0-999999999999999)"``.
        """
        if language not in self.lang_num_dictionary:
            return "Language not supported."

        integer_part, *decimal_part = input_str.split('.')
        try:
            int_part = int(integer_part)
        except ValueError:
            return "Invalid input. Please provide a valid number."

        if int_part < 0 or int_part > 999999999999999:
            return "Number out of range (0-999999999999999)"

        lang_map = self.lang_num_dictionary[language]
        words = [self.convert_to_indian_number(int_part, lang_map)]

        # A bare trailing dot ("12.") carries no fractional digits, so the
        # decimal-point word must not be spoken for it.
        fraction = decimal_part[0].strip() if decimal_part else ''
        if fraction:
            words.append(lang_map.get('.', ''))
            words.extend(lang_map.get(digit, '') for digit in fraction)

        return ' '.join(word for word in words if word).strip()

    def convert_to_indian_number(self, n, lang_map):
        """Return the words for the non-negative integer *n* using *lang_map*.

        Numbers up to 100 are taken directly from the table when present.
        Larger numbers are split around the largest multiplier key of the
        table (``"100"``, ``"1000"``, ``"100000"`` ...) that does not exceed
        *n*, and both parts are converted recursively. Missing words are
        rendered as empty strings.
        """
        key = str(n)
        if n <= 20 or (n <= 100 and key in lang_map):
            return lang_map.get(key, '')

        if n < 100:
            # No dedicated entry for this number: compose it from the tens
            # and units words. The original code re-entered itself with the
            # same value here and never terminated.
            tens = lang_map.get(str(n - n % 10), '')
            units = lang_map.get(str(n % 10), '') if n % 10 else ''
            return f"{tens} {units}".strip()

        if n < 1000:
            result = f"{lang_map.get(str(n // 100), '')} {lang_map.get('100', '')}"
            if n % 100 != 0:
                result += f" {self.convert_to_indian_number(n % 100, lang_map)}"
            return result.strip()

        # Only keys of at least 100 may act as a multiplier; this guarantees
        # that both recursive calls receive a strictly smaller number.
        multipliers = [
            candidate for candidate in lang_map
            if candidate.isdecimal() and 100 <= int(candidate) <= n
        ]
        if not multipliers:
            # The table has no word large enough to express n.
            return ''

        base_key = max(multipliers, key=int)
        base = int(base_key)
        parts = [self.convert_to_indian_number(n // base, lang_map), lang_map[base_key]]
        if n % base != 0:
            parts.append(self.convert_to_indian_number(n % base, lang_map))
        return ' '.join(part for part in parts if part)
90
+
91
+
92
+
93
+
94
+ # number_dict = NumberDictionary()
95
+ # result = number_dict.num2text("2000048.145", "gujarati")
96
+ # print(result)
README.md CHANGED
@@ -1,3 +1,118 @@
1
  ---
2
  license: cc-by-4.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3
  ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ---
2
  license: cc-by-4.0
3
+ language:
4
+ - hi
5
+ - as
6
+ - bn
7
+ - bo
8
+ - en
9
+ - gu
10
+ - kn
11
+ - ml
12
+ - mr
13
+ - or
14
+ - pa
15
+ - ta
16
+ - te
17
+ - ur
18
+ tags:
19
+ - tts
20
+ - indictts
21
+ - fs2
22
+ - mfa
23
+ - HS
24
+ - hybrid_segmentation
25
+ - fastspeech2
26
  ---
27
+ # Latest Fastspeech2 Models using FLAT Start
28
+
29
+ This repository contains new and high quality Fastspeech2 Models for Indian languages implemented using the Flat Start for speech synthesis. The models are capable of generating mel-spectrograms from text inputs and can be used to synthesize speech.
30
+
31
+ The Repo is large in size. New Models are in "language"_latest folder.
32
+
33
+ Supported languages: Assamese, Bengali, Bodo, Dogri, Gujarati, Hindi, Kannada, Konkani(Maharashtrian), Maithili, Malayalam, Manipuri, Nepali, Punjabi, Rajasthani, Sanskrit, Tamil, Telugu.
34
+
35
+ NOTE - I do not own any rights to the contents of this repository; all rights belong to the original owners. This repository is only meant to make the speech models easier to install.
36
+
37
+ ## Model Files
38
+
39
+ The model for each language includes the following files:
40
+
41
+ - `config.yaml`: Configuration file for the Fastspeech2 Model.
42
+ - `energy_stats.npz`: Energy statistics for normalization during synthesis.
43
+ - `feats_stats.npz`: Features statistics for normalization during synthesis.
44
+ - `feats_type`: Features type information.
45
+ - `pitch_stats.npz`: Pitch statistics for normalization during synthesis.
46
+ - `model.pth`: Pre-trained Fastspeech2 model weights.
47
+
48
+ ## Installation
49
+
50
+ 1. Install [Miniconda](https://docs.conda.io/projects/miniconda/en/latest/) first. Create a conda environment using the provided `environment.yml` file:
51
+
52
+ ```shell
53
+ conda env create -f environment.yml
54
+ ```
55
+
56
+ 2. Activate the conda environment (the environment name is defined inside the `environment.yml` file):
57
+ ```shell
58
+ conda activate tts-hs-hifigan
59
+ ```
60
+
61
+ 3. Install PyTorch separately (you can install the specific version based on your requirements):
62
+ ```shell
63
+ conda install pytorch cudatoolkit
64
+ pip install torchaudio
65
+ ```
66
+ ## Vocoder
67
+ For generating WAV files from mel-spectrograms, you can use a vocoder of your choice. One popular option is the [HIFIGAN](https://github.com/jik876/hifi-gan) vocoder (Clone this repo and put it in the current working directory). Please refer to the documentation of the vocoder you choose for installation and usage instructions.
68
+
69
+ (**We have used the HIFIGAN V1 vocoder and have provided vocoders for a few languages in the Vocoder folder. If needed, make sure to adjust the path in the inference file.**)
70
+
71
+ ## Usage
72
+
73
+ The directory paths are relative. (If needed, edit **text_preprocess_for_inference.py** and **inference.py** and update the folder/file paths wherever required.)
74
+
75
+ **Please give the language and gender in lowercase and put the sample text in quotes. Adjust the output speed using the alpha parameter (higher values give slower speech and vice versa). The output argument is optional; the provided name will be used for the output file.**
76
+
77
+ Use the inference file to synthesize speech from text inputs:
78
+ ```shell
79
+ python inference.py --sample_text "Your input text here" --language <language>_latest --gender <gender> --alpha <alpha> --output_file <file_name.wav OR path/to/file_name.wav>
80
+ ```
81
+
82
+ **Example:**
83
+
84
+ ```
85
+ python inference.py --sample_text "श्रीलंका और पाकिस्तान में खेला जा रहा एशिया कप अब तक का सबसे विवादित टूर्नामेंट होता जा रहा है।" --language hindi_latest --gender male --alpha 1 --output_file male_hindi_output.wav
86
+ ```
87
+ The file will be stored as `male_hindi_output.wav` in the current working directory. If the **--output_file** argument is not given, it will be stored as `<language>_<gender>_output.wav` in the current working directory.
88
+
89
+ **Use "language"_latest in --language to use latest models.**
90
+
91
+
92
+ ### Citation
93
+ If you use this Fastspeech2 Model in your research or work, please consider citing:
94
+
95
+
96
+ COPYRIGHT
97
+ 2025, Speech Technology Consortium,
98
+
99
+ Bhashini, MeiTY and by Hema A Murthy & S Umesh,
100
+
101
+
102
+ DEPARTMENT OF COMPUTER SCIENCE AND ENGINEERING
103
+ and
104
+ ELECTRICAL ENGINEERING,
105
+ IIT MADRAS. ALL RIGHTS RESERVED
106
+
107
+
108
+
109
+ Shield: [![CC BY 4.0][cc-by-shield]][cc-by]
110
+
111
+ This work is licensed under a
112
+ [Creative Commons Attribution 4.0 International License][cc-by].
113
+
114
+ [![CC BY 4.0][cc-by-image]][cc-by]
115
+
116
+ [cc-by]: http://creativecommons.org/licenses/by/4.0/
117
+ [cc-by-image]: https://i.creativecommons.org/l/by/4.0/88x31.png
118
+ [cc-by-shield]: https://img.shields.io/badge/License-CC%20BY%204.0-lightgrey.svg
api.py ADDED
@@ -0,0 +1,63 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # TTS IITM SPEECH LAB
2
+ import requests
3
+ import json
4
+ import base64
5
+
6
+ text = "सुप्रभात, आप कैसे हैं?" # hindi
7
+ # text = "സുപ്രഭാതം, സുഖമാ?" # malayalam
8
+ # text = "সুপ্ৰভাত, তুমি কেনে?" # manipuri
9
+ # text = "सुप्रभात, तुम्ही कसे आहात?" # marathi
10
+ # text = "ಶುಭೋದಯ, ನೀವು ಹೇಗಿದ್ದೀರಿ?" # kannada
11
+ # text = "बसु म्विथ्बो, बरि दिबाबो?" # bodo male not working <---
12
+ # text = "Good morning, how are you?" # english
13
+ # text = "সুপ্ৰভাত, আপুনি কেমন আছে?" # assamese
14
+ # text = "காலை வணக்கம், நீங்கள் எப்படி இருக்கின்றீர்கள்?" # tamil
15
+ # text = "ସୁପ୍ରଭାତ, ଆପଣ କେମିତି ଅଛନ୍ତି?" # odia male not working <---
16
+ # text = "सुप्रभात, आप कैसे छो?" # rajasthani
17
+ # text = "శుభోదయం, మీరు ఎలా ఉన్నారు?" # telugu
18
+ # text = "সুপ্রভাত, আপনি কেমন আছেন?" # bengali male not working <---
19
+ # text = "સુપ્રભાત, તમે કેમ છો?" # gujarati
20
+
21
+ lang = 'hindi'
22
+ gender = 'female'
23
+
24
+ url = "http://localhost:4005/tts"
25
+ # url = 'http://projects.respark.iitm.ac.in:8009/tts' # proxy
26
+
27
# Build the JSON request body expected by the /tts endpoint.
payload = json.dumps({
    "input": text,
    "gender": gender,
    "lang": lang,
    "alpha": 1,
    "segmentwise": "True"
})
headers = {'Content-Type': 'application/json'}
response = requests.post(url, headers=headers, data=payload).json()

# On errors the server replies without an "audio" field (app.py sends
# status="failure" plus a "reason"); report that instead of a KeyError.
if 'audio' not in response:
    raise SystemExit(f"TTS request failed: {response.get('reason', response)}")

# The audio field is base64-encoded WAV data (app.py encodes the output of
# scipy.io.wavfile.write), so store it with a .wav extension.
file_name = "tts.wav"
with open(file_name, 'wb') as wav_file:
    wav_file.write(base64.b64decode(response['audio']))
43
+
44
+ '''
45
+ Supported languages
46
+
47
+ Assamese
48
+ Bengali
49
+ Bodo
50
+ English
51
+ Gujarati
52
+ Hindi
53
+ Kannada
54
+ Malayalam
55
+ Manipuri
56
+ Marathi
57
+ Odia
58
+ Punjabi
59
+ Rajasthani
60
+ Tamil
61
+ Telugu
62
+ Urdu
63
+ '''
app.py ADDED
@@ -0,0 +1,179 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from flask import Flask, render_template, request, send_file, jsonify
2
+ import requests
3
+ import json
4
+ import ssl
5
+ import logging
6
+ import sys
7
+ import os
8
+ import base64
9
+ import io
10
+ #replace the path with your hifigan path to import Generator from models.py
11
+ sys.path.append("hifigan")
12
+ # import argparse
13
+ import torch
14
+ from espnet2.bin.tts_inference import Text2Speech
15
+ from models import Generator
16
+ from scipy.io.wavfile import write
17
+ from meldataset import MAX_WAV_VALUE
18
+ from env import AttrDict
19
+ import json
20
+ import yaml
21
+ from text_preprocess_for_inference import TTSDurAlignPreprocessor
22
+ # import time
23
+
24
+ logging.basicConfig(filename='access.log', level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
25
+
26
# Sample rate passed to scipy.io.wavfile.write when encoding responses.
# NOTE(review): the model configs visible in this commit use fs: 48000 --
# confirm that 22050 matches what the vocoder actually produces.
SAMPLING_RATE = 22050

# Prefer the GPU when one is available, otherwise run on the CPU.
device = "cuda" if torch.cuda.is_available() else "cpu"

# Shared text preprocessor used by the /tts route.
preprocessor = TTSDurAlignPreprocessor()

app = Flask(__name__)
35
+ # app.config['SECRET_KEY'] = 'key'
36
+ # socketio = SocketIO(app)
37
+
38
+ # @socketio.on('new_user')
39
+ # def handle_new_user(data):
40
+ # client_id = data['id']
41
+ # # print('\n'+f"New user connected with ID: {client_id}")
42
+ # logging.info('\n'+f"New user connected with ID: {client_id}")
43
+
44
def load_hifigan_vocoder(language, gender, device):
    """Build a HiFi-GAN generator for ``gender`` and load its weights.

    Args:
        language: Accepted for interface symmetry; the paths below do not
            use it (they always point at the ``aryan`` directory).
        gender: Sub-directory of ``vocoder/`` to load from.
        device: Device string understood by ``torch.device``.

    Returns:
        The generator in eval mode with weight norm removed.
    """
    base_dir = f"vocoder/{gender}/aryan/hifigan"
    config_path = f"{base_dir}/config.json"
    checkpoint_path = f"{base_dir}/generator"

    # Parse the vocoder hyper-parameters.
    with open(config_path, 'r') as config_file:
        hparams = AttrDict(json.load(config_file))
    torch.manual_seed(hparams.seed)

    # Instantiate the generator on the target device and restore weights.
    target = torch.device(device)
    generator = Generator(hparams).to(target)
    checkpoint = torch.load(checkpoint_path, target)
    generator.load_state_dict(checkpoint['generator'])

    # Inference-only setup.
    generator.eval()
    generator.remove_weight_norm()
    return generator
64
+
65
def load_fastspeech2_model(language, gender, device):
    """Load the FastSpeech2 model stored under ``<language>/<gender>/model``.

    The model's ``config.yaml`` must point at the feature, pitch and energy
    statistics files by absolute path, so the three ``stats_file`` entries
    are set to locations under the current working directory. The config
    file is rewritten only when one of those entries actually changes, so
    repeated calls do not rewrite the file again and again.

    Args:
        language: Model directory name, e.g. ``"hindi"``.
        gender: ``"male"`` or ``"female"`` sub-directory.
        device: Device string passed to ``Text2Speech``.

    Returns:
        A ``Text2Speech`` instance built from the config and ``model.pth``.
    """
    tts_config = f"{language}/{gender}/model/config.yaml"
    tts_model = f"{language}/{gender}/model/model.pth"

    # The config can contain non-ASCII tokens, so do not rely on the
    # platform default encoding when reading it.
    with open(tts_config, "r", encoding="utf-8") as file:
        config = yaml.safe_load(file)

    current_working_directory = os.getcwd()
    stats_files = {
        "normalize_conf": "model/feats_stats.npz",
        "pitch_normalize_conf": "model/pitch_stats.npz",
        "energy_normalize_conf": "model/energy_stats.npz",
    }

    changed = False
    for section, relative_path in stats_files.items():
        stats_path = os.path.join(current_working_directory, language, gender, relative_path)
        if config[section].get("stats_file") != stats_path:
            config[section]["stats_file"] = stats_path
            changed = True

    if changed:
        with open(tts_config, "w", encoding="utf-8") as file:
            yaml.dump(config, file)

    return Text2Speech(train_config=tts_config, model_file=tts_model, device=device)
93
+
94
def text_synthesis(language, gender, sample_text, vocoder, MAX_WAV_VALUE, device, alpha=1):
    """Synthesize ``sample_text`` and return 16-bit PCM samples.

    Args:
        language: Language passed to ``load_fastspeech2_model``.
        gender: Gender passed to ``load_fastspeech2_model``.
        sample_text: Text handed to the FastSpeech2 model.
        vocoder: Callable that turns the mel tensor into a waveform tensor.
        MAX_WAV_VALUE: Factor applied to the waveform before the int16 cast.
        device: Device the mel tensor is moved to before vocoding.
        alpha: Forwarded to the model as ``decode_conf={"alpha": alpha}``.

    Returns:
        numpy array of dtype ``int16`` holding the audio samples.
    """
    with torch.no_grad():
        # The acoustic model is loaded anew on every call.
        tts_model = load_fastspeech2_model(language, gender, device)

        # Text -> mel-spectrogram.
        result = tts_model(sample_text, decode_conf={"alpha": alpha})
        print("TTS Done")

        # Reshape to (1, n_mels, frames); the 2.3262 scale factor is kept
        # exactly as in the original code (its derivation is not shown here).
        mel = (result["feat_gen_denorm"].T.unsqueeze(0) * 2.3262).to(device)

        # Mel-spectrogram -> waveform, scaled and cast to 16-bit PCM.
        waveform = vocoder(mel).squeeze() * MAX_WAV_VALUE
        return waveform.cpu().numpy().astype('int16')
115
+
116
def setup_app():
    """Load a vocoder for every gender/language pair and warm each one up.

    For each combination a HiFi-GAN vocoder is loaded and one short dummy
    synthesis is attempted. A failing dummy call is reported (printed and
    logged with its traceback) but does not stop start-up, so the vocoder
    stays registered even when the matching acoustic model is unusable.

    Returns:
        dict: ``vocoders[gender][language]`` mapped to the loaded vocoder.
    """
    genders = ['male','female']
    # to make dummy calls in all languages available
    languages = {'hindi': "नमस्ते",'malayalam': "ഹലോ",'manipuri': "হ্যালো",'marathi': "हॅलो",'kannada': "ಹಲೋ",'bodo': "हॅलो",'english': "Hello",'assamese': "হ্যালো",'tamil': "ஹலோ",'odia': "ହେଲୋ",'rajasthani': "हॅलो",'telugu': "హలో",'bengali': "হ্যালো",'gujarati': "હલો"}

    vocoders = {}
    for gender in genders:
        vocoders[gender] = {}
        for language, text in languages.items():
            # Load the HiFi-GAN vocoder with dynamic language and gender
            vocoder = load_hifigan_vocoder(language, gender, device)
            vocoders[gender][language] = vocoder
            # dummy calls
            print(f"making dummy calls for {language} - {gender}")
            try:
                text_synthesis(language, gender, text, vocoder, MAX_WAV_VALUE, device)
            except Exception:
                # Catch Exception rather than everything, so Ctrl-C and
                # SystemExit still abort start-up, and keep the traceback.
                message = f"cannot make dummy call for {gender} - {language} <==================="
                print(message.upper())
                logging.exception("Dummy synthesis failed for %s - %s", gender, language)

    print("Server Started...")
    return vocoders
138
+ vocoders = setup_app()
139
+
140
@app.route('/', methods=['GET'])
def main():
    """Answer GET requests on the root URL with the service identifier."""
    service_name = "IITM_TTS_V2"
    return service_name
143
+
144
@app.route('/tts', methods=['GET', 'POST'], strict_slashes=False)
def tts():
    """Synthesize speech for the JSON request and return it base64-encoded.

    Expected JSON keys: ``input`` (text, must be a string), ``gender``,
    ``lang`` (lower-cased before use) and ``alpha``.

    Returns:
        A JSON response with ``status="success"`` and ``audio`` (base64 of
        the WAV bytes), or ``status="failure"`` and ``reason``.
    """
    try:
        json_data = request.get_json()
        text = json_data["input"]
        if not isinstance(text, str):
            input_type = type(text)
            # Return immediately: previously this response was built but
            # processing carried on with the unsupported input.
            return jsonify(status='failure', reason=f"Unsupported input type {input_type}. Input text should be in string format.")
        gender = json_data["gender"]
        language = json_data["lang"].lower()
        alpha = json_data["alpha"]
        # Preprocess the sample text
        preprocessed_text, phrases = preprocessor.preprocess(text, language, gender)
        preprocessed_text = " ".join(preprocessed_text)
        vocoder = vocoders[gender][language]
        out = text_synthesis(language, gender, preprocessed_text, vocoder, MAX_WAV_VALUE, device, alpha=alpha)

        # Encode the WAV in memory to avoid saving a file on disk.
        output_stream = io.BytesIO()
        write(output_stream, SAMPLING_RATE, out)
        audio_wav_bytes = base64.b64encode(output_stream.getvalue())

        ret = jsonify(status="success",audio=audio_wav_bytes.decode('utf-8'))

    except Exception as err:
        # Keep the traceback in the log; the client only gets the message.
        logging.exception("TTS request failed")
        ret = jsonify(status="failure", reason=str(err))
    return ret
175
+
176
if __name__ == '__main__':
    # ssl_context = ssl.create_default_context(ssl.Purpose.CLIENT_AUTH)
    # ssl_context.load_cert_chain('./ssl2023/iitm2022.crt','./ssl2023/iitm2022.key')

    # The server listens on every interface, so the interactive debugger
    # must stay off unless explicitly requested: it allows arbitrary code
    # execution for anyone who can reach the port. Set FLASK_DEBUG=1 to
    # enable it for local development.
    debug_enabled = os.environ.get("FLASK_DEBUG", "").lower() in ("1", "true", "yes")
    app.run(host='0.0.0.0', port=4005, debug=debug_enabled)
assamese_latest/female/model/config.yaml ADDED
@@ -0,0 +1,319 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/tuning/train_fastspeech2.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ drop_last_iter: false
5
+ dry_run: false
6
+ iterator_type: sequence
7
+ valid_iterator_type: null
8
+ output_dir: exp/tts_train_fastspeech2_raw_char_None
9
+ ngpu: 1
10
+ seed: 0
11
+ num_workers: 1
12
+ num_att_plot: 3
13
+ dist_backend: nccl
14
+ dist_init_method: env://
15
+ dist_world_size: 2
16
+ dist_rank: 0
17
+ local_rank: 0
18
+ dist_master_addr: localhost
19
+ dist_master_port: 36807
20
+ dist_launcher: null
21
+ multiprocessing_distributed: true
22
+ unused_parameters: false
23
+ sharded_ddp: false
24
+ use_deepspeed: false
25
+ deepspeed_config: null
26
+ cudnn_enabled: true
27
+ cudnn_benchmark: false
28
+ cudnn_deterministic: true
29
+ use_tf32: false
30
+ collect_stats: false
31
+ write_collected_feats: false
32
+ max_epoch: 1000
33
+ patience: null
34
+ val_scheduler_criterion:
35
+ - valid
36
+ - loss
37
+ early_stopping_criterion:
38
+ - valid
39
+ - loss
40
+ - min
41
+ best_model_criterion:
42
+ - - valid
43
+ - loss
44
+ - min
45
+ - - train
46
+ - loss
47
+ - min
48
+ keep_nbest_models: 5
49
+ nbest_averaging_interval: 0
50
+ grad_clip: 1.0
51
+ grad_clip_type: 2.0
52
+ grad_noise: false
53
+ accum_grad: 8
54
+ no_forward_run: false
55
+ resume: true
56
+ train_dtype: float32
57
+ use_amp: false
58
+ log_interval: null
59
+ use_matplotlib: true
60
+ use_tensorboard: true
61
+ create_graph_in_tensorboard: false
62
+ use_wandb: false
63
+ wandb_project: null
64
+ wandb_id: null
65
+ wandb_entity: null
66
+ wandb_name: null
67
+ wandb_model_log_interval: -1
68
+ detect_anomaly: false
69
+ use_adapter: false
70
+ adapter: lora
71
+ save_strategy: all
72
+ adapter_conf: {}
73
+ pretrain_path: null
74
+ init_param: []
75
+ ignore_init_mismatch: false
76
+ freeze_param: []
77
+ num_iters_per_epoch: 800
78
+ batch_size: 20
79
+ valid_batch_size: null
80
+ batch_bins: 3000000
81
+ valid_batch_bins: null
82
+ train_shape_file:
83
+ - exp/tts_stats_raw_char_None/train/text_shape.char
84
+ - exp/tts_stats_raw_char_None/train/speech_shape
85
+ valid_shape_file:
86
+ - exp/tts_stats_raw_char_None/valid/text_shape.char
87
+ - exp/tts_stats_raw_char_None/valid/speech_shape
88
+ batch_type: numel
89
+ valid_batch_type: null
90
+ fold_length:
91
+ - 150
92
+ - 819200
93
+ sort_in_batch: descending
94
+ shuffle_within_batch: false
95
+ sort_batch: descending
96
+ multiple_iterator: false
97
+ chunk_length: 500
98
+ chunk_shift_ratio: 0.5
99
+ num_cache_chunks: 1024
100
+ chunk_excluded_key_prefixes: []
101
+ chunk_default_fs: null
102
+ chunk_max_abs_length: null
103
+ chunk_discard_short_samples: true
104
+ train_data_path_and_name_and_type:
105
+ - - dump/raw/tr_no_dev/text
106
+ - text
107
+ - text
108
+ - - duration_info/tr_no_dev/durations
109
+ - durations
110
+ - text_int
111
+ - - dump/raw/tr_no_dev/wav.scp
112
+ - speech
113
+ - sound
114
+ - - exp/tts_stats_raw_char_None/train/collect_feats/pitch.scp
115
+ - pitch
116
+ - npy
117
+ - - exp/tts_stats_raw_char_None/train/collect_feats/energy.scp
118
+ - energy
119
+ - npy
120
+ valid_data_path_and_name_and_type:
121
+ - - dump/raw/dev/text
122
+ - text
123
+ - text
124
+ - - duration_info/dev/durations
125
+ - durations
126
+ - text_int
127
+ - - dump/raw/dev/wav.scp
128
+ - speech
129
+ - sound
130
+ - - exp/tts_stats_raw_char_None/valid/collect_feats/pitch.scp
131
+ - pitch
132
+ - npy
133
+ - - exp/tts_stats_raw_char_None/valid/collect_feats/energy.scp
134
+ - energy
135
+ - npy
136
+ multi_task_dataset: false
137
+ allow_variable_data_keys: false
138
+ max_cache_size: 0.0
139
+ max_cache_fd: 32
140
+ allow_multi_rates: false
141
+ valid_max_cache_size: null
142
+ exclude_weight_decay: false
143
+ exclude_weight_decay_conf: {}
144
+ optim: adam
145
+ optim_conf:
146
+ lr: 1.0
147
+ scheduler: noamlr
148
+ scheduler_conf:
149
+ model_size: 384
150
+ warmup_steps: 4000
151
+ token_list:
152
+ - <blank>
153
+ - <unk>
154
+ - <space>
155
+ - $
156
+ - ','
157
+ - .
158
+ - M
159
+ - q
160
+ - H
161
+ - k
162
+ - ख
163
+ - g
164
+ - घ
165
+ - ङ
166
+ - c
167
+ - C
168
+ - j
169
+ - J
170
+ - ञ
171
+ - ट
172
+ - ठ
173
+ - ड
174
+ - ढ
175
+ - ण
176
+ - t
177
+ - थ
178
+ - d
179
+ - ध
180
+ - n
181
+ - ऩ
182
+ - p
183
+ - P
184
+ - b
185
+ - B
186
+ - m
187
+ - y
188
+ - r
189
+ - ऱ
190
+ - l
191
+ - ള
192
+ - Z
193
+ - w
194
+ - श
195
+ - ष
196
+ - s
197
+ - h
198
+ - Y
199
+ - ऽ
200
+ - क
201
+ - K
202
+ - G
203
+ - z
204
+ - D
205
+ - T
206
+ - f
207
+ - ॠ
208
+ - ൺ
209
+ - N
210
+ - ർ
211
+ - ൽ
212
+ - ൾ
213
+ - a
214
+ - A
215
+ - i
216
+ - I
217
+ - u
218
+ - U
219
+ - R
220
+ - ऍ
221
+ - e
222
+ - E
223
+ - ऐ
224
+ - ऑ
225
+ - o
226
+ - O
227
+ - औ
228
+ - உ
229
+ - <sos/eos>
230
+ odim: null
231
+ model_conf: {}
232
+ use_preprocessor: true
233
+ token_type: char
234
+ bpemodel: null
235
+ non_linguistic_symbols: null
236
+ cleaner: null
237
+ g2p: null
238
+ feats_extract: fbank
239
+ feats_extract_conf:
240
+ n_fft: 8192
241
+ hop_length: 1024
242
+ win_length: 4096
243
+ fs: 48000
244
+ fmin: 0
245
+ fmax: 24000
246
+ n_mels: 160
247
+ normalize: global_mvn
248
+ normalize_conf:
249
+ stats_file: exp/tts_stats_raw_char_None/train/feats_stats.npz
250
+ tts: fastspeech2
251
+ tts_conf:
252
+ adim: 384
253
+ aheads: 2
254
+ elayers: 4
255
+ eunits: 1536
256
+ dlayers: 4
257
+ dunits: 1536
258
+ positionwise_layer_type: conv1d
259
+ positionwise_conv_kernel_size: 3
260
+ duration_predictor_layers: 2
261
+ duration_predictor_chans: 256
262
+ duration_predictor_kernel_size: 3
263
+ postnet_layers: 5
264
+ postnet_filts: 5
265
+ postnet_chans: 256
266
+ use_masking: true
267
+ use_scaled_pos_enc: true
268
+ encoder_normalize_before: true
269
+ decoder_normalize_before: true
270
+ reduction_factor: 1
271
+ init_type: xavier_uniform
272
+ init_enc_alpha: 1.0
273
+ init_dec_alpha: 1.0
274
+ transformer_enc_dropout_rate: 0.2
275
+ transformer_enc_positional_dropout_rate: 0.2
276
+ transformer_enc_attn_dropout_rate: 0.2
277
+ transformer_dec_dropout_rate: 0.2
278
+ transformer_dec_positional_dropout_rate: 0.2
279
+ transformer_dec_attn_dropout_rate: 0.2
280
+ pitch_predictor_layers: 5
281
+ pitch_predictor_chans: 256
282
+ pitch_predictor_kernel_size: 5
283
+ pitch_predictor_dropout: 0.5
284
+ pitch_embed_kernel_size: 1
285
+ pitch_embed_dropout: 0.0
286
+ stop_gradient_from_pitch_predictor: true
287
+ energy_predictor_layers: 2
288
+ energy_predictor_chans: 256
289
+ energy_predictor_kernel_size: 3
290
+ energy_predictor_dropout: 0.5
291
+ energy_embed_kernel_size: 1
292
+ energy_embed_dropout: 0.0
293
+ stop_gradient_from_energy_predictor: false
294
+ pitch_extract: dio
295
+ pitch_extract_conf:
296
+ fs: 48000
297
+ n_fft: 8192
298
+ hop_length: 1024
299
+ f0max: 400
300
+ f0min: 80
301
+ reduction_factor: 1
302
+ pitch_normalize: global_mvn
303
+ pitch_normalize_conf:
304
+ stats_file: exp/tts_stats_raw_char_None/train/pitch_stats.npz
305
+ energy_extract: energy
306
+ energy_extract_conf:
307
+ fs: 48000
308
+ n_fft: 8192
309
+ hop_length: 1024
310
+ win_length: 4096
311
+ reduction_factor: 1
312
+ energy_normalize: global_mvn
313
+ energy_normalize_conf:
314
+ stats_file: exp/tts_stats_raw_char_None/train/energy_stats.npz
315
+ required:
316
+ - output_dir
317
+ - token_list
318
+ version: '202402'
319
+ distributed: true
assamese_latest/female/model/energy_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04e33101ff3538ca740f6c8fc35483fffab31722c9f0ae99adab07dd29c361de
3
+ size 770
assamese_latest/female/model/feats_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b9b6ee7475d00198e08ea5b675f2cb5e81239a5f0babf83866b37b51ef2e0a1
3
+ size 2042
assamese_latest/female/model/model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e5cd37cac859ad35acd2d0510fe3b4c5b388d167c9d70fb12efd1f5d0b03560
3
+ size 152129434
assamese_latest/female/model/pitch_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3dbac0bea459888e39a56f5f04e150d35a21f966e6e04b1d027c354e9de99aab
3
+ size 770
assamese_latest/male/model/config.yaml ADDED
@@ -0,0 +1,315 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ accum_grad: 8
2
+ adapter: lora
3
+ adapter_conf: {}
4
+ allow_multi_rates: false
5
+ allow_variable_data_keys: false
6
+ batch_bins: 3000000
7
+ batch_size: 20
8
+ batch_type: numel
9
+ best_model_criterion:
10
+ - - valid
11
+ - loss
12
+ - min
13
+ - - train
14
+ - loss
15
+ - min
16
+ bpemodel: null
17
+ chunk_default_fs: null
18
+ chunk_discard_short_samples: true
19
+ chunk_excluded_key_prefixes: []
20
+ chunk_length: 500
21
+ chunk_max_abs_length: null
22
+ chunk_shift_ratio: 0.5
23
+ cleaner: null
24
+ collect_stats: false
25
+ config: conf/tuning/train_fastspeech2.yaml
26
+ create_graph_in_tensorboard: false
27
+ cudnn_benchmark: false
28
+ cudnn_deterministic: true
29
+ cudnn_enabled: true
30
+ detect_anomaly: false
31
+ dist_backend: nccl
32
+ dist_init_method: env://
33
+ dist_launcher: null
34
+ dist_master_addr: localhost
35
+ dist_master_port: 44409
36
+ dist_rank: 0
37
+ dist_world_size: 2
38
+ distributed: true
39
+ drop_last_iter: false
40
+ dry_run: false
41
+ early_stopping_criterion:
42
+ - valid
43
+ - loss
44
+ - min
45
+ energy_extract: energy
46
+ energy_extract_conf:
47
+ fs: 48000
48
+ hop_length: 1024
49
+ n_fft: 8192
50
+ reduction_factor: 1
51
+ win_length: 4096
52
+ energy_normalize: global_mvn
53
+ energy_normalize_conf:
54
+ stats_file: /home/speech/Fastspeech2_HS/assamese_latest/male/model/energy_stats.npz
55
+ exclude_weight_decay: false
56
+ exclude_weight_decay_conf: {}
57
+ feats_extract: fbank
58
+ feats_extract_conf:
59
+ fmax: 24000
60
+ fmin: 0
61
+ fs: 48000
62
+ hop_length: 1024
63
+ n_fft: 8192
64
+ n_mels: 160
65
+ win_length: 4096
66
+ fold_length:
67
+ - 150
68
+ - 819200
69
+ freeze_param: []
70
+ g2p: null
71
+ grad_clip: 1.0
72
+ grad_clip_type: 2.0
73
+ grad_noise: false
74
+ ignore_init_mismatch: false
75
+ init_param: []
76
+ iterator_type: sequence
77
+ keep_nbest_models: 5
78
+ local_rank: 0
79
+ log_interval: null
80
+ log_level: INFO
81
+ max_cache_fd: 32
82
+ max_cache_size: 0.0
83
+ max_epoch: 1000
84
+ model_conf: {}
85
+ multiple_iterator: false
86
+ multiprocessing_distributed: true
87
+ nbest_averaging_interval: 0
88
+ ngpu: 1
89
+ no_forward_run: false
90
+ non_linguistic_symbols: null
91
+ normalize: global_mvn
92
+ normalize_conf:
93
+ stats_file: /home/speech/Fastspeech2_HS/assamese_latest/male/model/feats_stats.npz
94
+ num_att_plot: 3
95
+ num_cache_chunks: 1024
96
+ num_iters_per_epoch: 800
97
+ num_workers: 1
98
+ odim: null
99
+ optim: adam
100
+ optim_conf:
101
+ lr: 1.0
102
+ output_dir: exp/tts_train_fastspeech2_raw_char_None
103
+ patience: null
104
+ pitch_extract: dio
105
+ pitch_extract_conf:
106
+ f0max: 350
107
+ f0min: 40
108
+ fs: 48000
109
+ hop_length: 1024
110
+ n_fft: 8192
111
+ reduction_factor: 1
112
+ pitch_normalize: global_mvn
113
+ pitch_normalize_conf:
114
+ stats_file: /home/speech/Fastspeech2_HS/assamese_latest/male/model/pitch_stats.npz
115
+ pretrain_path: null
116
+ print_config: false
117
+ required:
118
+ - output_dir
119
+ - token_list
120
+ resume: true
121
+ save_strategy: all
122
+ scheduler: noamlr
123
+ scheduler_conf:
124
+ model_size: 384
125
+ warmup_steps: 4000
126
+ seed: 0
127
+ sharded_ddp: false
128
+ shuffle_within_batch: false
129
+ sort_batch: descending
130
+ sort_in_batch: descending
131
+ token_list:
132
+ - <blank>
133
+ - <unk>
134
+ - <space>
135
+ - $
136
+ - ','
137
+ - .
138
+ - M
139
+ - q
140
+ - H
141
+ - k
142
+ - "\u0916"
143
+ - g
144
+ - "\u0918"
145
+ - "\u0919"
146
+ - c
147
+ - C
148
+ - j
149
+ - J
150
+ - "\u091E"
151
+ - "\u091F"
152
+ - "\u0920"
153
+ - "\u0921"
154
+ - "\u0922"
155
+ - "\u0923"
156
+ - t
157
+ - "\u0925"
158
+ - d
159
+ - "\u0927"
160
+ - n
161
+ - "\u0929"
162
+ - p
163
+ - P
164
+ - b
165
+ - B
166
+ - m
167
+ - y
168
+ - r
169
+ - "\u0931"
170
+ - l
171
+ - "\u0D33"
172
+ - Z
173
+ - w
174
+ - "\u0936"
175
+ - "\u0937"
176
+ - s
177
+ - h
178
+ - Y
179
+ - "\u093D"
180
+ - "\u0915"
181
+ - K
182
+ - G
183
+ - z
184
+ - D
185
+ - T
186
+ - f
187
+ - "\u0960"
188
+ - "\u0D7A"
189
+ - N
190
+ - "\u0D7C"
191
+ - "\u0D7D"
192
+ - "\u0D7E"
193
+ - a
194
+ - A
195
+ - i
196
+ - I
197
+ - u
198
+ - U
199
+ - R
200
+ - "\u090D"
201
+ - e
202
+ - E
203
+ - "\u0910"
204
+ - "\u0911"
205
+ - o
206
+ - O
207
+ - "\u0914"
208
+ - "\u0B89"
209
+ - <sos/eos>
210
+ token_type: char
211
+ train_data_path_and_name_and_type:
212
+ - - dump/raw/tr_no_dev/text
213
+ - text
214
+ - text
215
+ - - duration_info/tr_no_dev/durations
216
+ - durations
217
+ - text_int
218
+ - - dump/raw/tr_no_dev/wav.scp
219
+ - speech
220
+ - sound
221
+ - - exp/tts_stats_raw_char_None/train/collect_feats/pitch.scp
222
+ - pitch
223
+ - npy
224
+ - - exp/tts_stats_raw_char_None/train/collect_feats/energy.scp
225
+ - energy
226
+ - npy
227
+ train_dtype: float32
228
+ train_shape_file:
229
+ - exp/tts_stats_raw_char_None/train/text_shape.char
230
+ - exp/tts_stats_raw_char_None/train/speech_shape
231
+ tts: fastspeech2
232
+ tts_conf:
233
+ adim: 384
234
+ aheads: 2
235
+ decoder_normalize_before: true
236
+ dlayers: 4
237
+ dunits: 1536
238
+ duration_predictor_chans: 256
239
+ duration_predictor_kernel_size: 3
240
+ duration_predictor_layers: 2
241
+ elayers: 4
242
+ encoder_normalize_before: true
243
+ energy_embed_dropout: 0.0
244
+ energy_embed_kernel_size: 1
245
+ energy_predictor_chans: 256
246
+ energy_predictor_dropout: 0.5
247
+ energy_predictor_kernel_size: 3
248
+ energy_predictor_layers: 2
249
+ eunits: 1536
250
+ init_dec_alpha: 1.0
251
+ init_enc_alpha: 1.0
252
+ init_type: xavier_uniform
253
+ pitch_embed_dropout: 0.0
254
+ pitch_embed_kernel_size: 1
255
+ pitch_predictor_chans: 256
256
+ pitch_predictor_dropout: 0.5
257
+ pitch_predictor_kernel_size: 5
258
+ pitch_predictor_layers: 5
259
+ positionwise_conv_kernel_size: 3
260
+ positionwise_layer_type: conv1d
261
+ postnet_chans: 256
262
+ postnet_filts: 5
263
+ postnet_layers: 5
264
+ reduction_factor: 1
265
+ stop_gradient_from_energy_predictor: false
266
+ stop_gradient_from_pitch_predictor: true
267
+ transformer_dec_attn_dropout_rate: 0.2
268
+ transformer_dec_dropout_rate: 0.2
269
+ transformer_dec_positional_dropout_rate: 0.2
270
+ transformer_enc_attn_dropout_rate: 0.2
271
+ transformer_enc_dropout_rate: 0.2
272
+ transformer_enc_positional_dropout_rate: 0.2
273
+ use_masking: true
274
+ use_scaled_pos_enc: true
275
+ unused_parameters: false
276
+ use_adapter: false
277
+ use_amp: false
278
+ use_matplotlib: true
279
+ use_preprocessor: true
280
+ use_tensorboard: true
281
+ use_wandb: false
282
+ val_scheduler_criterion:
283
+ - valid
284
+ - loss
285
+ valid_batch_bins: null
286
+ valid_batch_size: null
287
+ valid_batch_type: null
288
+ valid_data_path_and_name_and_type:
289
+ - - dump/raw/dev/text
290
+ - text
291
+ - text
292
+ - - duration_info/dev/durations
293
+ - durations
294
+ - text_int
295
+ - - dump/raw/dev/wav.scp
296
+ - speech
297
+ - sound
298
+ - - exp/tts_stats_raw_char_None/valid/collect_feats/pitch.scp
299
+ - pitch
300
+ - npy
301
+ - - exp/tts_stats_raw_char_None/valid/collect_feats/energy.scp
302
+ - energy
303
+ - npy
304
+ valid_iterator_type: null
305
+ valid_max_cache_size: null
306
+ valid_shape_file:
307
+ - exp/tts_stats_raw_char_None/valid/text_shape.char
308
+ - exp/tts_stats_raw_char_None/valid/speech_shape
309
+ version: '202402'
310
+ wandb_entity: null
311
+ wandb_id: null
312
+ wandb_model_log_interval: -1
313
+ wandb_name: null
314
+ wandb_project: null
315
+ write_collected_feats: false
assamese_latest/male/model/energy_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a64d5dd4ee24ad1b403ad07911b9e30f4d482f97c331b844272725617fb941a6
3
+ size 770
assamese_latest/male/model/feats_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecbb77de18a76f7e991b256a042acc361aa338498daa52048978ea050a9fd528
3
+ size 2042
assamese_latest/male/model/feats_type ADDED
@@ -0,0 +1 @@
 
 
1
+ raw
assamese_latest/male/model/model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f52c3b1c4edd258dbd9e46920896bc0215cfe5c78957e3ee2a25de6f3ef916b
3
+ size 152128410
assamese_latest/male/model/pitch_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47de3b8ee9c740a5f24ceafcbe9b3486dfd4b3676d95282d7ce97c1116d834fd
3
+ size 770
bengali_latest/male/model/config.yaml ADDED
@@ -0,0 +1,315 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ accum_grad: 8
2
+ adapter: lora
3
+ adapter_conf: {}
4
+ allow_multi_rates: false
5
+ allow_variable_data_keys: false
6
+ batch_bins: 3000000
7
+ batch_size: 20
8
+ batch_type: numel
9
+ best_model_criterion:
10
+ - - valid
11
+ - loss
12
+ - min
13
+ - - train
14
+ - loss
15
+ - min
16
+ bpemodel: null
17
+ chunk_default_fs: null
18
+ chunk_discard_short_samples: true
19
+ chunk_excluded_key_prefixes: []
20
+ chunk_length: 500
21
+ chunk_max_abs_length: null
22
+ chunk_shift_ratio: 0.5
23
+ cleaner: null
24
+ collect_stats: false
25
+ config: conf/tuning/train_fastspeech2.yaml
26
+ create_graph_in_tensorboard: false
27
+ cudnn_benchmark: false
28
+ cudnn_deterministic: true
29
+ cudnn_enabled: true
30
+ detect_anomaly: false
31
+ dist_backend: nccl
32
+ dist_init_method: env://
33
+ dist_launcher: null
34
+ dist_master_addr: localhost
35
+ dist_master_port: 38255
36
+ dist_rank: 0
37
+ dist_world_size: 2
38
+ distributed: true
39
+ drop_last_iter: false
40
+ dry_run: false
41
+ early_stopping_criterion:
42
+ - valid
43
+ - loss
44
+ - min
45
+ energy_extract: energy
46
+ energy_extract_conf:
47
+ fs: 48000
48
+ hop_length: 1024
49
+ n_fft: 8192
50
+ reduction_factor: 1
51
+ win_length: 4096
52
+ energy_normalize: global_mvn
53
+ energy_normalize_conf:
54
+ stats_file: /home/speech/Fastspeech2_latest models/Fastspeech2_HS/bengali_latest/male/model/energy_stats.npz
55
+ exclude_weight_decay: false
56
+ exclude_weight_decay_conf: {}
57
+ feats_extract: fbank
58
+ feats_extract_conf:
59
+ fmax: 24000
60
+ fmin: 0
61
+ fs: 48000
62
+ hop_length: 1024
63
+ n_fft: 8192
64
+ n_mels: 160
65
+ win_length: 4096
66
+ fold_length:
67
+ - 150
68
+ - 819200
69
+ freeze_param: []
70
+ g2p: null
71
+ grad_clip: 1.0
72
+ grad_clip_type: 2.0
73
+ grad_noise: false
74
+ ignore_init_mismatch: false
75
+ init_param: []
76
+ iterator_type: sequence
77
+ keep_nbest_models: 5
78
+ local_rank: 0
79
+ log_interval: null
80
+ log_level: INFO
81
+ max_cache_fd: 32
82
+ max_cache_size: 0.0
83
+ max_epoch: 1000
84
+ model_conf: {}
85
+ multiple_iterator: false
86
+ multiprocessing_distributed: true
87
+ nbest_averaging_interval: 0
88
+ ngpu: 1
89
+ no_forward_run: false
90
+ non_linguistic_symbols: null
91
+ normalize: global_mvn
92
+ normalize_conf:
93
+ stats_file: /home/speech/Fastspeech2_latest models/Fastspeech2_HS/bengali_latest/male/model/feats_stats.npz
94
+ num_att_plot: 3
95
+ num_cache_chunks: 1024
96
+ num_iters_per_epoch: 800
97
+ num_workers: 1
98
+ odim: null
99
+ optim: adam
100
+ optim_conf:
101
+ lr: 1.0
102
+ output_dir: exp/tts_train_fastspeech2_raw_char_None
103
+ patience: null
104
+ pitch_extract: dio
105
+ pitch_extract_conf:
106
+ f0max: 350
107
+ f0min: 40
108
+ fs: 48000
109
+ hop_length: 1024
110
+ n_fft: 8192
111
+ reduction_factor: 1
112
+ pitch_normalize: global_mvn
113
+ pitch_normalize_conf:
114
+ stats_file: /home/speech/Fastspeech2_latest models/Fastspeech2_HS/bengali_latest/male/model/pitch_stats.npz
115
+ pretrain_path: null
116
+ print_config: false
117
+ required:
118
+ - output_dir
119
+ - token_list
120
+ resume: true
121
+ save_strategy: all
122
+ scheduler: noamlr
123
+ scheduler_conf:
124
+ model_size: 384
125
+ warmup_steps: 4000
126
+ seed: 0
127
+ sharded_ddp: false
128
+ shuffle_within_batch: false
129
+ sort_batch: descending
130
+ sort_in_batch: descending
131
+ token_list:
132
+ - <blank>
133
+ - <unk>
134
+ - <space>
135
+ - $
136
+ - ','
137
+ - .
138
+ - M
139
+ - q
140
+ - H
141
+ - k
142
+ - "\u0916"
143
+ - g
144
+ - "\u0918"
145
+ - "\u0919"
146
+ - c
147
+ - C
148
+ - j
149
+ - J
150
+ - "\u091E"
151
+ - "\u091F"
152
+ - "\u0920"
153
+ - "\u0921"
154
+ - "\u0922"
155
+ - "\u0923"
156
+ - t
157
+ - "\u0925"
158
+ - d
159
+ - "\u0927"
160
+ - n
161
+ - "\u0929"
162
+ - p
163
+ - P
164
+ - b
165
+ - B
166
+ - m
167
+ - y
168
+ - r
169
+ - "\u0931"
170
+ - l
171
+ - "\u0D33"
172
+ - Z
173
+ - w
174
+ - "\u0936"
175
+ - "\u0937"
176
+ - s
177
+ - h
178
+ - Y
179
+ - "\u093D"
180
+ - "\u0915"
181
+ - K
182
+ - G
183
+ - z
184
+ - D
185
+ - T
186
+ - f
187
+ - "\u0960"
188
+ - "\u0D7A"
189
+ - N
190
+ - "\u0D7C"
191
+ - "\u0D7D"
192
+ - "\u0D7E"
193
+ - a
194
+ - A
195
+ - i
196
+ - I
197
+ - u
198
+ - U
199
+ - R
200
+ - "\u090D"
201
+ - e
202
+ - E
203
+ - "\u0910"
204
+ - "\u0911"
205
+ - o
206
+ - O
207
+ - "\u0914"
208
+ - "\u0B89"
209
+ - <sos/eos>
210
+ token_type: char
211
+ train_data_path_and_name_and_type:
212
+ - - dump/raw/tr_no_dev/text
213
+ - text
214
+ - text
215
+ - - duration_info/tr_no_dev/durations
216
+ - durations
217
+ - text_int
218
+ - - dump/raw/tr_no_dev/wav.scp
219
+ - speech
220
+ - sound
221
+ - - exp/tts_stats_raw_char_None/train/collect_feats/pitch.scp
222
+ - pitch
223
+ - npy
224
+ - - exp/tts_stats_raw_char_None/train/collect_feats/energy.scp
225
+ - energy
226
+ - npy
227
+ train_dtype: float32
228
+ train_shape_file:
229
+ - exp/tts_stats_raw_char_None/train/text_shape.char
230
+ - exp/tts_stats_raw_char_None/train/speech_shape
231
+ tts: fastspeech2
232
+ tts_conf:
233
+ adim: 384
234
+ aheads: 2
235
+ decoder_normalize_before: true
236
+ dlayers: 4
237
+ dunits: 1536
238
+ duration_predictor_chans: 256
239
+ duration_predictor_kernel_size: 3
240
+ duration_predictor_layers: 2
241
+ elayers: 4
242
+ encoder_normalize_before: true
243
+ energy_embed_dropout: 0.0
244
+ energy_embed_kernel_size: 1
245
+ energy_predictor_chans: 256
246
+ energy_predictor_dropout: 0.5
247
+ energy_predictor_kernel_size: 3
248
+ energy_predictor_layers: 2
249
+ eunits: 1536
250
+ init_dec_alpha: 1.0
251
+ init_enc_alpha: 1.0
252
+ init_type: xavier_uniform
253
+ pitch_embed_dropout: 0.0
254
+ pitch_embed_kernel_size: 1
255
+ pitch_predictor_chans: 256
256
+ pitch_predictor_dropout: 0.5
257
+ pitch_predictor_kernel_size: 5
258
+ pitch_predictor_layers: 5
259
+ positionwise_conv_kernel_size: 3
260
+ positionwise_layer_type: conv1d
261
+ postnet_chans: 256
262
+ postnet_filts: 5
263
+ postnet_layers: 5
264
+ reduction_factor: 1
265
+ stop_gradient_from_energy_predictor: false
266
+ stop_gradient_from_pitch_predictor: true
267
+ transformer_dec_attn_dropout_rate: 0.2
268
+ transformer_dec_dropout_rate: 0.2
269
+ transformer_dec_positional_dropout_rate: 0.2
270
+ transformer_enc_attn_dropout_rate: 0.2
271
+ transformer_enc_dropout_rate: 0.2
272
+ transformer_enc_positional_dropout_rate: 0.2
273
+ use_masking: true
274
+ use_scaled_pos_enc: true
275
+ unused_parameters: false
276
+ use_adapter: false
277
+ use_amp: false
278
+ use_matplotlib: true
279
+ use_preprocessor: true
280
+ use_tensorboard: true
281
+ use_wandb: false
282
+ val_scheduler_criterion:
283
+ - valid
284
+ - loss
285
+ valid_batch_bins: null
286
+ valid_batch_size: null
287
+ valid_batch_type: null
288
+ valid_data_path_and_name_and_type:
289
+ - - dump/raw/dev/text
290
+ - text
291
+ - text
292
+ - - duration_info/dev/durations
293
+ - durations
294
+ - text_int
295
+ - - dump/raw/dev/wav.scp
296
+ - speech
297
+ - sound
298
+ - - exp/tts_stats_raw_char_None/valid/collect_feats/pitch.scp
299
+ - pitch
300
+ - npy
301
+ - - exp/tts_stats_raw_char_None/valid/collect_feats/energy.scp
302
+ - energy
303
+ - npy
304
+ valid_iterator_type: null
305
+ valid_max_cache_size: null
306
+ valid_shape_file:
307
+ - exp/tts_stats_raw_char_None/valid/text_shape.char
308
+ - exp/tts_stats_raw_char_None/valid/speech_shape
309
+ version: '202402'
310
+ wandb_entity: null
311
+ wandb_id: null
312
+ wandb_model_log_interval: -1
313
+ wandb_name: null
314
+ wandb_project: null
315
+ write_collected_feats: false
bengali_latest/male/model/energy_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e0ff72de15d28f934bf95054d8c82210dbfdbe9114780b92f536a4cfd908358
3
+ size 770
bengali_latest/male/model/feats_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e63bfa54c96d7998cc22e479118fb7be8a5a9a1fae9508c210fd3f00065e0945
3
+ size 2042
bengali_latest/male/model/model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e131b107524777db0ae4f2578856b9baba42c2ed944433c7d5a086c56f0973e8
3
+ size 152128410
bengali_latest/male/model/pitch_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:508206b876c66ec155e6473527155c24ed06d65f8a23963e5bec908a27be018f
3
+ size 770
bodo_latest/female/model/config.yaml ADDED
@@ -0,0 +1,319 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/tuning/train_fastspeech2.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ drop_last_iter: false
5
+ dry_run: false
6
+ iterator_type: sequence
7
+ valid_iterator_type: null
8
+ output_dir: exp/tts_train_fastspeech2_raw_char_None
9
+ ngpu: 1
10
+ seed: 0
11
+ num_workers: 1
12
+ num_att_plot: 3
13
+ dist_backend: nccl
14
+ dist_init_method: env://
15
+ dist_world_size: 2
16
+ dist_rank: 0
17
+ local_rank: 0
18
+ dist_master_addr: localhost
19
+ dist_master_port: 40847
20
+ dist_launcher: null
21
+ multiprocessing_distributed: true
22
+ unused_parameters: false
23
+ sharded_ddp: false
24
+ use_deepspeed: false
25
+ deepspeed_config: null
26
+ cudnn_enabled: true
27
+ cudnn_benchmark: false
28
+ cudnn_deterministic: true
29
+ use_tf32: false
30
+ collect_stats: false
31
+ write_collected_feats: false
32
+ max_epoch: 1000
33
+ patience: null
34
+ val_scheduler_criterion:
35
+ - valid
36
+ - loss
37
+ early_stopping_criterion:
38
+ - valid
39
+ - loss
40
+ - min
41
+ best_model_criterion:
42
+ - - valid
43
+ - loss
44
+ - min
45
+ - - train
46
+ - loss
47
+ - min
48
+ keep_nbest_models: 5
49
+ nbest_averaging_interval: 0
50
+ grad_clip: 1.0
51
+ grad_clip_type: 2.0
52
+ grad_noise: false
53
+ accum_grad: 8
54
+ no_forward_run: false
55
+ resume: true
56
+ train_dtype: float32
57
+ use_amp: false
58
+ log_interval: null
59
+ use_matplotlib: true
60
+ use_tensorboard: true
61
+ create_graph_in_tensorboard: false
62
+ use_wandb: false
63
+ wandb_project: null
64
+ wandb_id: null
65
+ wandb_entity: null
66
+ wandb_name: null
67
+ wandb_model_log_interval: -1
68
+ detect_anomaly: false
69
+ use_adapter: false
70
+ adapter: lora
71
+ save_strategy: all
72
+ adapter_conf: {}
73
+ pretrain_path: null
74
+ init_param: []
75
+ ignore_init_mismatch: false
76
+ freeze_param: []
77
+ num_iters_per_epoch: 800
78
+ batch_size: 20
79
+ valid_batch_size: null
80
+ batch_bins: 3000000
81
+ valid_batch_bins: null
82
+ train_shape_file:
83
+ - exp/tts_stats_raw_char_None/train/text_shape.char
84
+ - exp/tts_stats_raw_char_None/train/speech_shape
85
+ valid_shape_file:
86
+ - exp/tts_stats_raw_char_None/valid/text_shape.char
87
+ - exp/tts_stats_raw_char_None/valid/speech_shape
88
+ batch_type: numel
89
+ valid_batch_type: null
90
+ fold_length:
91
+ - 150
92
+ - 819200
93
+ sort_in_batch: descending
94
+ shuffle_within_batch: false
95
+ sort_batch: descending
96
+ multiple_iterator: false
97
+ chunk_length: 500
98
+ chunk_shift_ratio: 0.5
99
+ num_cache_chunks: 1024
100
+ chunk_excluded_key_prefixes: []
101
+ chunk_default_fs: null
102
+ chunk_max_abs_length: null
103
+ chunk_discard_short_samples: true
104
+ train_data_path_and_name_and_type:
105
+ - - dump/raw/tr_no_dev/text
106
+ - text
107
+ - text
108
+ - - duration_info/tr_no_dev/durations
109
+ - durations
110
+ - text_int
111
+ - - dump/raw/tr_no_dev/wav.scp
112
+ - speech
113
+ - sound
114
+ - - exp/tts_stats_raw_char_None/train/collect_feats/pitch.scp
115
+ - pitch
116
+ - npy
117
+ - - exp/tts_stats_raw_char_None/train/collect_feats/energy.scp
118
+ - energy
119
+ - npy
120
+ valid_data_path_and_name_and_type:
121
+ - - dump/raw/dev/text
122
+ - text
123
+ - text
124
+ - - duration_info/dev/durations
125
+ - durations
126
+ - text_int
127
+ - - dump/raw/dev/wav.scp
128
+ - speech
129
+ - sound
130
+ - - exp/tts_stats_raw_char_None/valid/collect_feats/pitch.scp
131
+ - pitch
132
+ - npy
133
+ - - exp/tts_stats_raw_char_None/valid/collect_feats/energy.scp
134
+ - energy
135
+ - npy
136
+ multi_task_dataset: false
137
+ allow_variable_data_keys: false
138
+ max_cache_size: 0.0
139
+ max_cache_fd: 32
140
+ allow_multi_rates: false
141
+ valid_max_cache_size: null
142
+ exclude_weight_decay: false
143
+ exclude_weight_decay_conf: {}
144
+ optim: adam
145
+ optim_conf:
146
+ lr: 1.0
147
+ scheduler: noamlr
148
+ scheduler_conf:
149
+ model_size: 384
150
+ warmup_steps: 4000
151
+ token_list:
152
+ - <blank>
153
+ - <unk>
154
+ - <space>
155
+ - $
156
+ - ','
157
+ - .
158
+ - M
159
+ - q
160
+ - H
161
+ - k
162
+ - ख
163
+ - g
164
+ - घ
165
+ - ङ
166
+ - c
167
+ - C
168
+ - j
169
+ - J
170
+ - ञ
171
+ - ट
172
+ - ठ
173
+ - ड
174
+ - ढ
175
+ - ण
176
+ - t
177
+ - थ
178
+ - d
179
+ - ध
180
+ - n
181
+ - ऩ
182
+ - p
183
+ - P
184
+ - b
185
+ - B
186
+ - m
187
+ - y
188
+ - r
189
+ - ऱ
190
+ - l
191
+ - ള
192
+ - Z
193
+ - w
194
+ - श
195
+ - ष
196
+ - s
197
+ - h
198
+ - Y
199
+ - ऽ
200
+ - क
201
+ - K
202
+ - G
203
+ - z
204
+ - D
205
+ - T
206
+ - f
207
+ - ॠ
208
+ - ൺ
209
+ - N
210
+ - ർ
211
+ - ൽ
212
+ - ൾ
213
+ - a
214
+ - A
215
+ - i
216
+ - I
217
+ - u
218
+ - U
219
+ - R
220
+ - ऍ
221
+ - e
222
+ - E
223
+ - ऐ
224
+ - ऑ
225
+ - o
226
+ - O
227
+ - औ
228
+ - உ
229
+ - <sos/eos>
230
+ odim: null
231
+ model_conf: {}
232
+ use_preprocessor: true
233
+ token_type: char
234
+ bpemodel: null
235
+ non_linguistic_symbols: null
236
+ cleaner: null
237
+ g2p: null
238
+ feats_extract: fbank
239
+ feats_extract_conf:
240
+ n_fft: 8192
241
+ hop_length: 1024
242
+ win_length: 4096
243
+ fs: 48000
244
+ fmin: 0
245
+ fmax: 24000
246
+ n_mels: 160
247
+ normalize: global_mvn
248
+ normalize_conf:
249
+ stats_file: exp/tts_stats_raw_char_None/train/feats_stats.npz
250
+ tts: fastspeech2
251
+ tts_conf:
252
+ adim: 384
253
+ aheads: 2
254
+ elayers: 4
255
+ eunits: 1536
256
+ dlayers: 4
257
+ dunits: 1536
258
+ positionwise_layer_type: conv1d
259
+ positionwise_conv_kernel_size: 3
260
+ duration_predictor_layers: 2
261
+ duration_predictor_chans: 256
262
+ duration_predictor_kernel_size: 3
263
+ postnet_layers: 5
264
+ postnet_filts: 5
265
+ postnet_chans: 256
266
+ use_masking: true
267
+ use_scaled_pos_enc: true
268
+ encoder_normalize_before: true
269
+ decoder_normalize_before: true
270
+ reduction_factor: 1
271
+ init_type: xavier_uniform
272
+ init_enc_alpha: 1.0
273
+ init_dec_alpha: 1.0
274
+ transformer_enc_dropout_rate: 0.2
275
+ transformer_enc_positional_dropout_rate: 0.2
276
+ transformer_enc_attn_dropout_rate: 0.2
277
+ transformer_dec_dropout_rate: 0.2
278
+ transformer_dec_positional_dropout_rate: 0.2
279
+ transformer_dec_attn_dropout_rate: 0.2
280
+ pitch_predictor_layers: 5
281
+ pitch_predictor_chans: 256
282
+ pitch_predictor_kernel_size: 5
283
+ pitch_predictor_dropout: 0.5
284
+ pitch_embed_kernel_size: 1
285
+ pitch_embed_dropout: 0.0
286
+ stop_gradient_from_pitch_predictor: true
287
+ energy_predictor_layers: 2
288
+ energy_predictor_chans: 256
289
+ energy_predictor_kernel_size: 3
290
+ energy_predictor_dropout: 0.5
291
+ energy_embed_kernel_size: 1
292
+ energy_embed_dropout: 0.0
293
+ stop_gradient_from_energy_predictor: false
294
+ pitch_extract: dio
295
+ pitch_extract_conf:
296
+ fs: 48000
297
+ n_fft: 8192
298
+ hop_length: 1024
299
+ f0max: 400
300
+ f0min: 80
301
+ reduction_factor: 1
302
+ pitch_normalize: global_mvn
303
+ pitch_normalize_conf:
304
+ stats_file: exp/tts_stats_raw_char_None/train/pitch_stats.npz
305
+ energy_extract: energy
306
+ energy_extract_conf:
307
+ fs: 48000
308
+ n_fft: 8192
309
+ hop_length: 1024
310
+ win_length: 4096
311
+ reduction_factor: 1
312
+ energy_normalize: global_mvn
313
+ energy_normalize_conf:
314
+ stats_file: exp/tts_stats_raw_char_None/train/energy_stats.npz
315
+ required:
316
+ - output_dir
317
+ - token_list
318
+ version: '202402'
319
+ distributed: true
bodo_latest/female/model/energy_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f146e38995c250d297602ef8ae9a86ca151b5dbd85bd2a0c6d6fc480958825c6
3
+ size 770
bodo_latest/female/model/feats_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ac92ccb722a0ed041407e19bddde97f055e37d1108c2927c573f912b281e9f6
3
+ size 2042
bodo_latest/female/model/feats_type ADDED
@@ -0,0 +1 @@
 
 
1
+ raw
bodo_latest/female/model/model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d7e1023281d3358bca078b2a218cddda8fc79aef7f0e3d47272331b8bf9645a
3
+ size 152129434
bodo_latest/female/model/pitch_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59051dd33e6f33a98737cbe4a5a220eb9af37c43d2b660f3d257f411f1128025
3
+ size 770
bodo_latest/male/model/config.yaml ADDED
@@ -0,0 +1,319 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/tuning/train_fastspeech2.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ drop_last_iter: false
5
+ dry_run: false
6
+ iterator_type: sequence
7
+ valid_iterator_type: null
8
+ output_dir: exp/tts_train_fastspeech2_raw_char_None
9
+ ngpu: 1
10
+ seed: 0
11
+ num_workers: 1
12
+ num_att_plot: 3
13
+ dist_backend: nccl
14
+ dist_init_method: env://
15
+ dist_world_size: 2
16
+ dist_rank: 0
17
+ local_rank: 0
18
+ dist_master_addr: localhost
19
+ dist_master_port: 53925
20
+ dist_launcher: null
21
+ multiprocessing_distributed: true
22
+ unused_parameters: false
23
+ sharded_ddp: false
24
+ use_deepspeed: false
25
+ deepspeed_config: null
26
+ cudnn_enabled: true
27
+ cudnn_benchmark: false
28
+ cudnn_deterministic: true
29
+ use_tf32: false
30
+ collect_stats: false
31
+ write_collected_feats: false
32
+ max_epoch: 1000
33
+ patience: null
34
+ val_scheduler_criterion:
35
+ - valid
36
+ - loss
37
+ early_stopping_criterion:
38
+ - valid
39
+ - loss
40
+ - min
41
+ best_model_criterion:
42
+ - - valid
43
+ - loss
44
+ - min
45
+ - - train
46
+ - loss
47
+ - min
48
+ keep_nbest_models: 5
49
+ nbest_averaging_interval: 0
50
+ grad_clip: 1.0
51
+ grad_clip_type: 2.0
52
+ grad_noise: false
53
+ accum_grad: 8
54
+ no_forward_run: false
55
+ resume: true
56
+ train_dtype: float32
57
+ use_amp: false
58
+ log_interval: null
59
+ use_matplotlib: true
60
+ use_tensorboard: true
61
+ create_graph_in_tensorboard: false
62
+ use_wandb: false
63
+ wandb_project: null
64
+ wandb_id: null
65
+ wandb_entity: null
66
+ wandb_name: null
67
+ wandb_model_log_interval: -1
68
+ detect_anomaly: false
69
+ use_adapter: false
70
+ adapter: lora
71
+ save_strategy: all
72
+ adapter_conf: {}
73
+ pretrain_path: null
74
+ init_param: []
75
+ ignore_init_mismatch: false
76
+ freeze_param: []
77
+ num_iters_per_epoch: 800
78
+ batch_size: 20
79
+ valid_batch_size: null
80
+ batch_bins: 3000000
81
+ valid_batch_bins: null
82
+ train_shape_file:
83
+ - exp/tts_stats_raw_char_None/train/text_shape.char
84
+ - exp/tts_stats_raw_char_None/train/speech_shape
85
+ valid_shape_file:
86
+ - exp/tts_stats_raw_char_None/valid/text_shape.char
87
+ - exp/tts_stats_raw_char_None/valid/speech_shape
88
+ batch_type: numel
89
+ valid_batch_type: null
90
+ fold_length:
91
+ - 150
92
+ - 819200
93
+ sort_in_batch: descending
94
+ shuffle_within_batch: false
95
+ sort_batch: descending
96
+ multiple_iterator: false
97
+ chunk_length: 500
98
+ chunk_shift_ratio: 0.5
99
+ num_cache_chunks: 1024
100
+ chunk_excluded_key_prefixes: []
101
+ chunk_default_fs: null
102
+ chunk_max_abs_length: null
103
+ chunk_discard_short_samples: true
104
+ train_data_path_and_name_and_type:
105
+ - - dump/raw/tr_no_dev/text
106
+ - text
107
+ - text
108
+ - - duration_info/tr_no_dev/durations
109
+ - durations
110
+ - text_int
111
+ - - dump/raw/tr_no_dev/wav.scp
112
+ - speech
113
+ - sound
114
+ - - exp/tts_stats_raw_char_None/train/collect_feats/pitch.scp
115
+ - pitch
116
+ - npy
117
+ - - exp/tts_stats_raw_char_None/train/collect_feats/energy.scp
118
+ - energy
119
+ - npy
120
+ valid_data_path_and_name_and_type:
121
+ - - dump/raw/dev/text
122
+ - text
123
+ - text
124
+ - - duration_info/dev/durations
125
+ - durations
126
+ - text_int
127
+ - - dump/raw/dev/wav.scp
128
+ - speech
129
+ - sound
130
+ - - exp/tts_stats_raw_char_None/valid/collect_feats/pitch.scp
131
+ - pitch
132
+ - npy
133
+ - - exp/tts_stats_raw_char_None/valid/collect_feats/energy.scp
134
+ - energy
135
+ - npy
136
+ multi_task_dataset: false
137
+ allow_variable_data_keys: false
138
+ max_cache_size: 0.0
139
+ max_cache_fd: 32
140
+ allow_multi_rates: false
141
+ valid_max_cache_size: null
142
+ exclude_weight_decay: false
143
+ exclude_weight_decay_conf: {}
144
+ optim: adam
145
+ optim_conf:
146
+ lr: 1.0
147
+ scheduler: noamlr
148
+ scheduler_conf:
149
+ model_size: 384
150
+ warmup_steps: 4000
151
+ token_list:
152
+ - <blank>
153
+ - <unk>
154
+ - <space>
155
+ - $
156
+ - ','
157
+ - .
158
+ - M
159
+ - q
160
+ - H
161
+ - k
162
+ - ख
163
+ - g
164
+ - घ
165
+ - ङ
166
+ - c
167
+ - C
168
+ - j
169
+ - J
170
+ - ञ
171
+ - ट
172
+ - ठ
173
+ - ड
174
+ - ढ
175
+ - ण
176
+ - t
177
+ - थ
178
+ - d
179
+ - ध
180
+ - n
181
+ - ऩ
182
+ - p
183
+ - P
184
+ - b
185
+ - B
186
+ - m
187
+ - y
188
+ - r
189
+ - ऱ
190
+ - l
191
+ - ള
192
+ - Z
193
+ - w
194
+ - श
195
+ - ष
196
+ - s
197
+ - h
198
+ - Y
199
+ - ऽ
200
+ - क
201
+ - K
202
+ - G
203
+ - z
204
+ - D
205
+ - T
206
+ - f
207
+ - ॠ
208
+ - ൺ
209
+ - N
210
+ - ർ
211
+ - ൽ
212
+ - ൾ
213
+ - a
214
+ - A
215
+ - i
216
+ - I
217
+ - u
218
+ - U
219
+ - R
220
+ - ऍ
221
+ - e
222
+ - E
223
+ - ऐ
224
+ - ऑ
225
+ - o
226
+ - O
227
+ - औ
228
+ - உ
229
+ - <sos/eos>
230
+ odim: null
231
+ model_conf: {}
232
+ use_preprocessor: true
233
+ token_type: char
234
+ bpemodel: null
235
+ non_linguistic_symbols: null
236
+ cleaner: null
237
+ g2p: null
238
+ feats_extract: fbank
239
+ feats_extract_conf:
240
+ n_fft: 8192
241
+ hop_length: 1024
242
+ win_length: 4096
243
+ fs: 48000
244
+ fmin: 0
245
+ fmax: 24000
246
+ n_mels: 160
247
+ normalize: global_mvn
248
+ normalize_conf:
249
+ stats_file: exp/tts_stats_raw_char_None/train/feats_stats.npz
250
+ tts: fastspeech2
251
+ tts_conf:
252
+ adim: 384
253
+ aheads: 2
254
+ elayers: 4
255
+ eunits: 1536
256
+ dlayers: 4
257
+ dunits: 1536
258
+ positionwise_layer_type: conv1d
259
+ positionwise_conv_kernel_size: 3
260
+ duration_predictor_layers: 2
261
+ duration_predictor_chans: 256
262
+ duration_predictor_kernel_size: 3
263
+ postnet_layers: 5
264
+ postnet_filts: 5
265
+ postnet_chans: 256
266
+ use_masking: true
267
+ use_scaled_pos_enc: true
268
+ encoder_normalize_before: true
269
+ decoder_normalize_before: true
270
+ reduction_factor: 1
271
+ init_type: xavier_uniform
272
+ init_enc_alpha: 1.0
273
+ init_dec_alpha: 1.0
274
+ transformer_enc_dropout_rate: 0.2
275
+ transformer_enc_positional_dropout_rate: 0.2
276
+ transformer_enc_attn_dropout_rate: 0.2
277
+ transformer_dec_dropout_rate: 0.2
278
+ transformer_dec_positional_dropout_rate: 0.2
279
+ transformer_dec_attn_dropout_rate: 0.2
280
+ pitch_predictor_layers: 5
281
+ pitch_predictor_chans: 256
282
+ pitch_predictor_kernel_size: 5
283
+ pitch_predictor_dropout: 0.5
284
+ pitch_embed_kernel_size: 1
285
+ pitch_embed_dropout: 0.0
286
+ stop_gradient_from_pitch_predictor: true
287
+ energy_predictor_layers: 2
288
+ energy_predictor_chans: 256
289
+ energy_predictor_kernel_size: 3
290
+ energy_predictor_dropout: 0.5
291
+ energy_embed_kernel_size: 1
292
+ energy_embed_dropout: 0.0
293
+ stop_gradient_from_energy_predictor: false
294
+ pitch_extract: dio
295
+ pitch_extract_conf:
296
+ fs: 48000
297
+ n_fft: 8192
298
+ hop_length: 1024
299
+ f0max: 350
300
+ f0min: 40
301
+ reduction_factor: 1
302
+ pitch_normalize: global_mvn
303
+ pitch_normalize_conf:
304
+ stats_file: exp/tts_stats_raw_char_None/train/pitch_stats.npz
305
+ energy_extract: energy
306
+ energy_extract_conf:
307
+ fs: 48000
308
+ n_fft: 8192
309
+ hop_length: 1024
310
+ win_length: 4096
311
+ reduction_factor: 1
312
+ energy_normalize: global_mvn
313
+ energy_normalize_conf:
314
+ stats_file: exp/tts_stats_raw_char_None/train/energy_stats.npz
315
+ required:
316
+ - output_dir
317
+ - token_list
318
+ version: '202402'
319
+ distributed: true
bodo_latest/male/model/energy_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2ccfd0ab92010376d6cecbf0d2d3e2e338ccb2cc1a4c44af9acd1f9bd569f9e
3
+ size 770
bodo_latest/male/model/feats_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0adb54c43f773f5c078a60c30cfba90f4b3cb02461ac3a4f9cbc638f91e2e82
3
+ size 2042
bodo_latest/male/model/feats_type ADDED
@@ -0,0 +1 @@
 
 
1
+ raw
bodo_latest/male/model/model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:742c513ae2866449704836faeeedb4c4e6c364a4e4d0f9ebc96f234efc084b8d
3
+ size 152129434
bodo_latest/male/model/pitch_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84a143913223f17d10f677a7b94e26ccf8d1251ff97d882fe65f33542a3d5722
3
+ size 770
charmap/Text_Cleaning.ipynb ADDED
@@ -0,0 +1,332 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cells": [
3
+ {
4
+ "cell_type": "code",
5
+ "execution_count": 2,
6
+ "metadata": {
7
+ "collapsed": true
8
+ },
9
+ "outputs": [],
10
+ "source": [
11
+ "############################################################\n",
12
+ "#Author : Bhagyashree\n",
13
+ "#Date : 1st Sept, 2020\n",
14
+ "#Purpose : Text Cleaning\n",
15
+ "#Input : Text file after timestamp removal\n",
16
+ "#Output : Text file after cleaning data\n",
17
+ "############################################################"
18
+ ]
19
+ },
20
+ {
21
+ "cell_type": "code",
22
+ "execution_count": 3,
23
+ "metadata": {
24
+ "collapsed": true
25
+ },
26
+ "outputs": [],
27
+ "source": [
28
+ "import nltk\n",
29
+ "import numpy\n",
30
+ "import xlrd\n",
31
+ "import openpyxl \n",
32
+ "import re"
33
+ ]
34
+ },
35
+ {
36
+ "cell_type": "code",
37
+ "execution_count": 21,
38
+ "metadata": {},
39
+ "outputs": [
40
+ {
41
+ "name": "stdout",
42
+ "output_type": "stream",
43
+ "text": [
44
+ "अब हम ऑलट्रेशन ऑफ मेमोरेंडम के बारे में बात करेंगे।\n",
45
+ " मेमोरेंडम के विषयों को बदल दिया जा सकता है।\n",
46
+ "कंपनी अधिनियम 1956 के तहत\n",
47
+ "निम्नलिखित प्रक्रिया के अनुसार\n",
48
+ "यदि कोई कंपनी अपना नाम बदलना चाहती है,\n",
49
+ "तो वे विशेष संकल्प में ऐसा कर सकती है।\n",
50
+ "और केंद्र सरकार की मंजूरी के साथ\n",
51
+ "लिखित में\n",
52
+ "हालाँकि, ऐसी किसी भी मंजूरी की आवश्यकता नहीं होती है\n",
53
+ "केवल कंपनी के नाम में परिवर्तन के लिए\n",
54
+ "बल्कि यह प्रक्रिया\n",
55
+ "पूरी तरह से निजी शब्द को हटाने के लिए होती है।\n",
56
+ "तो इस मामले में\n",
57
+ "एक सार्वजनिक कंपनी को एक निजी कंपनी के संबंध में,\n",
58
+ "या एक निजी कंपनी को एक सार्वजनिक कंपनी में परिवर्तित करने\n",
59
+ "दूसरी जगह पर पंजीकृत कार्यालय का दोबारा परिवर्तन किया जाना है\n",
60
+ "अगर एक ही शहर, कस्बे\n",
61
+ "या गाँव में एक जगह से\n",
62
+ "30 दिनों का नोटिस दिया जाना होता है।\n",
63
+ "यह रजिस्ट्रार द्वारा परिवर्तन की तिथि के बाद\n",
64
+ "होगा जो उसी को दर्ज करेगा।\n",
65
+ "पंजीकृत कार्यालय के परिवर्तन के मामले में\n",
66
+ "जबकि एक ही राज्य में 1 शहर से दूसरे शहर में,\n",
67
+ "विशेष प्रस्ताव पारित किया जाना आवश्यक है।\n",
68
+ "शेयरधारकों की आम बैठक में\n",
69
+ "और इसकी एक प्रति रजिस्ट्रार के पास कार्यालय को\n",
70
+ "30 दिनों के भीतर बदलने के दाखिल करनी होगी।\n",
71
+ "नोटिस देना होगा।\n",
72
+ "रजिस्ट्रार को कार्यालय के नये पते का\n",
73
+ "तब तक परिवर्तन प्रभावी नहीं होगा।\n",
74
+ "जब तक केंद्र सरकार द्वारा प्रस्ताव की पुष्टि नहीं हो जाती\n",
75
+ "कंपनी किसी भी आधार पर\n",
76
+ "उपधारा 1 से\n",
77
+ "उपधारा 7 में धारा 17 तक उल्लेखित है।\n",
78
+ "जैसा कि अधिनियम के बाद ही परिवर्तन प्रभावी होगा।\n",
79
+ "अपने उद्देश्यों में बदलाव कर सकती है\n",
80
+ "सामान्य बैठक में सदस्यों द्वारा\n",
81
+ "कंपनी संशोधन अधिनियम 1996 को मेमोरेंडम ऑफ एसोसिएशन के\n",
82
+ "केंद्र सरकार के प्रतिबंध के साथ समाप्त कर दिया गया है।\n",
83
+ "विशेष संकल्प के अनुरूप अनुमोदित किए जाने\n",
84
+ "ऑब्जेक्ट क्लॉज में परिवर्तन के प्रति शेयर पूंजी में\n",
85
+ "परिवर्तन की प्रक्रिया और ऐसे परिवर्तन करने के अधिकार।\n",
86
+ "समान्य पहलु को आर्टीकल ऑफ एसोसिएशन में रखा गया है।\n",
87
+ "यदि संबंधित विषय के\n",
88
+ " आर्टीकल ऑफ एसोसिएशन में पीछे की प्रक्रिया नहीं दी गई है।\n",
89
+ "कंपनी को पारित करके आर्टीकल ऑफ एसोसिएशन को बदलना होगा।\n",
90
+ "एक विशेष प्रस्ताव\n",
91
+ "अब, हम ऑलट्रेशन ऑफ पर चर्चा करेंगे।\n",
92
+ "कंपनी अधिनियम 2013 के तहत मेमोरेंडम\n",
93
+ "अधिनियम की धारा 16, 17, 18, 19,\n",
94
+ "1956 के कंपनी 21, 23 और 37 के अनुरूप।\n",
95
+ "कंपनी अधिनियम, 2013 की धारा 13 ने\n",
96
+ " ऑलट्रेशन ऑफ मेमोरेंडम के लिए मानदंड निर्धारित किए हैं।\n",
97
+ "यह वही वर्णन करता है कि जैसा कि धारा 61 में दिया गया है।\n",
98
+ "एक कंपनी विशेष संकल्प द्वारा\n",
99
+ "और प्रावधानों को बदल सकती है।\n",
100
+ "निर्दिष्ट प्रक्रिया के अनुपालन से मेमोरेंडम\n",
101
+ "नाम खंड के परिवर्तन के संबंध में,\n",
102
+ "कंपनी अपना नाम बदल सकती है।\n",
103
+ "अनुमोदन के बाद लिखित रूप में केंद्र सरकार द्वारा\n",
104
+ "इसलिए जब कंपनी के नाम में कोई बदलाव किया जाता है,\n",
105
+ "रजिस्टर में दर्ज करेगा।\n",
106
+ " तो रजिस्ट्रार कंपनी के नया नाम\n",
107
+ "पुराने नाम के स्थान पर\n",
108
+ "निगमन का एक नया प्रमाणपत्र जारी करेगा।\n",
109
+ "कंपनी के पंजीकृत कार्यालय के बारे में\n",
110
+ "जैसा कि पहले उल्लेख किया गया है,\n",
111
+ "तब तक कोई प्रभाव नहीं पड़ेगा जब तक कि वह केंद्र सरकार द्वारा अनुमोदित नहीं हो जाता।\n",
112
+ "ऑब्जेक्ट क्लॉज के किसी भी परिवर्तन के संबंध में,\n",
113
+ "किसी कंपनी के मेमोरेंडम के\n",
114
+ "रजिस्ट्रार को दाखिल करने की\n",
115
+ "30 दिनों की अवधि के भीतर\n",
116
+ "तारीख से पंजीकरण को प्रमाणित करना होता है।\n",
117
+ "इस विशेष प्रस्ताव खंड के उप खंड 6 के खंड A के अनुसार\n",
118
+ "चलिए फिर से संक्षेप में\n",
119
+ " ऑलट्रेशन ऑफ मेमोरेंडम के महत्व के बारे में चर्चा करते हैं\n",
120
+ " क्योंकि ये इस मॉड्यूल के अध्ययन का एक बहुत महत्वपूर्ण हिस्सा है।\n",
121
+ "पहला महत्व यह है\n",
122
+ "कि यह एक बहुत ही आवश्यक दस्तावेज है।\n",
123
+ "एक कंपनी के निगमन के लिए\n",
124
+ "दूसरा, यह कंपनी के पंजीकृत कार्यालय को निर्दिष्ट करते हुए\n",
125
+ "रजिस्ट्रार और अदालत के अधिकार क्षेत्र को निर्धारित करता है।\n",
126
+ "तीसरा, यह कंपनी के अधिकारों में उद्देश्यों को\n",
127
+ "जनता की जानकारी के लिए दर्ज करता है।\n",
128
+ "अगला, यह कंपनी को केवल उन कृत्यों को करने के लिए\n",
129
+ "बाध्य करता है जो कंपनी के ऑब्जेक्ट क्लॉज में शामिल हैं।\n",
130
+ "यह कंपनी की अधिकृत कैपिटल\n",
131
+ "और उसके विभाजन को निश्चित राशि के शेयरों में निर्दिष्ट करता है।\n",
132
+ "पर प्रकाश डालता है।\n",
133
+ "यह कंपनी के सदस्यों के लायबिलिटी\n",
134
+ "अंत में, संघ के नियमों को\n",
135
+ "यह एक कंपनी के भी नियंत्रित करता है।\n"
136
+ ]
137
+ }
138
+ ],
139
+ "source": [
140
+ "file1 = open(\"recent_deliverables_dec2020/Corporate_Law/Hindi/ankita objects 02_Hindi_new.txt\",\"r+\",encoding='utf-8') \n",
141
+ "data = file1.read()\n",
142
+ "print(data)\n",
143
+ "file1.close()"
144
+ ]
145
+ },
146
+ {
147
+ "cell_type": "code",
148
+ "execution_count": 22,
149
+ "metadata": {},
150
+ "outputs": [
151
+ {
152
+ "name": "stdout",
153
+ "output_type": "stream",
154
+ "text": [
155
+ "अब हम ऑलट्रेशन ऑफ मेमोरेंडम के बारे में बात करेंगे\n",
156
+ " मेमोरेंडम के विषयों को बदल दिया जा सकता है\n",
157
+ "कंपनी अधिनियम वन नाइन फाइव सिक्स के तहत\n",
158
+ "निम्नलिखित प्रक्रिया के अनुसार\n",
159
+ "यदि कोई कंपनी अपना नाम बदलना चाहती है\n",
160
+ "तो वे विशेष संकल्प में ऐसा कर सकती है\n",
161
+ "और केंद्र सरकार की मंजूरी के साथ\n",
162
+ "लिखित में\n",
163
+ "हालाँकि ऐसी किसी भी मंजूरी की आवश्यकता नहीं होती है\n",
164
+ "केवल कंपनी के नाम में परिवर्तन के लिए\n",
165
+ "बल्कि यह प्रक्रिया\n",
166
+ "पूरी तरह से निजी शब्द को हटाने के लिए होती है\n",
167
+ "तो इस मामले में\n",
168
+ "एक सार्वजनिक कंपनी को एक निजी कंपनी के संबंध में\n",
169
+ "या एक निजी कंपनी को एक सार्वजनिक कंपनी में परिवर्तित करने\n",
170
+ "दूसरी जगह पर पंजीकृत कार्यालय का दोबारा परिवर्तन किया जाना है\n",
171
+ "अगर एक ही शहर कस्बे\n",
172
+ "या गाँव में एक जगह से\n",
173
+ " थ्री ज़ीरो दिनों का नोटिस दिया जाना होता है\n",
174
+ "यह रजिस्ट्रार द्वारा परिवर्तन की तिथि के बाद\n",
175
+ "होगा जो उसी को दर्ज करेगा\n",
176
+ "पंजीकृत कार्यालय के परिवर्तन के मामले में\n",
177
+ "जबकि एक ही राज्य में वन शहर से दूसरे शहर में\n",
178
+ "विशेष प्रस्ताव पारित किया जाना आवश्यक है\n",
179
+ "शेयरधारकों की आम बैठक में\n",
180
+ "और इसकी एक प्रति रजिस्ट्रार के पास कार्यालय को\n",
181
+ " थ्री ज़ीरो दिनों के भीतर बदलने के दाखिल करनी होगी\n",
182
+ "नोटिस देना होगा\n",
183
+ "रजिस्ट्रार को कार्यालय के नये पते का\n",
184
+ "तब तक परिवर्तन प्रभावी नहीं होगा\n",
185
+ "जब तक केंद्र सरकार द्वारा प्रस्ताव की पुष्टि नहीं हो जा���ी\n",
186
+ "कंपनी किसी भी आधार पर\n",
187
+ "उपधारा वन से\n",
188
+ "उपधारा सेवेन में धारा वन सेवेन तक उल्लेखित है\n",
189
+ "जैसा कि अधिनियम के बाद ही परिवर्तन प्रभावी होगा\n",
190
+ "अपने उद्देश्यों में बदलाव कर सकती है\n",
191
+ "सामान्य बैठक में सदस्यों द्वारा\n",
192
+ "कंपनी संशोधन अधिनियम वन नाइन नाइन सिक्स को मेमोरेंडम ऑफ एसोसिएशन के\n",
193
+ "केंद्र सरकार के प्रतिबंध के साथ समाप्त कर दिया गया है\n",
194
+ "विशेष संकल्प के अनुरूप अनुमोदित किए जाने\n",
195
+ "ऑब्जेक्ट क्लॉज में परिवर्तन के प्रति शेयर पूंजी में\n",
196
+ "परिवर्तन की प्रक्रिया और ऐसे परिवर्तन करने के अधिकार\n",
197
+ "समान्य पहलु को आर्टीकल ऑफ एसोसिएशन में रखा गया है\n",
198
+ "यदि संबंधित विषय के\n",
199
+ " आर्टीकल ऑफ एसोसिएशन में पीछे की प्रक्रिया नहीं दी गई है\n",
200
+ "कंपनी को पारित करके आर्टीकल ऑफ एसोसिएशन को बदलना होगा\n",
201
+ "एक विशेष प्रस्ताव\n",
202
+ "अब हम ऑलट्रेशन ऑफ पर चर्चा करेंगे\n",
203
+ "कंपनी अधिनियम टू ज़ीरो वन थ्री के तहत मेमोरेंडम\n",
204
+ "अधिनियम की धारा वन सिक्स वन सेवेन वन ऐइट वन नाइन \n",
205
+ " वन नाइन फाइव सिक्स के कंपनी टू वन टू थ्री और थ्री सेवेन के अनुरूप\n",
206
+ "कंपनी अधिनियम टू ज़ीरो वन थ्री की धारा वन थ्री ने\n",
207
+ " ऑलट्रेशन ऑफ मेमोरेंडम के लिए मानदंड निर्धारित किए हैं\n",
208
+ "यह वही वर्णन करता है कि जैसा कि धारा सिक्स वन में दिया गया है\n",
209
+ "एक कंपनी विशेष संकल्प द्वारा\n",
210
+ "और प्रावधानों को बदल सकती है\n",
211
+ "निर्दिष्ट प्रक्रिया के अनुपालन से मेमोरेंडम\n",
212
+ "नाम खंड के परिवर्तन के संबंध में\n",
213
+ "कंपनी अपना नाम बदल सकती है\n",
214
+ "अनुमोदन के बाद लिखित रूप में केंद्र सरकार द्वारा\n",
215
+ "इसलिए जब कंपनी के नाम में कोई बदलाव किया जाता है\n",
216
+ "रजिस्टर में दर्ज करेगा\n",
217
+ " तो रजिस्ट्रार कंपनी के नया नाम\n",
218
+ "पुराने नाम के स्थान पर\n",
219
+ "निगमन का एक नया प्रमाणपत्र जारी करेगा\n",
220
+ "कंपनी के पंजीकृत कार्यालय के बारे में\n",
221
+ "जैसा कि पहले उल्लेख किया गया है\n",
222
+ "तब तक कोई प्रभाव नहीं पड़ेगा जब तक कि वह केंद्र सरकार द्वारा अनुमोदित नहीं हो जाता\n",
223
+ "ऑब्जेक्ट क्लॉज के किसी भी परिवर्तन के संबंध में\n",
224
+ "किसी कंपनी के मेमोरेंडम के\n",
225
+ "रजिस्ट्रार को दाखिल करने की\n",
226
+ " थ्री ज़ीरो दिनों की अवधि के भीतर\n",
227
+ "तारीख से पंजीकरण को प्रमाणित करना होता है\n",
228
+ "इस विशेष प्रस्ताव खंड के उप खंड सिक्स के खंड ए के अनुसार\n",
229
+ "चलिए फिर से संक्षेप में\n",
230
+ " ऑलट्रेशन ऑफ मेमोरेंडम के महत्व के बारे में चर्चा करते हैं\n",
231
+ " क्योंकि ये इस मॉड्यूल के अध्ययन का एक बहुत महत्वपूर्ण हिस्सा है\n",
232
+ "पहला महत्व यह है\n",
233
+ "कि यह एक बहुत ही आवश्यक दस्तावेज है\n",
234
+ "एक कंपनी के निगमन के लिए\n",
235
+ "दूसरा यह कंपनी के पंजीकृत कार्यालय को निर्दिष्ट करते हुए\n",
236
+ "रजिस्ट्रार और अदालत के अधिकार क्षेत्र को निर्धारित करता है\n",
237
+ "तीसरा यह कंपनी के अधिकारों में उद्देश्यों को\n",
238
+ "जनता की जानकारी के लिए दर्ज करता है\n",
239
+ "अगला यह कंपनी को केवल उन कृत्यों को करने के लिए\n",
240
+ "बाध्य करता है जो कंपनी के ऑब्जेक्ट क्लॉज में शामिल हैं\n",
241
+ "यह कंपनी की अधिकृत कैपिटल\n",
242
+ "और उसके विभाजन को निश्चित राशि के शेयरों में निर्दिष्ट करता है\n",
243
+ "पर प्रकाश डालता है\n",
244
+ "यह कंपनी के सदस्यों के लायबिलिटी\n",
245
+ "अंत में संघ के नियमों को\n",
246
+ "यह एक कंपनी के भी नियंत्रित करता है\n"
247
+ ]
248
+ }
249
+ ],
250
+ "source": [
251
+ "\n",
252
+ "wb_obj = openpyxl.load_workbook(\"charmap_v2_new.xlsx\") \n",
253
+ "sheet_obj = wb_obj.active \n",
254
+ "\n",
255
+ "#data = re.sub('[A-Z]*', '',data)\n",
256
+ "#print(data)\n",
257
+ "data = data.replace('?','')\n",
258
+ "data = data.replace(' ',' ')\n",
259
+ "data = data.replace(';','')\n",
260
+ "data = data.replace(')','')\n",
261
+ "data = data.replace('(','')\n",
262
+ "data = data.replace('!','')\n",
263
+ "data = data.replace(' – ',' ')\n",
264
+ "data = data.replace('-',' ')\n",
265
+ "data = data.replace('।','')\n",
266
+ "data = data.replace('&','')\n",
267
+ "data = data.replace('’','')\n",
268
+ "data = data.replace('‘','')\n",
269
+ "data = data.replace(':','')\n",
270
+ "data = data.replace(',','')\n",
271
+ "data = data.replace('/','')\n",
272
+ "data = data.replace(',','')\n",
273
+ "data = data.replace('.','')\n",
274
+ "data = data.replace('|','')\n",
275
+ "m_row = sheet_obj.max_row \n",
276
+ "line = data\n",
277
+ "\n",
278
+ "for i in range(1,m_row+1):\n",
279
+ " num = sheet_obj.cell(row = i, column = 1).value \n",
280
+ " word = sheet_obj.cell(row = i, column = 2).value\n",
281
+ " #print(num)\n",
282
+ " #print(word)\n",
283
+ " line = line.replace(str(num), word)\n",
284
+ "#print(line)\n",
285
+ "#' '.join(line.split())\n",
286
+ "print(line) \n",
287
+ "file1 = open(\"recent_deliverables_dec2020/Corporate_Law/Hindi/ankita objects 02_Hindi.txt\",\"w+\",encoding='utf-8') \n",
288
+ "file1.write(line)\n",
289
+ "file1.close()"
290
+ ]
291
+ },
292
+ {
293
+ "cell_type": "code",
294
+ "execution_count": null,
295
+ "metadata": {
296
+ "collapsed": true
297
+ },
298
+ "outputs": [],
299
+ "source": []
300
+ },
301
+ {
302
+ "cell_type": "code",
303
+ "execution_count": null,
304
+ "metadata": {
305
+ "collapsed": true
306
+ },
307
+ "outputs": [],
308
+ "source": []
309
+ }
310
+ ],
311
+ "metadata": {
312
+ "kernelspec": {
313
+ "display_name": "Python 3",
314
+ "language": "python",
315
+ "name": "python3"
316
+ },
317
+ "language_info": {
318
+ "codemirror_mode": {
319
+ "name": "ipython",
320
+ "version": 3
321
+ },
322
+ "file_extension": ".py",
323
+ "mimetype": "text/x-python",
324
+ "name": "python",
325
+ "nbconvert_exporter": "python",
326
+ "pygments_lexer": "ipython3",
327
+ "version": "3.6.3"
328
+ }
329
+ },
330
+ "nbformat": 4,
331
+ "nbformat_minor": 2
332
+ }
charmap/Text_Cleaning.py ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python
2
+ # coding: utf-8
3
+
4
+ # In[2]:
5
+
6
+
7
+ ############################################################
8
+ #Author : Bhagyashree
9
+ #Date : 1st Sept, 2020
10
+ #Purpose : Text Cleaning
11
+ #Input : Text file after timestamp removal
12
+ #Output : Text file after cleaning data
13
+ ############################################################
14
+
15
+
16
+ # In[3]:
17
+
18
+
19
+ import nltk
20
+ import numpy
21
+ import xlrd
22
+ import openpyxl
23
+ import re
24
+ import sys
25
+
26
+ # In[21]:
27
+
28
# Ordered (old, new) substitutions applied to the raw transcript text.
# Order matters: the spaced en dash must be collapsed before any later rule
# runs, and every rule is applied to the output of the previous one.
PUNCTUATION_RULES = (
    ('?', ''),
    # NOTE(review): as written this maps a single space to a single space,
    # i.e. a no-op. Presumably the first argument was a double or
    # non-breaking space in the author's editor -- confirm before changing.
    (' ', ' '),
    (';', ''),
    (')', ''),
    ('(', ''),
    ('!', ''),
    (' – ', ' '),
    ('-', ' '),
    ('।', ''),
    ('&', ''),
    ('’', ''),
    ('‘', ''),
    (':', ''),
    (',', ''),
    ('/', ''),
    ('.', ''),
    ('|', ''),
)


def clean_punctuation(text):
    """Return *text* with the punctuation listed in PUNCTUATION_RULES removed.

    Each rule is a plain ``str.replace`` applied in sequence, so the result
    is identical to the original chain of ``data.replace(...)`` calls.
    """
    for old, new in PUNCTUATION_RULES:
        text = text.replace(old, new)
    return text


def apply_charmap(text, pairs):
    """Replace every charmap symbol found in *text* with its spoken form.

    *pairs* is an iterable of ``(symbol, spoken)`` tuples in charmap order.
    Rows where either value is ``None`` (blank spreadsheet rows) are skipped:
    the old code turned them into ``str(None)`` / ``None`` and crashed with
    ``TypeError`` inside ``str.replace``.
    """
    for symbol, spoken in pairs:
        if symbol is None or spoken is None:
            continue
        # Cells may hold numbers (e.g. the digit rows), so coerce both sides.
        text = text.replace(str(symbol), str(spoken))
    return text


def load_charmap(xlsx_path):
    """Read (column 1, column 2) pairs from the active sheet of *xlsx_path*."""
    sheet = openpyxl.load_workbook(xlsx_path).active
    return [
        (
            sheet.cell(row=row, column=1).value,
            sheet.cell(row=row, column=2).value,
        )
        for row in range(1, sheet.max_row + 1)
    ]


def main(argv=None):
    """Clean a transcript: ``Text_Cleaning.py INPUT.txt CHARMAP.xlsx OUTPUT.txt``.

    Reads INPUT as UTF-8, strips punctuation, expands digits/letters/symbols
    through the charmap workbook, and writes the result to OUTPUT as UTF-8.
    """
    args = sys.argv if argv is None else argv
    if len(args) < 4:
        sys.exit("usage: Text_Cleaning.py INPUT.txt CHARMAP.xlsx OUTPUT.txt")
    input_path, charmap_path, output_path = args[1], args[2], args[3]

    # Read-only access is enough for the input; "r+" needlessly required
    # write permission on the source transcript.
    with open(input_path, "r", encoding='utf-8') as source:
        data = source.read()

    line = apply_charmap(clean_punctuation(data), load_charmap(charmap_path))

    with open(output_path, "w", encoding='utf-8') as target:
        target.write(line)


if __name__ == "__main__":
    main()
76
+
charmap/charmap_Bengali.txt ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 0 জিরো
2
+ 1 ওয়ান
3
+ 2 টু
4
+ 3 থ্রী
5
+ 4 ফোর
6
+ 5 ফাইভ
7
+ 6 সিক্স
8
+ 7 সেবন
9
+ 8 এইট
10
+ 9 নাইন
11
+ A এ
12
+ a এ
13
+ B বী
14
+ b বী
15
+ C সী
16
+ c সী
17
+ D ডি
18
+ d ডি
19
+ E ই
20
+ e ই
21
+ F এফ
22
+ f এফ
23
+ G জি
24
+ g জি
25
+ H এছ
26
+ h এছ
27
+ I আই
28
+ i আই
29
+ J জে
30
+ j জে
31
+ K কে
32
+ k কে
33
+ L এল
34
+ l এল
35
+ M এম
36
+ m এম
37
+ N এন
38
+ n এন
39
+ O ও
40
+ o ও
41
+ P পি
42
+ p পি
43
+ Q ক্যু
44
+ q ক্যু
45
+ R আর
46
+ r আর
47
+ S এস
48
+ s এস
49
+ T টি
50
+ t টি
51
+ U ইউ
52
+ u ইউ
53
+ V ভি
54
+ v ভি
55
+ W ডাবলু
56
+ w ডাবলু
57
+ X এক্স
58
+ x এক্স
59
+ Y উহাই
60
+ y উহাই
61
+ Z জেডঃ
62
+ z জেডঃ
charmap/charmap_Hindi.txt ADDED
@@ -0,0 +1,81 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 0 ज़ीरो
2
+ 1 वन
3
+ 2 टू
4
+ 3 थ्री
5
+ 4 फोर
6
+ 5 फाइव
7
+ 6 सिक्स
8
+ 7 सेवेन
9
+ 8 ऐइट
10
+ 9 नाइन
11
+ ० ज़ीरो
12
+ १ वन
13
+ २ टू
14
+ ३ थ्री
15
+ ४ फोर
16
+ ५ फाइव
17
+ ६ सिक्स
18
+ ७ सेवेन
19
+ ८ ऐइट
20
+ ९ नाइन
21
+ A ए
22
+ a ए
23
+ B बी
24
+ b बी
25
+ C सी
26
+ c सी
27
+ D डी
28
+ d डी
29
+ E इ
30
+ e इ
31
+ F एफ
32
+ f एफ
33
+ G जी
34
+ g जी
35
+ H एच
36
+ h एच
37
+ I आई
38
+ i आई
39
+ J जे
40
+ j जे
41
+ K के
42
+ k के
43
+ L एल
44
+ l एल
45
+ M एम
46
+ m एम
47
+ N एन
48
+ n एन
49
+ O ओ
50
+ o ओ
51
+ P पी
52
+ p पी
53
+ Q क्यू
54
+ q क्यू
55
+ R आर
56
+ r आर
57
+ S एस
58
+ s एस
59
+ T टी
60
+ t टी
61
+ U यू
62
+ u यू
63
+ V वी
64
+ v वी
65
+ W डबलु
66
+ w डबलु
67
+ X एक्स
68
+ x एक्स
69
+ Y व्हाई
70
+ y व्हाई
71
+ Z ज़ेड
72
+ z ज़ेड
73
+ α अल्फा
74
+ φ फ़ाई
75
+ + प्लस
76
+ = इक्वल
77
+ λ लैम्ब्डा
78
+ ∅ नॉट
79
+ ϕ फ़ाई
80
+ 𝝅 पाई
81
+ ⇒ इम्प्लइज
charmap/charmap_Hindi.xlsx ADDED
Binary file (10.8 kB). View file
 
charmap/charmap_Malayalam.txt ADDED
@@ -0,0 +1,81 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 0 സീറോ
2
+ 1 വൺ
3
+ 2 ടു
4
+ 3 ത്രീ
5
+ 4 ഫോർ
6
+ 5 ഫൈവ്
7
+ 6 സിക്സ്
8
+ 7 സെവൻ
9
+ 8 എയ്റ്റ്
10
+ 9 നൈൻ
11
+ 0 സീറോ
12
+ 1 വൺ
13
+ 2 ടു
14
+ 3 ത്രീ
15
+ 4 ഫോർ
16
+ 5 ഫൈവ്
17
+ 6 സിക്സ്
18
+ 7 സെവൻ
19
+ 8 എയ്റ്റ്
20
+ 9 നൈൻ
21
+ A എ
22
+ a എ
23
+ B ബി
24
+ b ബി
25
+ C സി
26
+ c സി
27
+ D ഡി
28
+ d ഡി
29
+ E ഇ
30
+ e ഇ
31
+ F എഫ്
32
+ f എഫ്
33
+ G ജി
34
+ g ജി
35
+ H എഛ്
36
+ h എഛ്
37
+ I ഐ
38
+ i ഐ
39
+ J ജെ
40
+ j ജെ
41
+ K കെ
42
+ k കെ
43
+ L എൽ
44
+ l എൽ
45
+ M എം
46
+ m എം
47
+ N എൻ
48
+ n എൻ
49
+ O ഒ
50
+ o ഒ
51
+ P പി
52
+ p പി
53
+ Q ക്യു
54
+ q ക്യു
55
+ R ആർ
56
+ r ആർ
57
+ S എസ്
58
+ s എസ്
59
+ T ടി
60
+ t ടി
61
+ U യു
62
+ u യു
63
+ V വി
64
+ v വി
65
+ W ഡബ്ല്യൂ
66
+ w ഡബ്ല്യൂ
67
+ X എക്സ്
68
+ x എക്സ്
69
+ Y വൈ
70
+ y വൈ
71
+ Z സെഡ്
72
+ z സെഡ്
73
+ α ആൽഫ
74
+ φ ഫി
75
+ + പ്ലസ്
76
+ = ഈക്വൽ
77
+ λ ലാംബ്ടാ
78
+ ∅ നോട്ട്
79
+ ϕ സൈ
80
+ 𝝅 പൈ
81
+ ⇒ ഇമ്പ്ലെയ്സ്
charmap/charmap_Malayalam.xlsx ADDED
Binary file (13.1 kB). View file
 
charmap/charmap_Marathi.txt ADDED
@@ -0,0 +1,81 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 0 ज़ीरो
2
+ 1 वन
3
+ 2 टू
4
+ 3 थ्री
5
+ 4 फोर
6
+ 5 फाइव
7
+ 6 सिक्स
8
+ 7 सेवेन
9
+ 8 ऐइट
10
+ 9 नाइन
11
+ ० ज़ीरो
12
+ १ वन
13
+ २ टू
14
+ ३ थ्री
15
+ ४ फोर
16
+ ५ फाइव
17
+ ६ सिक्स
18
+ ७ सेवेन
19
+ ८ ऐइट
20
+ ९ नाइन
21
+ A ए
22
+ a ए
23
+ B बी
24
+ b बी
25
+ C सी
26
+ c सी
27
+ D डी
28
+ d डी
29
+ E इ
30
+ e इ
31
+ F एफ
32
+ f एफ
33
+ G जी
34
+ g जी
35
+ H एच
36
+ h एच
37
+ I आई
38
+ i आई
39
+ J जे
40
+ j जे
41
+ K के
42
+ k के
43
+ L एल
44
+ l एल
45
+ M एम
46
+ m एम
47
+ N एन
48
+ n एन
49
+ O ओ
50
+ o ओ
51
+ P पी
52
+ p पी
53
+ Q क्यू
54
+ q क्यू
55
+ R आर
56
+ r आर
57
+ S एस
58
+ s एस
59
+ T टी
60
+ t टी
61
+ U यू
62
+ u यू
63
+ V वी
64
+ v वी
65
+ W डबलु
66
+ w डबलु
67
+ X एक्स
68
+ x एक्स
69
+ Y व्हाई
70
+ y व्हाई
71
+ Z ज़ेड
72
+ z ज़ेड
73
+ α अल्फा
74
+ φ फ़ाई
75
+ + प्लस
76
+ = इक्वल
77
+ λ लैम्ब्डा
78
+ ∅ नॉट
79
+ ϕ फ़ाई
80
+ 𝝅 पाई
81
+ ⇒ इम्प्लइज
charmap/charmap_Marathi.xlsx ADDED
Binary file (10.8 kB). View file
 
charmap/charmap_Tamil.disabled ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 0 ஸிரோ
2
+ 1 ஒன்னு
3
+ 2 டூ
4
+ 3 த்ரீ
5
+ 4 போர்
6
+ 5 பைவ்
7
+ 6 சீஸ்
8
+ 7 செவென்
9
+ 8 எயிட்
10
+ 9 நயன்
11
+ A எ
12
+ a எ
13
+ B பி
14
+ b பி
15
+ C சி
16
+ c சி
17
+ D டி
18
+ d டி
19
+ E இ
20
+ e இ
21
+ F எப்
22
+ f எப்
23
+ G ஜி
24
+ g ஜி
25
+ H ஹ்
26
+ h ஹ்
27
+ I ஐ
28
+ i ஐ
29
+ J ஜே
30
+ j ஜே
31
+ K கே
32
+ k கே
33
+ L ல்
34
+ l ல்
35
+ M ம்
36
+ m ம்
37
+ N ன்
38
+ n ன்
39
+ O ஓ
40
+ o ஓ
41
+ P பி
42
+ p பி
43
+ Q கியூ
44
+ q கியூ
45
+ R ர்
46
+ r ர்
47
+ S ஸ்
48
+ s ஸ்
49
+ T டீ
50
+ t டீ
51
+ U யூ
52
+ u யூ
53
+ V வி
54
+ v வி
55
+ W டௌபிள்யூ
56
+ w டௌபிள்யூ
57
+ X எஸ்
58
+ x எஸ்
59
+ Y யை
60
+ y யை
61
+ Z செட்
62
+ z செட்
63
+ α ஆல்பா
64
+ φ பிய்
65
+ + பிளஸ்
66
+ = ஏகுவாள்
67
+ λ லாம்டா
68
+ ∅ நோட்
69
+ ϕ பிய்
70
+ 𝝅 பை
71
+ ⇒ இம்ப்ளிஸ்
72
+ . பாயிண்ட்
73
+ % பெர்ஸண்டாஜ்
74
+ °C டிகிரிசெல்சியஸ்
75
+ θ தீட்டா
76
+ * இண்டூ
charmap/charmap_Tamil.xlsx ADDED
Binary file (11.1 kB). View file
 
charmap/charmap_Telugu.txt ADDED
@@ -0,0 +1,81 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 0 జీరొ
2
+ 1 వన్
3
+ 2 టు
4
+ 3 త్రీ
5
+ 4 ఫోర్
6
+ 5 ఫైవ్
7
+ 6 సిక్స్
8
+ 7 సెవెన్
9
+ 8 ఎఇట్
10
+ 9 నైన్
11
+ ० జీరొ
12
+ १ వన్
13
+ २ టు
14
+ ३ త్రీ
15
+ ४ ఫోర్
16
+ ५ ఫైవ్
17
+ ६ సిక్స్
18
+ ७ సెవెన్
19
+ ८ ఎఇట్
20
+ ९ నైన్
21
+ A ఎ
22
+ a ఎ
23
+ B బి
24
+ b బి
25
+ C సి
26
+ c సి
27
+ D డి
28
+ d డి
29
+ E ఇ
30
+ e ఇ
31
+ F ఎఫ్
32
+ f ఎఫ్
33
+ G జి
34
+ g జి
35
+ H హెచ్
36
+ h హెచ్
37
+ I ఐ
38
+ i ఐ
39
+ J జె
40
+ j జె
41
+ K కె
42
+ k కె
43
+ L ఎల్
44
+ l ఎల్
45
+ M ఎమ్
46
+ m ఎమ్
47
+ N ఎన్
48
+ n ఎన్
49
+ O ఒ
50
+ o ఒ
51
+ P పి
52
+ p పి
53
+ Q క్యు
54
+ q క్యు
55
+ R ఆర్
56
+ r ఆర్
57
+ S ఎస్
58
+ s ఎస్
59
+ T టి
60
+ t టి
61
+ U యు
62
+ u యు
63
+ V వి
64
+ v వి
65
+ W డబ్లు
66
+ w డబ్లు
67
+ X ఎక్స్
68
+ x ఎక్స్
69
+ Y వై
70
+ y వై
71
+ Z జెడ్
72
+ z జెడ్
73
+ α ఆల్ఫ
74
+ φ ఫై
75
+ + ప్లస్
76
+ = ఈక్వల్
77
+ λ లామ్బ్డ
78
+ ∅ నల్
79
+ ϕ ఫై
80
+ 𝝅 పై
81
+ ⇒ ఇమ్ప్లైస్
charmap/charmap_Telugu.xlsx ADDED
Binary file (10 kB). View file
 
dogri_latest/female/model/config.yaml ADDED
@@ -0,0 +1,320 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ accum_grad: 8
2
+ adapter: lora
3
+ adapter_conf: {}
4
+ allow_multi_rates: false
5
+ allow_variable_data_keys: false
6
+ batch_bins: 3000000
7
+ batch_size: 20
8
+ batch_type: numel
9
+ best_model_criterion:
10
+ - - valid
11
+ - loss
12
+ - min
13
+ - - train
14
+ - loss
15
+ - min
16
+ bpemodel: null
17
+ category_sample_size: 10
18
+ chunk_default_fs: null
19
+ chunk_discard_short_samples: true
20
+ chunk_excluded_key_prefixes: []
21
+ chunk_length: 500
22
+ chunk_max_abs_length: null
23
+ chunk_shift_ratio: 0.5
24
+ cleaner: null
25
+ collect_stats: false
26
+ config: conf/tuning/train_fastspeech2.yaml
27
+ create_graph_in_tensorboard: false
28
+ cudnn_benchmark: false
29
+ cudnn_deterministic: true
30
+ cudnn_enabled: true
31
+ deepspeed_config: null
32
+ detect_anomaly: false
33
+ dist_backend: nccl
34
+ dist_init_method: env://
35
+ dist_launcher: null
36
+ dist_master_addr: localhost
37
+ dist_master_port: 33333
38
+ dist_rank: 0
39
+ dist_world_size: 2
40
+ distributed: true
41
+ drop_last_iter: false
42
+ dry_run: false
43
+ early_stopping_criterion:
44
+ - valid
45
+ - loss
46
+ - min
47
+ energy_extract: energy
48
+ energy_extract_conf:
49
+ fs: 48000
50
+ hop_length: 1024
51
+ n_fft: 8192
52
+ reduction_factor: 1
53
+ win_length: 4096
54
+ energy_normalize: global_mvn
55
+ energy_normalize_conf:
56
+ stats_file: /home/speech/Suji/FS2/Fastspeech2_HS/Models_ph3/Dogri_fem_mono/energy_stats.npz
57
+ exclude_weight_decay: false
58
+ exclude_weight_decay_conf: {}
59
+ feats_extract: fbank
60
+ feats_extract_conf:
61
+ fmax: 24000
62
+ fmin: 0
63
+ fs: 48000
64
+ hop_length: 1024
65
+ n_fft: 8192
66
+ n_mels: 160
67
+ win_length: 4096
68
+ fold_length:
69
+ - 150
70
+ - 819200
71
+ freeze_param: []
72
+ g2p: null
73
+ grad_clip: 1.0
74
+ grad_clip_type: 2.0
75
+ grad_noise: false
76
+ ignore_init_mismatch: false
77
+ init_param: []
78
+ iterator_type: sequence
79
+ keep_nbest_models: 5
80
+ local_rank: 0
81
+ log_interval: null
82
+ log_level: INFO
83
+ max_cache_fd: 32
84
+ max_cache_size: 0.0
85
+ max_epoch: 1000
86
+ model_conf: {}
87
+ multi_task_dataset: false
88
+ multiple_iterator: false
89
+ multiprocessing_distributed: true
90
+ nbest_averaging_interval: 0
91
+ ngpu: 1
92
+ no_forward_run: false
93
+ non_linguistic_symbols: null
94
+ normalize: global_mvn
95
+ normalize_conf:
96
+ stats_file: /home/speech/Suji/FS2/Fastspeech2_HS/Models_ph3/Dogri_fem_mono/feats_stats.npz
97
+ num_att_plot: 3
98
+ num_cache_chunks: 1024
99
+ num_iters_per_epoch: 800
100
+ num_workers: 1
101
+ odim: null
102
+ optim: adam
103
+ optim_conf:
104
+ lr: 1.0
105
+ output_dir: exp/tts_train_fastspeech2_raw_char_None
106
+ patience: null
107
+ pitch_extract: dio
108
+ pitch_extract_conf:
109
+ f0max: 400
110
+ f0min: 80
111
+ fs: 48000
112
+ hop_length: 1024
113
+ n_fft: 8192
114
+ reduction_factor: 1
115
+ pitch_normalize: global_mvn
116
+ pitch_normalize_conf:
117
+ stats_file: /home/speech/Suji/FS2/Fastspeech2_HS/Models_ph3/Dogri_fem_mono/pitch_stats.npz
118
+ pretrain_path: null
119
+ print_config: false
120
+ required:
121
+ - output_dir
122
+ - token_list
123
+ resume: true
124
+ save_strategy: all
125
+ scheduler: noamlr
126
+ scheduler_conf:
127
+ model_size: 384
128
+ warmup_steps: 4000
129
+ seed: 0
130
+ sharded_ddp: false
131
+ shuffle_within_batch: false
132
+ sort_batch: descending
133
+ sort_in_batch: descending
134
+ token_list:
135
+ - <blank>
136
+ - <unk>
137
+ - <space>
138
+ - $
139
+ - ','
140
+ - .
141
+ - M
142
+ - q
143
+ - H
144
+ - k
145
+ - "\u0916"
146
+ - g
147
+ - "\u0918"
148
+ - "\u0919"
149
+ - c
150
+ - C
151
+ - j
152
+ - J
153
+ - "\u091E"
154
+ - "\u091F"
155
+ - "\u0920"
156
+ - "\u0921"
157
+ - "\u0922"
158
+ - "\u0923"
159
+ - t
160
+ - "\u0925"
161
+ - d
162
+ - "\u0927"
163
+ - n
164
+ - "\u0929"
165
+ - p
166
+ - P
167
+ - b
168
+ - B
169
+ - m
170
+ - y
171
+ - r
172
+ - "\u0931"
173
+ - l
174
+ - "\u0D33"
175
+ - Z
176
+ - w
177
+ - "\u0936"
178
+ - "\u0937"
179
+ - s
180
+ - h
181
+ - Y
182
+ - "\u093D"
183
+ - "\u0915"
184
+ - K
185
+ - G
186
+ - z
187
+ - D
188
+ - T
189
+ - f
190
+ - "\u0960"
191
+ - "\u0D7A"
192
+ - N
193
+ - "\u0D7C"
194
+ - "\u0D7D"
195
+ - "\u0D7E"
196
+ - a
197
+ - A
198
+ - i
199
+ - I
200
+ - u
201
+ - U
202
+ - R
203
+ - "\u090D"
204
+ - e
205
+ - E
206
+ - "\u0910"
207
+ - "\u0911"
208
+ - o
209
+ - O
210
+ - "\u0914"
211
+ - "\u0B89"
212
+ - <sos/eos>
213
+ token_type: char
214
+ train_data_path_and_name_and_type:
215
+ - - dump/raw/tr_no_dev/text
216
+ - text
217
+ - text
218
+ - - duration_info/tr_no_dev/durations
219
+ - durations
220
+ - text_int
221
+ - - dump/raw/tr_no_dev/wav.scp
222
+ - speech
223
+ - sound
224
+ - - exp/tts_stats_raw_char_None/train/collect_feats/pitch.scp
225
+ - pitch
226
+ - npy
227
+ - - exp/tts_stats_raw_char_None/train/collect_feats/energy.scp
228
+ - energy
229
+ - npy
230
+ train_dtype: float32
231
+ train_shape_file:
232
+ - exp/tts_stats_raw_char_None/train/text_shape.char
233
+ - exp/tts_stats_raw_char_None/train/speech_shape
234
+ tts: fastspeech2
235
+ tts_conf:
236
+ adim: 384
237
+ aheads: 2
238
+ decoder_normalize_before: true
239
+ dlayers: 4
240
+ dunits: 1536
241
+ duration_predictor_chans: 256
242
+ duration_predictor_kernel_size: 3
243
+ duration_predictor_layers: 2
244
+ elayers: 4
245
+ encoder_normalize_before: true
246
+ energy_embed_dropout: 0.0
247
+ energy_embed_kernel_size: 1
248
+ energy_predictor_chans: 256
249
+ energy_predictor_dropout: 0.5
250
+ energy_predictor_kernel_size: 3
251
+ energy_predictor_layers: 2
252
+ eunits: 1536
253
+ init_dec_alpha: 1.0
254
+ init_enc_alpha: 1.0
255
+ init_type: xavier_uniform
256
+ pitch_embed_dropout: 0.0
257
+ pitch_embed_kernel_size: 1
258
+ pitch_predictor_chans: 256
259
+ pitch_predictor_dropout: 0.5
260
+ pitch_predictor_kernel_size: 5
261
+ pitch_predictor_layers: 5
262
+ positionwise_conv_kernel_size: 3
263
+ positionwise_layer_type: conv1d
264
+ postnet_chans: 256
265
+ postnet_filts: 5
266
+ postnet_layers: 5
267
+ reduction_factor: 1
268
+ stop_gradient_from_energy_predictor: false
269
+ stop_gradient_from_pitch_predictor: true
270
+ transformer_dec_attn_dropout_rate: 0.2
271
+ transformer_dec_dropout_rate: 0.2
272
+ transformer_dec_positional_dropout_rate: 0.2
273
+ transformer_enc_attn_dropout_rate: 0.2
274
+ transformer_enc_dropout_rate: 0.2
275
+ transformer_enc_positional_dropout_rate: 0.2
276
+ use_masking: true
277
+ use_scaled_pos_enc: true
278
+ unused_parameters: false
279
+ use_adapter: false
280
+ use_amp: false
281
+ use_deepspeed: false
282
+ use_matplotlib: true
283
+ use_preprocessor: true
284
+ use_tensorboard: true
285
+ use_tf32: false
286
+ use_wandb: false
287
+ val_scheduler_criterion:
288
+ - valid
289
+ - loss
290
+ valid_batch_bins: null
291
+ valid_batch_size: null
292
+ valid_batch_type: null
293
+ valid_data_path_and_name_and_type:
294
+ - - dump/raw/dev/text
295
+ - text
296
+ - text
297
+ - - duration_info/dev/durations
298
+ - durations
299
+ - text_int
300
+ - - dump/raw/dev/wav.scp
301
+ - speech
302
+ - sound
303
+ - - exp/tts_stats_raw_char_None/valid/collect_feats/pitch.scp
304
+ - pitch
305
+ - npy
306
+ - - exp/tts_stats_raw_char_None/valid/collect_feats/energy.scp
307
+ - energy
308
+ - npy
309
+ valid_iterator_type: null
310
+ valid_max_cache_size: null
311
+ valid_shape_file:
312
+ - exp/tts_stats_raw_char_None/valid/text_shape.char
313
+ - exp/tts_stats_raw_char_None/valid/speech_shape
314
+ version: '202412'
315
+ wandb_entity: null
316
+ wandb_id: null
317
+ wandb_model_log_interval: -1
318
+ wandb_name: null
319
+ wandb_project: null
320
+ write_collected_feats: false
dogri_latest/female/model/energy_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fb130c5668e5ed45e934c17a1538a8756c5eb9c68815ba5d32533e45852eb3a
3
+ size 770
dogri_latest/female/model/feats_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b19d99c343e9d668bd1823dc2ca76ded554b799251ff82714836b467044f1f6b
3
+ size 2042