Upload folder using huggingface_hub
Browse files. This view is limited to 50 files because it contains too many changes. See raw diff
- .gitattributes +73 -35
- LICENSE +395 -0
- NumberToText.py +96 -0
- README.md +115 -0
- api.py +63 -0
- app.py +179 -0
- assamese_latest/female/model/config.yaml +319 -0
- assamese_latest/female/model/energy_stats.npz +3 -0
- assamese_latest/female/model/feats_stats.npz +3 -0
- assamese_latest/female/model/model.pth +3 -0
- assamese_latest/female/model/pitch_stats.npz +3 -0
- assamese_latest/male/model/config.yaml +315 -0
- assamese_latest/male/model/energy_stats.npz +3 -0
- assamese_latest/male/model/feats_stats.npz +3 -0
- assamese_latest/male/model/feats_type +1 -0
- assamese_latest/male/model/model.pth +3 -0
- assamese_latest/male/model/pitch_stats.npz +3 -0
- bengali_latest/male/model/config.yaml +315 -0
- bengali_latest/male/model/energy_stats.npz +3 -0
- bengali_latest/male/model/feats_stats.npz +3 -0
- bengali_latest/male/model/model.pth +3 -0
- bengali_latest/male/model/pitch_stats.npz +3 -0
- bodo_latest/female/model/config.yaml +319 -0
- bodo_latest/female/model/energy_stats.npz +3 -0
- bodo_latest/female/model/feats_stats.npz +3 -0
- bodo_latest/female/model/feats_type +1 -0
- bodo_latest/female/model/model.pth +3 -0
- bodo_latest/female/model/pitch_stats.npz +3 -0
- bodo_latest/male/model/config.yaml +319 -0
- bodo_latest/male/model/energy_stats.npz +3 -0
- bodo_latest/male/model/feats_stats.npz +3 -0
- bodo_latest/male/model/feats_type +1 -0
- bodo_latest/male/model/model.pth +3 -0
- bodo_latest/male/model/pitch_stats.npz +3 -0
- charmap/Text_Cleaning.ipynb +332 -0
- charmap/Text_Cleaning.py +76 -0
- charmap/charmap_Bengali.txt +62 -0
- charmap/charmap_Hindi.txt +81 -0
- charmap/charmap_Hindi.xlsx +0 -0
- charmap/charmap_Malayalam.txt +81 -0
- charmap/charmap_Malayalam.xlsx +0 -0
- charmap/charmap_Marathi.txt +81 -0
- charmap/charmap_Marathi.xlsx +0 -0
- charmap/charmap_Tamil.disabled +76 -0
- charmap/charmap_Tamil.xlsx +0 -0
- charmap/charmap_Telugu.txt +81 -0
- charmap/charmap_Telugu.xlsx +0 -0
- dogri_latest/female/model/config.yaml +320 -0
- dogri_latest/female/model/energy_stats.npz +3 -0
- dogri_latest/female/model/feats_stats.npz +3 -0
.gitattributes
CHANGED
|
@@ -1,35 +1,73 @@
|
|
| 1 |
-
*.7z filter=lfs diff=lfs merge=lfs -text
|
| 2 |
-
*.arrow filter=lfs diff=lfs merge=lfs -text
|
| 3 |
-
*.bin filter=lfs diff=lfs merge=lfs -text
|
| 4 |
-
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
| 5 |
-
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
| 6 |
-
*.ftz filter=lfs diff=lfs merge=lfs -text
|
| 7 |
-
*.gz filter=lfs diff=lfs merge=lfs -text
|
| 8 |
-
*.h5 filter=lfs diff=lfs merge=lfs -text
|
| 9 |
-
*.joblib filter=lfs diff=lfs merge=lfs -text
|
| 10 |
-
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
| 11 |
-
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
| 12 |
-
*.model filter=lfs diff=lfs merge=lfs -text
|
| 13 |
-
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
| 14 |
-
*.npy filter=lfs diff=lfs merge=lfs -text
|
| 15 |
-
*.npz filter=lfs diff=lfs merge=lfs -text
|
| 16 |
-
*.onnx filter=lfs diff=lfs merge=lfs -text
|
| 17 |
-
*.ot filter=lfs diff=lfs merge=lfs -text
|
| 18 |
-
*.parquet filter=lfs diff=lfs merge=lfs -text
|
| 19 |
-
*.pb filter=lfs diff=lfs merge=lfs -text
|
| 20 |
-
*.pickle filter=lfs diff=lfs merge=lfs -text
|
| 21 |
-
*.pkl filter=lfs diff=lfs merge=lfs -text
|
| 22 |
-
*.pt filter=lfs diff=lfs merge=lfs -text
|
| 23 |
-
*.pth filter=lfs diff=lfs merge=lfs -text
|
| 24 |
-
*.rar filter=lfs diff=lfs merge=lfs -text
|
| 25 |
-
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
| 26 |
-
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
| 27 |
-
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
| 28 |
-
*.tar filter=lfs diff=lfs merge=lfs -text
|
| 29 |
-
*.tflite filter=lfs diff=lfs merge=lfs -text
|
| 30 |
-
*.tgz filter=lfs diff=lfs merge=lfs -text
|
| 31 |
-
*.wasm filter=lfs diff=lfs merge=lfs -text
|
| 32 |
-
*.xz filter=lfs diff=lfs merge=lfs -text
|
| 33 |
-
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
-
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
-
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
*.7z filter=lfs diff=lfs merge=lfs -text
|
| 2 |
+
*.arrow filter=lfs diff=lfs merge=lfs -text
|
| 3 |
+
*.bin filter=lfs diff=lfs merge=lfs -text
|
| 4 |
+
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
| 5 |
+
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
| 6 |
+
*.ftz filter=lfs diff=lfs merge=lfs -text
|
| 7 |
+
*.gz filter=lfs diff=lfs merge=lfs -text
|
| 8 |
+
*.h5 filter=lfs diff=lfs merge=lfs -text
|
| 9 |
+
*.joblib filter=lfs diff=lfs merge=lfs -text
|
| 10 |
+
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
| 11 |
+
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
| 12 |
+
*.model filter=lfs diff=lfs merge=lfs -text
|
| 13 |
+
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
| 14 |
+
*.npy filter=lfs diff=lfs merge=lfs -text
|
| 15 |
+
*.npz filter=lfs diff=lfs merge=lfs -text
|
| 16 |
+
*.onnx filter=lfs diff=lfs merge=lfs -text
|
| 17 |
+
*.ot filter=lfs diff=lfs merge=lfs -text
|
| 18 |
+
*.parquet filter=lfs diff=lfs merge=lfs -text
|
| 19 |
+
*.pb filter=lfs diff=lfs merge=lfs -text
|
| 20 |
+
*.pickle filter=lfs diff=lfs merge=lfs -text
|
| 21 |
+
*.pkl filter=lfs diff=lfs merge=lfs -text
|
| 22 |
+
*.pt filter=lfs diff=lfs merge=lfs -text
|
| 23 |
+
*.pth filter=lfs diff=lfs merge=lfs -text
|
| 24 |
+
*.rar filter=lfs diff=lfs merge=lfs -text
|
| 25 |
+
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
| 26 |
+
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
| 27 |
+
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
| 28 |
+
*.tar filter=lfs diff=lfs merge=lfs -text
|
| 29 |
+
*.tflite filter=lfs diff=lfs merge=lfs -text
|
| 30 |
+
*.tgz filter=lfs diff=lfs merge=lfs -text
|
| 31 |
+
*.wasm filter=lfs diff=lfs merge=lfs -text
|
| 32 |
+
*.xz filter=lfs diff=lfs merge=lfs -text
|
| 33 |
+
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
+
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
+
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
license.pdf filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
vocoder/female/assamese_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
vocoder/female/bengali_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
vocoder/female/bodo_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
vocoder/female/dogri_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
vocoder/female/gujarati_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
vocoder/female/hindi_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
vocoder/female/kannada_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
vocoder/female/konkani_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
vocoder/female/maithili_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
vocoder/female/malayalam_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
vocoder/female/manipuri_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
vocoder/female/nepali_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
vocoder/female/punjabi_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
vocoder/female/rajasthani_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
vocoder/female/sanskrit_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
vocoder/female/sindhi_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
vocoder/female/tamil_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
vocoder/female/telugu_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
vocoder/male/assamese_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 56 |
+
vocoder/male/bengali_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 57 |
+
vocoder/male/bodo_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 58 |
+
vocoder/male/dogri_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 59 |
+
vocoder/male/gujarati_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 60 |
+
vocoder/male/hindi_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 61 |
+
vocoder/male/kannada_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 62 |
+
vocoder/male/konkani_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 63 |
+
vocoder/male/maithili_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 64 |
+
vocoder/male/malayalam_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 65 |
+
vocoder/male/manipuri_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 66 |
+
vocoder/male/nepali_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 67 |
+
vocoder/male/punjabi_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 68 |
+
vocoder/male/rajasthani_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 69 |
+
vocoder/male/sanskrit_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 70 |
+
vocoder/male/sindhi_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 71 |
+
vocoder/male/tamil_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 72 |
+
vocoder/male/telugu_latest/generator filter=lfs diff=lfs merge=lfs -text
|
| 73 |
+
ssn_parser_new/scripts/tamil_trans_py filter=lfs diff=lfs merge=lfs -text
|
LICENSE
ADDED
|
@@ -0,0 +1,395 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Attribution 4.0 International
|
| 2 |
+
|
| 3 |
+
=======================================================================
|
| 4 |
+
|
| 5 |
+
Creative Commons Corporation ("Creative Commons") is not a law firm and
|
| 6 |
+
does not provide legal services or legal advice. Distribution of
|
| 7 |
+
Creative Commons public licenses does not create a lawyer-client or
|
| 8 |
+
other relationship. Creative Commons makes its licenses and related
|
| 9 |
+
information available on an "as-is" basis. Creative Commons gives no
|
| 10 |
+
warranties regarding its licenses, any material licensed under their
|
| 11 |
+
terms and conditions, or any related information. Creative Commons
|
| 12 |
+
disclaims all liability for damages resulting from their use to the
|
| 13 |
+
fullest extent possible.
|
| 14 |
+
|
| 15 |
+
Using Creative Commons Public Licenses
|
| 16 |
+
|
| 17 |
+
Creative Commons public licenses provide a standard set of terms and
|
| 18 |
+
conditions that creators and other rights holders may use to share
|
| 19 |
+
original works of authorship and other material subject to copyright
|
| 20 |
+
and certain other rights specified in the public license below. The
|
| 21 |
+
following considerations are for informational purposes only, are not
|
| 22 |
+
exhaustive, and do not form part of our licenses.
|
| 23 |
+
|
| 24 |
+
Considerations for licensors: Our public licenses are
|
| 25 |
+
intended for use by those authorized to give the public
|
| 26 |
+
permission to use material in ways otherwise restricted by
|
| 27 |
+
copyright and certain other rights. Our licenses are
|
| 28 |
+
irrevocable. Licensors should read and understand the terms
|
| 29 |
+
and conditions of the license they choose before applying it.
|
| 30 |
+
Licensors should also secure all rights necessary before
|
| 31 |
+
applying our licenses so that the public can reuse the
|
| 32 |
+
material as expected. Licensors should clearly mark any
|
| 33 |
+
material not subject to the license. This includes other CC-
|
| 34 |
+
licensed material, or material used under an exception or
|
| 35 |
+
limitation to copyright. More considerations for licensors:
|
| 36 |
+
wiki.creativecommons.org/Considerations_for_licensors
|
| 37 |
+
|
| 38 |
+
Considerations for the public: By using one of our public
|
| 39 |
+
licenses, a licensor grants the public permission to use the
|
| 40 |
+
licensed material under specified terms and conditions. If
|
| 41 |
+
the licensor's permission is not necessary for any reason--for
|
| 42 |
+
example, because of any applicable exception or limitation to
|
| 43 |
+
copyright--then that use is not regulated by the license. Our
|
| 44 |
+
licenses grant only permissions under copyright and certain
|
| 45 |
+
other rights that a licensor has authority to grant. Use of
|
| 46 |
+
the licensed material may still be restricted for other
|
| 47 |
+
reasons, including because others have copyright or other
|
| 48 |
+
rights in the material. A licensor may make special requests,
|
| 49 |
+
such as asking that all changes be marked or described.
|
| 50 |
+
Although not required by our licenses, you are encouraged to
|
| 51 |
+
respect those requests where reasonable. More_considerations
|
| 52 |
+
for the public:
|
| 53 |
+
wiki.creativecommons.org/Considerations_for_licensees
|
| 54 |
+
|
| 55 |
+
=======================================================================
|
| 56 |
+
|
| 57 |
+
Creative Commons Attribution 4.0 International Public License
|
| 58 |
+
|
| 59 |
+
By exercising the Licensed Rights (defined below), You accept and agree
|
| 60 |
+
to be bound by the terms and conditions of this Creative Commons
|
| 61 |
+
Attribution 4.0 International Public License ("Public License"). To the
|
| 62 |
+
extent this Public License may be interpreted as a contract, You are
|
| 63 |
+
granted the Licensed Rights in consideration of Your acceptance of
|
| 64 |
+
these terms and conditions, and the Licensor grants You such rights in
|
| 65 |
+
consideration of benefits the Licensor receives from making the
|
| 66 |
+
Licensed Material available under these terms and conditions.
|
| 67 |
+
|
| 68 |
+
|
| 69 |
+
Section 1 -- Definitions.
|
| 70 |
+
|
| 71 |
+
a. Adapted Material means material subject to Copyright and Similar
|
| 72 |
+
Rights that is derived from or based upon the Licensed Material
|
| 73 |
+
and in which the Licensed Material is translated, altered,
|
| 74 |
+
arranged, transformed, or otherwise modified in a manner requiring
|
| 75 |
+
permission under the Copyright and Similar Rights held by the
|
| 76 |
+
Licensor. For purposes of this Public License, where the Licensed
|
| 77 |
+
Material is a musical work, performance, or sound recording,
|
| 78 |
+
Adapted Material is always produced where the Licensed Material is
|
| 79 |
+
synched in timed relation with a moving image.
|
| 80 |
+
|
| 81 |
+
b. Adapter's License means the license You apply to Your Copyright
|
| 82 |
+
and Similar Rights in Your contributions to Adapted Material in
|
| 83 |
+
accordance with the terms and conditions of this Public License.
|
| 84 |
+
|
| 85 |
+
c. Copyright and Similar Rights means copyright and/or similar rights
|
| 86 |
+
closely related to copyright including, without limitation,
|
| 87 |
+
performance, broadcast, sound recording, and Sui Generis Database
|
| 88 |
+
Rights, without regard to how the rights are labeled or
|
| 89 |
+
categorized. For purposes of this Public License, the rights
|
| 90 |
+
specified in Section 2(b)(1)-(2) are not Copyright and Similar
|
| 91 |
+
Rights.
|
| 92 |
+
|
| 93 |
+
d. Effective Technological Measures means those measures that, in the
|
| 94 |
+
absence of proper authority, may not be circumvented under laws
|
| 95 |
+
fulfilling obligations under Article 11 of the WIPO Copyright
|
| 96 |
+
Treaty adopted on December 20, 1996, and/or similar international
|
| 97 |
+
agreements.
|
| 98 |
+
|
| 99 |
+
e. Exceptions and Limitations means fair use, fair dealing, and/or
|
| 100 |
+
any other exception or limitation to Copyright and Similar Rights
|
| 101 |
+
that applies to Your use of the Licensed Material.
|
| 102 |
+
|
| 103 |
+
f. Licensed Material means the artistic or literary work, database,
|
| 104 |
+
or other material to which the Licensor applied this Public
|
| 105 |
+
License.
|
| 106 |
+
|
| 107 |
+
g. Licensed Rights means the rights granted to You subject to the
|
| 108 |
+
terms and conditions of this Public License, which are limited to
|
| 109 |
+
all Copyright and Similar Rights that apply to Your use of the
|
| 110 |
+
Licensed Material and that the Licensor has authority to license.
|
| 111 |
+
|
| 112 |
+
h. Licensor means the individual(s) or entity(ies) granting rights
|
| 113 |
+
under this Public License.
|
| 114 |
+
|
| 115 |
+
i. Share means to provide material to the public by any means or
|
| 116 |
+
process that requires permission under the Licensed Rights, such
|
| 117 |
+
as reproduction, public display, public performance, distribution,
|
| 118 |
+
dissemination, communication, or importation, and to make material
|
| 119 |
+
available to the public including in ways that members of the
|
| 120 |
+
public may access the material from a place and at a time
|
| 121 |
+
individually chosen by them.
|
| 122 |
+
|
| 123 |
+
j. Sui Generis Database Rights means rights other than copyright
|
| 124 |
+
resulting from Directive 96/9/EC of the European Parliament and of
|
| 125 |
+
the Council of 11 March 1996 on the legal protection of databases,
|
| 126 |
+
as amended and/or succeeded, as well as other essentially
|
| 127 |
+
equivalent rights anywhere in the world.
|
| 128 |
+
|
| 129 |
+
k. You means the individual or entity exercising the Licensed Rights
|
| 130 |
+
under this Public License. Your has a corresponding meaning.
|
| 131 |
+
|
| 132 |
+
|
| 133 |
+
Section 2 -- Scope.
|
| 134 |
+
|
| 135 |
+
a. License grant.
|
| 136 |
+
|
| 137 |
+
1. Subject to the terms and conditions of this Public License,
|
| 138 |
+
the Licensor hereby grants You a worldwide, royalty-free,
|
| 139 |
+
non-sublicensable, non-exclusive, irrevocable license to
|
| 140 |
+
exercise the Licensed Rights in the Licensed Material to:
|
| 141 |
+
|
| 142 |
+
a. reproduce and Share the Licensed Material, in whole or
|
| 143 |
+
in part; and
|
| 144 |
+
|
| 145 |
+
b. produce, reproduce, and Share Adapted Material.
|
| 146 |
+
|
| 147 |
+
2. Exceptions and Limitations. For the avoidance of doubt, where
|
| 148 |
+
Exceptions and Limitations apply to Your use, this Public
|
| 149 |
+
License does not apply, and You do not need to comply with
|
| 150 |
+
its terms and conditions.
|
| 151 |
+
|
| 152 |
+
3. Term. The term of this Public License is specified in Section
|
| 153 |
+
6(a).
|
| 154 |
+
|
| 155 |
+
4. Media and formats; technical modifications allowed. The
|
| 156 |
+
Licensor authorizes You to exercise the Licensed Rights in
|
| 157 |
+
all media and formats whether now known or hereafter created,
|
| 158 |
+
and to make technical modifications necessary to do so. The
|
| 159 |
+
Licensor waives and/or agrees not to assert any right or
|
| 160 |
+
authority to forbid You from making technical modifications
|
| 161 |
+
necessary to exercise the Licensed Rights, including
|
| 162 |
+
technical modifications necessary to circumvent Effective
|
| 163 |
+
Technological Measures. For purposes of this Public License,
|
| 164 |
+
simply making modifications authorized by this Section 2(a)
|
| 165 |
+
(4) never produces Adapted Material.
|
| 166 |
+
|
| 167 |
+
5. Downstream recipients.
|
| 168 |
+
|
| 169 |
+
a. Offer from the Licensor -- Licensed Material. Every
|
| 170 |
+
recipient of the Licensed Material automatically
|
| 171 |
+
receives an offer from the Licensor to exercise the
|
| 172 |
+
Licensed Rights under the terms and conditions of this
|
| 173 |
+
Public License.
|
| 174 |
+
|
| 175 |
+
b. No downstream restrictions. You may not offer or impose
|
| 176 |
+
any additional or different terms or conditions on, or
|
| 177 |
+
apply any Effective Technological Measures to, the
|
| 178 |
+
Licensed Material if doing so restricts exercise of the
|
| 179 |
+
Licensed Rights by any recipient of the Licensed
|
| 180 |
+
Material.
|
| 181 |
+
|
| 182 |
+
6. No endorsement. Nothing in this Public License constitutes or
|
| 183 |
+
may be construed as permission to assert or imply that You
|
| 184 |
+
are, or that Your use of the Licensed Material is, connected
|
| 185 |
+
with, or sponsored, endorsed, or granted official status by,
|
| 186 |
+
the Licensor or others designated to receive attribution as
|
| 187 |
+
provided in Section 3(a)(1)(A)(i).
|
| 188 |
+
|
| 189 |
+
b. Other rights.
|
| 190 |
+
|
| 191 |
+
1. Moral rights, such as the right of integrity, are not
|
| 192 |
+
licensed under this Public License, nor are publicity,
|
| 193 |
+
privacy, and/or other similar personality rights; however, to
|
| 194 |
+
the extent possible, the Licensor waives and/or agrees not to
|
| 195 |
+
assert any such rights held by the Licensor to the limited
|
| 196 |
+
extent necessary to allow You to exercise the Licensed
|
| 197 |
+
Rights, but not otherwise.
|
| 198 |
+
|
| 199 |
+
2. Patent and trademark rights are not licensed under this
|
| 200 |
+
Public License.
|
| 201 |
+
|
| 202 |
+
3. To the extent possible, the Licensor waives any right to
|
| 203 |
+
collect royalties from You for the exercise of the Licensed
|
| 204 |
+
Rights, whether directly or through a collecting society
|
| 205 |
+
under any voluntary or waivable statutory or compulsory
|
| 206 |
+
licensing scheme. In all other cases the Licensor expressly
|
| 207 |
+
reserves any right to collect such royalties.
|
| 208 |
+
|
| 209 |
+
|
| 210 |
+
Section 3 -- License Conditions.
|
| 211 |
+
|
| 212 |
+
Your exercise of the Licensed Rights is expressly made subject to the
|
| 213 |
+
following conditions.
|
| 214 |
+
|
| 215 |
+
a. Attribution.
|
| 216 |
+
|
| 217 |
+
1. If You Share the Licensed Material (including in modified
|
| 218 |
+
form), You must:
|
| 219 |
+
|
| 220 |
+
a. retain the following if it is supplied by the Licensor
|
| 221 |
+
with the Licensed Material:
|
| 222 |
+
|
| 223 |
+
i. identification of the creator(s) of the Licensed
|
| 224 |
+
Material and any others designated to receive
|
| 225 |
+
attribution, in any reasonable manner requested by
|
| 226 |
+
the Licensor (including by pseudonym if
|
| 227 |
+
designated);
|
| 228 |
+
|
| 229 |
+
ii. a copyright notice;
|
| 230 |
+
|
| 231 |
+
iii. a notice that refers to this Public License;
|
| 232 |
+
|
| 233 |
+
iv. a notice that refers to the disclaimer of
|
| 234 |
+
warranties;
|
| 235 |
+
|
| 236 |
+
v. a URI or hyperlink to the Licensed Material to the
|
| 237 |
+
extent reasonably practicable;
|
| 238 |
+
|
| 239 |
+
b. indicate if You modified the Licensed Material and
|
| 240 |
+
retain an indication of any previous modifications; and
|
| 241 |
+
|
| 242 |
+
c. indicate the Licensed Material is licensed under this
|
| 243 |
+
Public License, and include the text of, or the URI or
|
| 244 |
+
hyperlink to, this Public License.
|
| 245 |
+
|
| 246 |
+
2. You may satisfy the conditions in Section 3(a)(1) in any
|
| 247 |
+
reasonable manner based on the medium, means, and context in
|
| 248 |
+
which You Share the Licensed Material. For example, it may be
|
| 249 |
+
reasonable to satisfy the conditions by providing a URI or
|
| 250 |
+
hyperlink to a resource that includes the required
|
| 251 |
+
information.
|
| 252 |
+
|
| 253 |
+
3. If requested by the Licensor, You must remove any of the
|
| 254 |
+
information required by Section 3(a)(1)(A) to the extent
|
| 255 |
+
reasonably practicable.
|
| 256 |
+
|
| 257 |
+
4. If You Share Adapted Material You produce, the Adapter's
|
| 258 |
+
License You apply must not prevent recipients of the Adapted
|
| 259 |
+
Material from complying with this Public License.
|
| 260 |
+
|
| 261 |
+
|
| 262 |
+
Section 4 -- Sui Generis Database Rights.
|
| 263 |
+
|
| 264 |
+
Where the Licensed Rights include Sui Generis Database Rights that
|
| 265 |
+
apply to Your use of the Licensed Material:
|
| 266 |
+
|
| 267 |
+
a. for the avoidance of doubt, Section 2(a)(1) grants You the right
|
| 268 |
+
to extract, reuse, reproduce, and Share all or a substantial
|
| 269 |
+
portion of the contents of the database;
|
| 270 |
+
|
| 271 |
+
b. if You include all or a substantial portion of the database
|
| 272 |
+
contents in a database in which You have Sui Generis Database
|
| 273 |
+
Rights, then the database in which You have Sui Generis Database
|
| 274 |
+
Rights (but not its individual contents) is Adapted Material; and
|
| 275 |
+
|
| 276 |
+
c. You must comply with the conditions in Section 3(a) if You Share
|
| 277 |
+
all or a substantial portion of the contents of the database.
|
| 278 |
+
|
| 279 |
+
For the avoidance of doubt, this Section 4 supplements and does not
|
| 280 |
+
replace Your obligations under this Public License where the Licensed
|
| 281 |
+
Rights include other Copyright and Similar Rights.
|
| 282 |
+
|
| 283 |
+
|
| 284 |
+
Section 5 -- Disclaimer of Warranties and Limitation of Liability.
|
| 285 |
+
|
| 286 |
+
a. UNLESS OTHERWISE SEPARATELY UNDERTAKEN BY THE LICENSOR, TO THE
|
| 287 |
+
EXTENT POSSIBLE, THE LICENSOR OFFERS THE LICENSED MATERIAL AS-IS
|
| 288 |
+
AND AS-AVAILABLE, AND MAKES NO REPRESENTATIONS OR WARRANTIES OF
|
| 289 |
+
ANY KIND CONCERNING THE LICENSED MATERIAL, WHETHER EXPRESS,
|
| 290 |
+
IMPLIED, STATUTORY, OR OTHER. THIS INCLUDES, WITHOUT LIMITATION,
|
| 291 |
+
WARRANTIES OF TITLE, MERCHANTABILITY, FITNESS FOR A PARTICULAR
|
| 292 |
+
PURPOSE, NON-INFRINGEMENT, ABSENCE OF LATENT OR OTHER DEFECTS,
|
| 293 |
+
ACCURACY, OR THE PRESENCE OR ABSENCE OF ERRORS, WHETHER OR NOT
|
| 294 |
+
KNOWN OR DISCOVERABLE. WHERE DISCLAIMERS OF WARRANTIES ARE NOT
|
| 295 |
+
ALLOWED IN FULL OR IN PART, THIS DISCLAIMER MAY NOT APPLY TO YOU.
|
| 296 |
+
|
| 297 |
+
b. TO THE EXTENT POSSIBLE, IN NO EVENT WILL THE LICENSOR BE LIABLE
|
| 298 |
+
TO YOU ON ANY LEGAL THEORY (INCLUDING, WITHOUT LIMITATION,
|
| 299 |
+
NEGLIGENCE) OR OTHERWISE FOR ANY DIRECT, SPECIAL, INDIRECT,
|
| 300 |
+
INCIDENTAL, CONSEQUENTIAL, PUNITIVE, EXEMPLARY, OR OTHER LOSSES,
|
| 301 |
+
COSTS, EXPENSES, OR DAMAGES ARISING OUT OF THIS PUBLIC LICENSE OR
|
| 302 |
+
USE OF THE LICENSED MATERIAL, EVEN IF THE LICENSOR HAS BEEN
|
| 303 |
+
ADVISED OF THE POSSIBILITY OF SUCH LOSSES, COSTS, EXPENSES, OR
|
| 304 |
+
DAMAGES. WHERE A LIMITATION OF LIABILITY IS NOT ALLOWED IN FULL OR
|
| 305 |
+
IN PART, THIS LIMITATION MAY NOT APPLY TO YOU.
|
| 306 |
+
|
| 307 |
+
c. The disclaimer of warranties and limitation of liability provided
|
| 308 |
+
above shall be interpreted in a manner that, to the extent
|
| 309 |
+
possible, most closely approximates an absolute disclaimer and
|
| 310 |
+
waiver of all liability.
|
| 311 |
+
|
| 312 |
+
|
| 313 |
+
Section 6 -- Term and Termination.
|
| 314 |
+
|
| 315 |
+
a. This Public License applies for the term of the Copyright and
|
| 316 |
+
Similar Rights licensed here. However, if You fail to comply with
|
| 317 |
+
this Public License, then Your rights under this Public License
|
| 318 |
+
terminate automatically.
|
| 319 |
+
|
| 320 |
+
b. Where Your right to use the Licensed Material has terminated under
|
| 321 |
+
Section 6(a), it reinstates:
|
| 322 |
+
|
| 323 |
+
1. automatically as of the date the violation is cured, provided
|
| 324 |
+
it is cured within 30 days of Your discovery of the
|
| 325 |
+
violation; or
|
| 326 |
+
|
| 327 |
+
2. upon express reinstatement by the Licensor.
|
| 328 |
+
|
| 329 |
+
For the avoidance of doubt, this Section 6(b) does not affect any
|
| 330 |
+
right the Licensor may have to seek remedies for Your violations
|
| 331 |
+
of this Public License.
|
| 332 |
+
|
| 333 |
+
c. For the avoidance of doubt, the Licensor may also offer the
|
| 334 |
+
Licensed Material under separate terms or conditions or stop
|
| 335 |
+
distributing the Licensed Material at any time; however, doing so
|
| 336 |
+
will not terminate this Public License.
|
| 337 |
+
|
| 338 |
+
d. Sections 1, 5, 6, 7, and 8 survive termination of this Public
|
| 339 |
+
License.
|
| 340 |
+
|
| 341 |
+
|
| 342 |
+
Section 7 -- Other Terms and Conditions.
|
| 343 |
+
|
| 344 |
+
a. The Licensor shall not be bound by any additional or different
|
| 345 |
+
terms or conditions communicated by You unless expressly agreed.
|
| 346 |
+
|
| 347 |
+
b. Any arrangements, understandings, or agreements regarding the
|
| 348 |
+
Licensed Material not stated herein are separate from and
|
| 349 |
+
independent of the terms and conditions of this Public License.
|
| 350 |
+
|
| 351 |
+
|
| 352 |
+
Section 8 -- Interpretation.
|
| 353 |
+
|
| 354 |
+
a. For the avoidance of doubt, this Public License does not, and
|
| 355 |
+
shall not be interpreted to, reduce, limit, restrict, or impose
|
| 356 |
+
conditions on any use of the Licensed Material that could lawfully
|
| 357 |
+
be made without permission under this Public License.
|
| 358 |
+
|
| 359 |
+
b. To the extent possible, if any provision of this Public License is
|
| 360 |
+
deemed unenforceable, it shall be automatically reformed to the
|
| 361 |
+
minimum extent necessary to make it enforceable. If the provision
|
| 362 |
+
cannot be reformed, it shall be severed from this Public License
|
| 363 |
+
without affecting the enforceability of the remaining terms and
|
| 364 |
+
conditions.
|
| 365 |
+
|
| 366 |
+
c. No term or condition of this Public License will be waived and no
|
| 367 |
+
failure to comply consented to unless expressly agreed to by the
|
| 368 |
+
Licensor.
|
| 369 |
+
|
| 370 |
+
d. Nothing in this Public License constitutes or may be interpreted
|
| 371 |
+
as a limitation upon, or waiver of, any privileges and immunities
|
| 372 |
+
that apply to the Licensor or You, including from the legal
|
| 373 |
+
processes of any jurisdiction or authority.
|
| 374 |
+
|
| 375 |
+
|
| 376 |
+
=======================================================================
|
| 377 |
+
|
| 378 |
+
Creative Commons is not a party to its public
|
| 379 |
+
licenses. Notwithstanding, Creative Commons may elect to apply one of
|
| 380 |
+
its public licenses to material it publishes and in those instances
|
| 381 |
+
will be considered the “Licensor.” The text of the Creative Commons
|
| 382 |
+
public licenses is dedicated to the public domain under the CC0 Public
|
| 383 |
+
Domain Dedication. Except for the limited purpose of indicating that
|
| 384 |
+
material is shared under a Creative Commons public license or as
|
| 385 |
+
otherwise permitted by the Creative Commons policies published at
|
| 386 |
+
creativecommons.org/policies, Creative Commons does not authorize the
|
| 387 |
+
use of the trademark "Creative Commons" or any other trademark or logo
|
| 388 |
+
of Creative Commons without its prior written consent including,
|
| 389 |
+
without limitation, in connection with any unauthorized modifications
|
| 390 |
+
to any of its public licenses or any other arrangements,
|
| 391 |
+
understandings, or agreements concerning use of licensed material. For
|
| 392 |
+
the avoidance of doubt, this paragraph does not form part of the
|
| 393 |
+
public licenses.
|
| 394 |
+
|
| 395 |
+
Creative Commons may be contacted at creativecommons.org.
|
NumberToText.py
ADDED
|
@@ -0,0 +1,96 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import os
|
| 2 |
+
import csv
|
| 3 |
+
|
| 4 |
+
class NumberDictionary:
    """Spell out numbers in words using per-language CSV lookup tables.

    Every file found in the ``numToText`` directory is treated as a candidate
    ``<language>.csv`` table whose rows are ``key,spoken form`` pairs. Keys are
    looked up as strings: plain numbers (``"0"``, ``"17"``, ``"100"``,
    ``"1000"`` ...) and ``"."`` for the decimal separator.
    """

    def __init__(self):
        """Load every language table found in the ``numToText`` directory."""
        directoryPath = "numToText"
        languages = self.get_filenames_in_folder(directoryPath)
        self.lang_num_dictionary = self.load_language_dictionary(directoryPath, languages)

    def get_filenames_in_folder(self, folder_path):
        """Return the extension-less names of the regular files in *folder_path*.

        Sub-directories are ignored. The extension is removed with
        ``os.path.splitext`` so names are not truncated when the extension is
        not exactly four characters long.
        """
        file_list = []
        for filename in os.listdir(folder_path):
            # Keep plain files only (not sub-directories)
            if os.path.isfile(os.path.join(folder_path, filename)):
                file_list.append(os.path.splitext(filename)[0])
        return file_list

    def load_language_dictionary(self, directory_path, file_names):
        """Read ``<name>.csv`` for each entry of *file_names*.

        Returns a dict mapping language name -> {key: spoken form}. Names
        without a matching CSV file are skipped silently, as are rows with
        fewer than two columns (e.g. blank lines).
        """
        lang_num_dictionary = {}

        for file_name in file_names:
            language = os.path.splitext(file_name)[0]
            file_path = os.path.join(directory_path, f"{file_name}.csv")
            if not os.path.exists(file_path):
                continue

            # utf-8-sig drops a leading BOM (if any) so the first key stays clean;
            # newline='' is what the csv module expects for file objects.
            with open(file_path, 'r', encoding='utf-8-sig', newline='') as file:
                reader = csv.reader(file)
                language_map = {
                    row[0].strip(): row[1].strip()
                    for row in reader
                    if len(row) >= 2
                }

            lang_num_dictionary[language] = language_map

        return lang_num_dictionary

    def num2text(self, input_str, language):
        """Convert the numeric string *input_str* to words in *language*.

        The integer part must lie in 0..999999999999999. Digits after the
        first ``.`` are read out one by one after the table's ``"."`` entry.
        Problems are reported through the returned message string (unsupported
        language, non-numeric input, out-of-range value) rather than raised.
        """
        if language not in self.lang_num_dictionary:
            return "Language not supported."

        integer_part, *decimal_part = input_str.split('.')
        try:
            int_part = int(integer_part)
        except ValueError:
            return "Invalid input. Please provide a valid number."

        if int_part < 0 or int_part > 999999999999999:
            return "Number out of range (0-999999999999999)"

        lang_map = self.lang_num_dictionary[language]
        integer_text = self.convert_to_indian_number(int_part, lang_map)

        if decimal_part:
            decimal_text = lang_map.get('.', '') + ' '
            for digit in decimal_part[0]:
                decimal_text += lang_map.get(digit, '') + ' '
            return (integer_text + ' ' + decimal_text).strip()
        else:
            return integer_text.strip()

    def convert_to_indian_number(self, n, lang_map):
        """Return the words for the non-negative integer *n* using *lang_map*.

        Values up to 100 are taken straight from the table when present.
        Larger values are split recursively around the biggest scale word in
        the table (a numeric key >= 100 that does not exceed *n*). Missing
        entries yield empty strings instead of raising.
        """
        key = str(n)
        if n <= 20 or (n <= 100 and key in lang_map):
            return lang_map.get(key, '')

        if n < 100:
            # Not listed as a single word: compose "tens units". Without this
            # branch the hundreds logic below would recurse on the same value
            # forever (n % 100 == n).
            tens, units = divmod(n, 10)
            parts = [lang_map.get(str(tens * 10), '')]
            if units:
                parts.append(lang_map.get(str(units), ''))
            return ' '.join(part for part in parts if part)

        if n < 1000:
            result = f"{lang_map.get(str(n // 100), '')} {lang_map.get('100', '')}"
            if n % 100 != 0:
                result += f" {self.convert_to_indian_number(n % 100, lang_map)}"
            return result.strip()

        # Largest scale word that fits. Keys below 100 are never scale words;
        # excluding them rules out a zero divisor and guarantees that both
        # recursive calls below work on strictly smaller numbers.
        scale_key = max(
            (k for k in lang_map if k.isdigit() and 100 <= int(k) <= n),
            key=int,
            default=None,
        )
        if scale_key is None:
            return ''

        base = int(scale_key)
        term = lang_map[scale_key]
        if n % base == 0:
            return f"{self.convert_to_indian_number(n // base, lang_map)} {term}"
        else:
            return f"{self.convert_to_indian_number(n // base, lang_map)} {term} {self.convert_to_indian_number(n % base, lang_map)}"
|
| 90 |
+
|
| 91 |
+
|
| 92 |
+
|
| 93 |
+
|
| 94 |
+
# number_dict = NumberDictionary()
|
| 95 |
+
# result = number_dict.num2text("2000048.145", "gujarati")
|
| 96 |
+
# print(result)
|
README.md
CHANGED
|
@@ -1,3 +1,118 @@
|
|
| 1 |
---
|
| 2 |
license: cc-by-4.0
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3 |
---
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
---
|
| 2 |
license: cc-by-4.0
|
| 3 |
+
language:
|
| 4 |
+
- hi
|
| 5 |
+
- as
|
| 6 |
+
- bn
|
| 7 |
+
- bo
|
| 8 |
+
- en
|
| 9 |
+
- gu
|
| 10 |
+
- kn
|
| 11 |
+
- ml
|
| 12 |
+
- mr
|
| 13 |
+
- or
|
| 14 |
+
- pa
|
| 15 |
+
- ta
|
| 16 |
+
- te
|
| 17 |
+
- ur
|
| 18 |
+
tags:
|
| 19 |
+
- tts
|
| 20 |
+
- indictts
|
| 21 |
+
- fs2
|
| 22 |
+
- mfa
|
| 23 |
+
- HS
|
| 24 |
+
- hybrid_segmentation
|
| 25 |
+
- fastspeech2
|
| 26 |
---
|
| 27 |
+
# Latest Fastspeech2 Models using FLAT Start
|
| 28 |
+
|
| 29 |
+
This repository contains new and high quality Fastspeech2 Models for Indian languages implemented using the Flat Start for speech synthesis. The models are capable of generating mel-spectrograms from text inputs and can be used to synthesize speech.
|
| 30 |
+
|
| 31 |
+
This repository is large. The new models are in the `<language>_latest` folders.
|
| 32 |
+
|
| 33 |
+
Supported languages: Assamese, Bengali, Bodo, Dogri, Gujarati, Hindi, Kannada, Konkani(Maharashtrian), Maithili, Malayalam, Manipuri, Nepali, Punjabi, Rajasthani, Sanskrit, Tamil, Telugu.
|
| 34 |
+
|
| 35 |
+
NOTE - I do not own any rights to this repository; all rights belong to the original owners. This repository is meant to make installation of the speech models easier.
|
| 36 |
+
|
| 37 |
+
## Model Files
|
| 38 |
+
|
| 39 |
+
The model for each language includes the following files:
|
| 40 |
+
|
| 41 |
+
- `config.yaml`: Configuration file for the Fastspeech2 Model.
|
| 42 |
+
- `energy_stats.npz`: Energy statistics for normalization during synthesis.
|
| 43 |
+
- `feats_stats.npz`: Features statistics for normalization during synthesis.
|
| 44 |
+
- `feats_type`: Features type information.
|
| 45 |
+
- `pitch_stats.npz`: Pitch statistics for normalization during synthesis.
|
| 46 |
+
- `model.pth`: Pre-trained Fastspeech2 model weights.
|
| 47 |
+
|
| 48 |
+
## Installation
|
| 49 |
+
|
| 50 |
+
1. Install [Miniconda](https://docs.conda.io/projects/miniconda/en/latest/) first. Create a conda environment using the provided `environment.yml` file:
|
| 51 |
+
|
| 52 |
+
```shell
|
| 53 |
+
conda env create -f environment.yml
|
| 54 |
+
```
|
| 55 |
+
|
| 56 |
+
2. Activate the conda environment (check the environment name inside the `environment.yml` file):
|
| 57 |
+
```shell
|
| 58 |
+
conda activate tts-hs-hifigan
|
| 59 |
+
```
|
| 60 |
+
|
| 61 |
+
3. Install PyTorch separately (you can install the specific version based on your requirements):
|
| 62 |
+
```shell
|
| 63 |
+
conda install pytorch cudatoolkit
|
| 64 |
+
pip install torchaudio
|
| 65 |
+
```
|
| 66 |
+
## Vocoder
|
| 67 |
+
For generating WAV files from mel-spectrograms, you can use a vocoder of your choice. One popular option is the [HIFIGAN](https://github.com/jik876/hifi-gan) vocoder (Clone this repo and put it in the current working directory). Please refer to the documentation of the vocoder you choose for installation and usage instructions.
|
| 68 |
+
|
| 69 |
+
(**We have used the HIFIGAN V1 vocoder and have provided vocoders for a few languages in the Vocoder folder. If needed, make sure to adjust the path in the inference file.**)
|
| 70 |
+
|
| 71 |
+
## Usage
|
| 72 |
+
|
| 73 |
+
The directory paths are relative. (If needed, edit **text_preprocess_for_inference.py** and **inference.py** and update the folder/file paths wherever required.)
|
| 74 |
+
|
| 75 |
+
**Please give the language and gender in lowercase and the sample text between quotes. Adjust the output speed using the alpha parameter (higher for slower speech and vice versa). The output argument is optional; the provided name will be used for the output file.**
|
| 76 |
+
|
| 77 |
+
Use the inference file to synthesize speech from text inputs:
|
| 78 |
+
```shell
|
| 79 |
+
python inference.py --sample_text "Your input text here" --language <language>_latest --gender <gender> --alpha <alpha> --output_file <file_name.wav OR path/to/file_name.wav>
|
| 80 |
+
```
|
| 81 |
+
|
| 82 |
+
**Example:**
|
| 83 |
+
|
| 84 |
+
```
|
| 85 |
+
python inference.py --sample_text "श्रीलंका और पाकिस्तान में खेला जा रहा एशिया कप अब तक का सबसे विवादित टूर्नामेंट होता जा रहा है।" --language hindi_latest --gender male --alpha 1 --output_file male_hindi_output.wav
|
| 86 |
+
```
|
| 87 |
+
The file will be stored as `male_hindi_output.wav` and will be inside current working directory. If **--output_file** argument is not given it will be stored as `<language>_<gender>_output.wav` in the current working directory.
|
| 88 |
+
|
| 89 |
+
**Use "language"_latest in --language to use latest models.**
|
| 90 |
+
|
| 91 |
+
|
| 92 |
+
### Citation
|
| 93 |
+
If you use this Fastspeech2 Model in your research or work, please consider citing:
|
| 94 |
+
|
| 95 |
+
“
|
| 96 |
+
COPYRIGHT
|
| 97 |
+
2025, Speech Technology Consortium,
|
| 98 |
+
|
| 99 |
+
Bhashini, MeiTY and by Hema A Murthy & S Umesh,
|
| 100 |
+
|
| 101 |
+
|
| 102 |
+
DEPARTMENT OF COMPUTER SCIENCE AND ENGINEERING
|
| 103 |
+
and
|
| 104 |
+
ELECTRICAL ENGINEERING,
|
| 105 |
+
IIT MADRAS. ALL RIGHTS RESERVED ”
|
| 106 |
+
|
| 107 |
+
|
| 108 |
+
|
| 109 |
+
Shield: [![CC BY 4.0][cc-by-shield]][cc-by]
|
| 110 |
+
|
| 111 |
+
This work is licensed under a
|
| 112 |
+
[Creative Commons Attribution 4.0 International License][cc-by].
|
| 113 |
+
|
| 114 |
+
[![CC BY 4.0][cc-by-image]][cc-by]
|
| 115 |
+
|
| 116 |
+
[cc-by]: http://creativecommons.org/licenses/by/4.0/
|
| 117 |
+
[cc-by-image]: https://i.creativecommons.org/l/by/4.0/88x31.png
|
| 118 |
+
[cc-by-shield]: https://img.shields.io/badge/License-CC%20BY%204.0-lightgrey.svg
|
api.py
ADDED
|
@@ -0,0 +1,63 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# TTS IITM SPEECH LAB
|
| 2 |
+
import requests
|
| 3 |
+
import json
|
| 4 |
+
import base64
|
| 5 |
+
|
| 6 |
+
# Sample sentence to synthesize; uncomment the line matching `lang` below.
text = "सुप्रभात, आप कैसे हैं?" # hindi
# text = "സുപ്രഭാതം, സുഖമാ?" # malayalam
# text = "সুপ্ৰভাত, তুমি কেনে?" # manipuri
# text = "सुप्रभात, तुम्ही कसे आहात?" # marathi
# text = "ಶುಭೋದಯ, ನೀವು ಹೇಗಿದ್ದೀರಿ?" # kannada
# text = "बसु म्विथ्बो, बरि दिबाबो?" # bodo male not working <---
# text = "Good morning, how are you?" # english
# text = "সুপ্ৰভাত, আপুনি কেমন আছে?" # assamese
# text = "காலை வணக்கம், நீங்கள் எப்படி இருக்கின்றீர்கள்?" # tamil
# text = "ସୁପ୍ରଭାତ, ଆପଣ କେମିତି ଅଛନ୍ତି?" # odia male not working <---
# text = "सुप्रभात, आप कैसे छो?" # rajasthani
# text = "శుభోదయం, మీరు ఎలా ఉన్నారు?" # telugu
# text = "সুপ্রভাত, আপনি কেমন আছেন?" # bengali male not working <---
# text = "સુપ્રભાત, તમે કેમ છો?" # gujarati

lang = 'hindi'
gender = 'female'

url = "http://localhost:4005/tts"
# url = 'http://projects.respark.iitm.ac.in:8009/tts' # proxy

# Build the JSON request body for the /tts endpoint.
payload = json.dumps({
    "input": text,
    "gender": gender,
    "lang": lang,
    "alpha": 1,
    "segmentwise":"True"
})
headers = {'Content-Type': 'application/json'}
response = requests.request("POST", url, headers=headers, data=payload).json()

# A failed request carries {"status": "failure", "reason": ...} and no "audio"
# key, so surface the reason instead of dying on a KeyError below.
if response.get('status') == 'failure':
    raise SystemExit(f"TTS request failed: {response.get('reason', response)}")

# The audio comes back base64-encoded.
# NOTE(review): the bundled app.py server produces WAV data, so the ".mp3"
# extension looks misleading - confirm before renaming the output file.
audio = response['audio']
file_name = "tts.mp3"
decode_string = base64.b64decode(audio)
with open(file_name,'wb') as wav_file:
    wav_file.write(decode_string)
|
| 43 |
+
|
| 44 |
+
'''
|
| 45 |
+
Supported languages
|
| 46 |
+
|
| 47 |
+
Assamese
|
| 48 |
+
Bengali
|
| 49 |
+
Bodo
|
| 50 |
+
English
|
| 51 |
+
Gujarati
|
| 52 |
+
Hindi
|
| 53 |
+
Kannada
|
| 54 |
+
Malayalam
|
| 55 |
+
Manipuri
|
| 56 |
+
Marathi
|
| 57 |
+
Odia
|
| 58 |
+
Punjabi
|
| 59 |
+
Rajasthani
|
| 60 |
+
Tamil
|
| 61 |
+
Telugu
|
| 62 |
+
Urdu
|
| 63 |
+
'''
|
app.py
ADDED
|
@@ -0,0 +1,179 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
from flask import Flask, render_template, request, send_file, jsonify
|
| 2 |
+
import requests
|
| 3 |
+
import json
|
| 4 |
+
import ssl
|
| 5 |
+
import logging
|
| 6 |
+
import sys
|
| 7 |
+
import os
|
| 8 |
+
import base64
|
| 9 |
+
import io
|
| 10 |
+
#replace the path with your hifigan path to import Generator from models.py
|
| 11 |
+
sys.path.append("hifigan")
|
| 12 |
+
# import argparse
|
| 13 |
+
import torch
|
| 14 |
+
from espnet2.bin.tts_inference import Text2Speech
|
| 15 |
+
from models import Generator
|
| 16 |
+
from scipy.io.wavfile import write
|
| 17 |
+
from meldataset import MAX_WAV_VALUE
|
| 18 |
+
from env import AttrDict
|
| 19 |
+
import json
|
| 20 |
+
import yaml
|
| 21 |
+
from text_preprocess_for_inference import TTSDurAlignPreprocessor
|
| 22 |
+
# import time
|
| 23 |
+
|
| 24 |
+
# Log records (INFO and above) go to access.log in the working directory.
logging.basicConfig(
    filename='access.log',
    level=logging.INFO,
    format='%(asctime)s - %(levelname)s - %(message)s',
)

# Sample rate used when writing the synthesized audio.
SAMPLING_RATE = 22050

# Run on the GPU whenever torch can see one, otherwise fall back to the CPU.
device = "cuda" if torch.cuda.is_available() else "cpu"

# Shared text preprocessor used by the /tts route.
preprocessor = TTSDurAlignPreprocessor()

app = Flask(__name__)
|
| 35 |
+
# app.config['SECRET_KEY'] = 'key'
|
| 36 |
+
# socketio = SocketIO(app)
|
| 37 |
+
|
| 38 |
+
# @socketio.on('new_user')
|
| 39 |
+
# def handle_new_user(data):
|
| 40 |
+
# client_id = data['id']
|
| 41 |
+
# # print('\n'+f"New user connected with ID: {client_id}")
|
| 42 |
+
# logging.info('\n'+f"New user connected with ID: {client_id}")
|
| 43 |
+
|
| 44 |
+
def load_hifigan_vocoder(language, gender, device):
    """Build a HiFi-GAN generator that is ready for inference.

    The configuration and checkpoint are read from
    ``vocoder/<gender>/aryan/hifigan``. ``language`` is accepted for interface
    symmetry but is not used when building these paths.

    Returns the generator moved to *device*, switched to eval mode and with
    weight normalization removed.
    """
    config_path = f"vocoder/{gender}/aryan/hifigan/config.json"
    checkpoint_path = f"vocoder/{gender}/aryan/hifigan/generator"

    # Parse the vocoder hyper-parameters
    with open(config_path, 'r') as cfg_file:
        raw_config = cfg_file.read()
    h = AttrDict(json.loads(raw_config))
    torch.manual_seed(h.seed)

    # Instantiate on the target device and restore the trained weights
    target = torch.device(device)
    generator = Generator(h).to(target)
    checkpoint = torch.load(checkpoint_path, target)
    generator.load_state_dict(checkpoint['generator'])

    # Inference-only setup
    generator.eval()
    generator.remove_weight_norm()
    return generator
|
| 64 |
+
|
| 65 |
+
def load_fastspeech2_model(language, gender, device):
    """Load the FastSpeech2 model stored under ``<language>/<gender>/model``.

    The model's ``config.yaml`` must point at the statistics files (features,
    pitch, energy) by absolute path, so the three ``stats_file`` entries are
    set to paths below the current working directory. The file is rewritten
    only when an entry actually changes: this function runs for every
    synthesis call, and rewriting the config each time risks another request
    reading a half-written file.

    Returns a ``Text2Speech`` instance placed on *device*.
    """
    tts_model = f"{language}/{gender}/model/model.pth"
    tts_config = f"{language}/{gender}/model/config.yaml"

    # The config holds non-ASCII tokens, so read it explicitly as UTF-8
    # instead of relying on the platform default encoding.
    with open(tts_config, "r", encoding="utf-8") as file:
        config = yaml.safe_load(file)

    current_working_directory = os.getcwd()
    stats_files = {
        "normalize_conf": "model/feats_stats.npz",
        "pitch_normalize_conf": "model/pitch_stats.npz",
        "energy_normalize_conf": "model/energy_stats.npz",
    }

    # Point each normalization section at this checkout's statistics file
    changed = False
    for section, relative_path in stats_files.items():
        stats_path = os.path.join(current_working_directory, language, gender, relative_path)
        if config[section].get("stats_file") != stats_path:
            config[section]["stats_file"] = stats_path
            changed = True

    if changed:
        with open(tts_config, "w", encoding="utf-8") as file:
            yaml.dump(config, file)

    return Text2Speech(train_config=tts_config, model_file=tts_model, device=device)
|
| 93 |
+
|
| 94 |
+
def text_synthesis(language, gender, sample_text, vocoder, MAX_WAV_VALUE, device, alpha=1):
    """Synthesize *sample_text* and return the audio as an int16 NumPy array.

    The FastSpeech2 model for (*language*, *gender*) is loaded on each call
    and produces the features, which *vocoder* turns into a waveform. The
    waveform is scaled by *MAX_WAV_VALUE* before the int16 conversion.
    *alpha* is forwarded to the model through ``decode_conf``.
    """
    with torch.no_grad():
        # Text -> acoustic features
        tts = load_fastspeech2_model(language, gender, device)
        result = tts(sample_text, decode_conf={"alpha": alpha})
        print("TTS Done")

        # NOTE(review): 2.3262 is an unexplained scale factor applied to the
        # de-normalized features before vocoding - confirm its origin.
        mel = result["feat_gen_denorm"].T.unsqueeze(0) * 2.3262
        mel = mel.to(device)

        # Acoustic features -> waveform samples
        waveform = vocoder(mel).squeeze() * MAX_WAV_VALUE
        return waveform.cpu().numpy().astype('int16')
|
| 115 |
+
|
| 116 |
+
def setup_app():
    """Load a vocoder for every gender/language pair and warm each one up.

    For each combination the HiFi-GAN vocoder is loaded and one short greeting
    is synthesized as a dummy call. A failing dummy call is reported on stdout
    together with its reason and does not stop start-up.

    Returns a nested dict: ``vocoders[gender][language] -> vocoder``.
    """
    genders = ['male','female']
    # to make dummy calls in all languages available
    languages = {'hindi': "नमस्ते",'malayalam': "ഹലോ",'manipuri': "হ্যালো",'marathi': "हॅलो",'kannada': "ಹಲೋ",'bodo': "हॅलो",'english': "Hello",'assamese': "হ্যালো",'tamil': "ஹலோ",'odia': "ହେଲୋ",'rajasthani': "हॅलो",'telugu': "హలో",'bengali': "হ্যালো",'gujarati': "હલો"}

    vocoders = {}
    for gender in genders:
        vocoders[gender]={}
        for language,text in languages.items():
            # Load the HiFi-GAN vocoder with dynamic language and gender
            vocoder = load_hifigan_vocoder(language, gender, device)
            vocoders[gender][language] = vocoder
            # dummy calls
            print(f"making dummy calls for {language} - {gender}")
            try:
                text_synthesis(language, gender, text, vocoder, MAX_WAV_VALUE, device)
            except Exception as err:
                # Catch Exception only, so Ctrl-C / SystemExit still abort
                # start-up, and show why the combination is unavailable.
                message = f"cannot make dummy call for {gender} - {language} <==================="
                print(message.upper())
                print(f"reason: {err!r}")

    print("Server Started...")
    return vocoders
|
| 138 |
+
vocoders = setup_app()
|
| 139 |
+
|
| 140 |
+
@app.route('/', methods=['GET'])
def main():
    """Root route: reply with the service identifier string."""
    service_name = "IITM_TTS_V2"
    return service_name
|
| 143 |
+
|
| 144 |
+
@app.route('/tts', methods=['GET', 'POST'], strict_slashes=False)
def tts():
    """Synthesize speech for the JSON request body.

    Expected fields: ``input`` (str), ``gender``, ``lang`` and optionally
    ``alpha`` (defaults to 1). On success the reply is
    ``{"status": "success", "audio": <base64 WAV>}``; any problem yields
    ``{"status": "failure", "reason": <message>}``.
    """
    try:
        json_data = request.get_json()
        text = json_data["input"]
        if not isinstance(text,str):
            input_type = type(text)
            # Return right away: carrying on would feed the non-string value
            # to the preprocessor and overwrite this error message.
            return jsonify(status='failure', reason=f"Unsupported input type {input_type}. Input text should be in string format.")
        gender = json_data["gender"]
        language = json_data["lang"].lower()
        alpha = json_data.get("alpha", 1)
        # Preprocess the sample text
        preprocessed_text, phrases = preprocessor.preprocess(text, language, gender)
        preprocessed_text = " ".join(preprocessed_text)
        vocoder = vocoders[gender][language]
        out = text_synthesis(language, gender, preprocessed_text, vocoder, MAX_WAV_VALUE, device, alpha=alpha)

        # Encode the WAV in memory to avoid saving a file on disk
        output_stream = io.BytesIO()
        write(output_stream, SAMPLING_RATE, out)
        audio_wav_bytes = base64.b64encode(output_stream.getvalue())

        ret = jsonify(status="success",audio=audio_wav_bytes.decode('utf-8'))

    except Exception as err:
        # Keep the traceback in the log; the client only receives the message.
        logging.exception("TTS request failed")
        ret = jsonify(status="failure", reason=str(err))
    return ret
|
| 175 |
+
|
| 176 |
+
if __name__ == '__main__':
    # ssl_context = ssl.create_default_context(ssl.Purpose.CLIENT_AUTH)
    # ssl_context.load_cert_chain('./ssl2023/iitm2022.crt','./ssl2023/iitm2022.key')

    # The server listens on all interfaces, so debug mode stays off unless it
    # is requested explicitly with FLASK_DEBUG=1: the interactive debugger
    # lets anyone who can reach the port execute code.
    debug_mode = os.environ.get("FLASK_DEBUG", "0") == "1"
    app.run(host='0.0.0.0', port=4005, debug=debug_mode)
|
assamese_latest/female/model/config.yaml
ADDED
|
@@ -0,0 +1,319 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
config: conf/tuning/train_fastspeech2.yaml
|
| 2 |
+
print_config: false
|
| 3 |
+
log_level: INFO
|
| 4 |
+
drop_last_iter: false
|
| 5 |
+
dry_run: false
|
| 6 |
+
iterator_type: sequence
|
| 7 |
+
valid_iterator_type: null
|
| 8 |
+
output_dir: exp/tts_train_fastspeech2_raw_char_None
|
| 9 |
+
ngpu: 1
|
| 10 |
+
seed: 0
|
| 11 |
+
num_workers: 1
|
| 12 |
+
num_att_plot: 3
|
| 13 |
+
dist_backend: nccl
|
| 14 |
+
dist_init_method: env://
|
| 15 |
+
dist_world_size: 2
|
| 16 |
+
dist_rank: 0
|
| 17 |
+
local_rank: 0
|
| 18 |
+
dist_master_addr: localhost
|
| 19 |
+
dist_master_port: 36807
|
| 20 |
+
dist_launcher: null
|
| 21 |
+
multiprocessing_distributed: true
|
| 22 |
+
unused_parameters: false
|
| 23 |
+
sharded_ddp: false
|
| 24 |
+
use_deepspeed: false
|
| 25 |
+
deepspeed_config: null
|
| 26 |
+
cudnn_enabled: true
|
| 27 |
+
cudnn_benchmark: false
|
| 28 |
+
cudnn_deterministic: true
|
| 29 |
+
use_tf32: false
|
| 30 |
+
collect_stats: false
|
| 31 |
+
write_collected_feats: false
|
| 32 |
+
max_epoch: 1000
|
| 33 |
+
patience: null
|
| 34 |
+
val_scheduler_criterion:
|
| 35 |
+
- valid
|
| 36 |
+
- loss
|
| 37 |
+
early_stopping_criterion:
|
| 38 |
+
- valid
|
| 39 |
+
- loss
|
| 40 |
+
- min
|
| 41 |
+
best_model_criterion:
|
| 42 |
+
- - valid
|
| 43 |
+
- loss
|
| 44 |
+
- min
|
| 45 |
+
- - train
|
| 46 |
+
- loss
|
| 47 |
+
- min
|
| 48 |
+
keep_nbest_models: 5
|
| 49 |
+
nbest_averaging_interval: 0
|
| 50 |
+
grad_clip: 1.0
|
| 51 |
+
grad_clip_type: 2.0
|
| 52 |
+
grad_noise: false
|
| 53 |
+
accum_grad: 8
|
| 54 |
+
no_forward_run: false
|
| 55 |
+
resume: true
|
| 56 |
+
train_dtype: float32
|
| 57 |
+
use_amp: false
|
| 58 |
+
log_interval: null
|
| 59 |
+
use_matplotlib: true
|
| 60 |
+
use_tensorboard: true
|
| 61 |
+
create_graph_in_tensorboard: false
|
| 62 |
+
use_wandb: false
|
| 63 |
+
wandb_project: null
|
| 64 |
+
wandb_id: null
|
| 65 |
+
wandb_entity: null
|
| 66 |
+
wandb_name: null
|
| 67 |
+
wandb_model_log_interval: -1
|
| 68 |
+
detect_anomaly: false
|
| 69 |
+
use_adapter: false
|
| 70 |
+
adapter: lora
|
| 71 |
+
save_strategy: all
|
| 72 |
+
adapter_conf: {}
|
| 73 |
+
pretrain_path: null
|
| 74 |
+
init_param: []
|
| 75 |
+
ignore_init_mismatch: false
|
| 76 |
+
freeze_param: []
|
| 77 |
+
num_iters_per_epoch: 800
|
| 78 |
+
batch_size: 20
|
| 79 |
+
valid_batch_size: null
|
| 80 |
+
batch_bins: 3000000
|
| 81 |
+
valid_batch_bins: null
|
| 82 |
+
train_shape_file:
|
| 83 |
+
- exp/tts_stats_raw_char_None/train/text_shape.char
|
| 84 |
+
- exp/tts_stats_raw_char_None/train/speech_shape
|
| 85 |
+
valid_shape_file:
|
| 86 |
+
- exp/tts_stats_raw_char_None/valid/text_shape.char
|
| 87 |
+
- exp/tts_stats_raw_char_None/valid/speech_shape
|
| 88 |
+
batch_type: numel
|
| 89 |
+
valid_batch_type: null
|
| 90 |
+
fold_length:
|
| 91 |
+
- 150
|
| 92 |
+
- 819200
|
| 93 |
+
sort_in_batch: descending
|
| 94 |
+
shuffle_within_batch: false
|
| 95 |
+
sort_batch: descending
|
| 96 |
+
multiple_iterator: false
|
| 97 |
+
chunk_length: 500
|
| 98 |
+
chunk_shift_ratio: 0.5
|
| 99 |
+
num_cache_chunks: 1024
|
| 100 |
+
chunk_excluded_key_prefixes: []
|
| 101 |
+
chunk_default_fs: null
|
| 102 |
+
chunk_max_abs_length: null
|
| 103 |
+
chunk_discard_short_samples: true
|
| 104 |
+
train_data_path_and_name_and_type:
|
| 105 |
+
- - dump/raw/tr_no_dev/text
|
| 106 |
+
- text
|
| 107 |
+
- text
|
| 108 |
+
- - duration_info/tr_no_dev/durations
|
| 109 |
+
- durations
|
| 110 |
+
- text_int
|
| 111 |
+
- - dump/raw/tr_no_dev/wav.scp
|
| 112 |
+
- speech
|
| 113 |
+
- sound
|
| 114 |
+
- - exp/tts_stats_raw_char_None/train/collect_feats/pitch.scp
|
| 115 |
+
- pitch
|
| 116 |
+
- npy
|
| 117 |
+
- - exp/tts_stats_raw_char_None/train/collect_feats/energy.scp
|
| 118 |
+
- energy
|
| 119 |
+
- npy
|
| 120 |
+
valid_data_path_and_name_and_type:
|
| 121 |
+
- - dump/raw/dev/text
|
| 122 |
+
- text
|
| 123 |
+
- text
|
| 124 |
+
- - duration_info/dev/durations
|
| 125 |
+
- durations
|
| 126 |
+
- text_int
|
| 127 |
+
- - dump/raw/dev/wav.scp
|
| 128 |
+
- speech
|
| 129 |
+
- sound
|
| 130 |
+
- - exp/tts_stats_raw_char_None/valid/collect_feats/pitch.scp
|
| 131 |
+
- pitch
|
| 132 |
+
- npy
|
| 133 |
+
- - exp/tts_stats_raw_char_None/valid/collect_feats/energy.scp
|
| 134 |
+
- energy
|
| 135 |
+
- npy
|
| 136 |
+
multi_task_dataset: false
|
| 137 |
+
allow_variable_data_keys: false
|
| 138 |
+
max_cache_size: 0.0
|
| 139 |
+
max_cache_fd: 32
|
| 140 |
+
allow_multi_rates: false
|
| 141 |
+
valid_max_cache_size: null
|
| 142 |
+
exclude_weight_decay: false
|
| 143 |
+
exclude_weight_decay_conf: {}
|
| 144 |
+
optim: adam
|
| 145 |
+
optim_conf:
|
| 146 |
+
lr: 1.0
|
| 147 |
+
scheduler: noamlr
|
| 148 |
+
scheduler_conf:
|
| 149 |
+
model_size: 384
|
| 150 |
+
warmup_steps: 4000
|
| 151 |
+
token_list:
|
| 152 |
+
- <blank>
|
| 153 |
+
- <unk>
|
| 154 |
+
- <space>
|
| 155 |
+
- $
|
| 156 |
+
- ','
|
| 157 |
+
- .
|
| 158 |
+
- M
|
| 159 |
+
- q
|
| 160 |
+
- H
|
| 161 |
+
- k
|
| 162 |
+
- ख
|
| 163 |
+
- g
|
| 164 |
+
- घ
|
| 165 |
+
- ङ
|
| 166 |
+
- c
|
| 167 |
+
- C
|
| 168 |
+
- j
|
| 169 |
+
- J
|
| 170 |
+
- ञ
|
| 171 |
+
- ट
|
| 172 |
+
- ठ
|
| 173 |
+
- ड
|
| 174 |
+
- ढ
|
| 175 |
+
- ण
|
| 176 |
+
- t
|
| 177 |
+
- थ
|
| 178 |
+
- d
|
| 179 |
+
- ध
|
| 180 |
+
- n
|
| 181 |
+
- ऩ
|
| 182 |
+
- p
|
| 183 |
+
- P
|
| 184 |
+
- b
|
| 185 |
+
- B
|
| 186 |
+
- m
|
| 187 |
+
- y
|
| 188 |
+
- r
|
| 189 |
+
- ऱ
|
| 190 |
+
- l
|
| 191 |
+
- ള
|
| 192 |
+
- Z
|
| 193 |
+
- w
|
| 194 |
+
- श
|
| 195 |
+
- ष
|
| 196 |
+
- s
|
| 197 |
+
- h
|
| 198 |
+
- Y
|
| 199 |
+
- ऽ
|
| 200 |
+
- क
|
| 201 |
+
- K
|
| 202 |
+
- G
|
| 203 |
+
- z
|
| 204 |
+
- D
|
| 205 |
+
- T
|
| 206 |
+
- f
|
| 207 |
+
- ॠ
|
| 208 |
+
- ൺ
|
| 209 |
+
- N
|
| 210 |
+
- ർ
|
| 211 |
+
- ൽ
|
| 212 |
+
- ൾ
|
| 213 |
+
- a
|
| 214 |
+
- A
|
| 215 |
+
- i
|
| 216 |
+
- I
|
| 217 |
+
- u
|
| 218 |
+
- U
|
| 219 |
+
- R
|
| 220 |
+
- ऍ
|
| 221 |
+
- e
|
| 222 |
+
- E
|
| 223 |
+
- ऐ
|
| 224 |
+
- ऑ
|
| 225 |
+
- o
|
| 226 |
+
- O
|
| 227 |
+
- औ
|
| 228 |
+
- உ
|
| 229 |
+
- <sos/eos>
|
| 230 |
+
odim: null
|
| 231 |
+
model_conf: {}
|
| 232 |
+
use_preprocessor: true
|
| 233 |
+
token_type: char
|
| 234 |
+
bpemodel: null
|
| 235 |
+
non_linguistic_symbols: null
|
| 236 |
+
cleaner: null
|
| 237 |
+
g2p: null
|
| 238 |
+
feats_extract: fbank
|
| 239 |
+
feats_extract_conf:
|
| 240 |
+
n_fft: 8192
|
| 241 |
+
hop_length: 1024
|
| 242 |
+
win_length: 4096
|
| 243 |
+
fs: 48000
|
| 244 |
+
fmin: 0
|
| 245 |
+
fmax: 24000
|
| 246 |
+
n_mels: 160
|
| 247 |
+
normalize: global_mvn
|
| 248 |
+
normalize_conf:
|
| 249 |
+
stats_file: exp/tts_stats_raw_char_None/train/feats_stats.npz
|
| 250 |
+
tts: fastspeech2
|
| 251 |
+
tts_conf:
|
| 252 |
+
adim: 384
|
| 253 |
+
aheads: 2
|
| 254 |
+
elayers: 4
|
| 255 |
+
eunits: 1536
|
| 256 |
+
dlayers: 4
|
| 257 |
+
dunits: 1536
|
| 258 |
+
positionwise_layer_type: conv1d
|
| 259 |
+
positionwise_conv_kernel_size: 3
|
| 260 |
+
duration_predictor_layers: 2
|
| 261 |
+
duration_predictor_chans: 256
|
| 262 |
+
duration_predictor_kernel_size: 3
|
| 263 |
+
postnet_layers: 5
|
| 264 |
+
postnet_filts: 5
|
| 265 |
+
postnet_chans: 256
|
| 266 |
+
use_masking: true
|
| 267 |
+
use_scaled_pos_enc: true
|
| 268 |
+
encoder_normalize_before: true
|
| 269 |
+
decoder_normalize_before: true
|
| 270 |
+
reduction_factor: 1
|
| 271 |
+
init_type: xavier_uniform
|
| 272 |
+
init_enc_alpha: 1.0
|
| 273 |
+
init_dec_alpha: 1.0
|
| 274 |
+
transformer_enc_dropout_rate: 0.2
|
| 275 |
+
transformer_enc_positional_dropout_rate: 0.2
|
| 276 |
+
transformer_enc_attn_dropout_rate: 0.2
|
| 277 |
+
transformer_dec_dropout_rate: 0.2
|
| 278 |
+
transformer_dec_positional_dropout_rate: 0.2
|
| 279 |
+
transformer_dec_attn_dropout_rate: 0.2
|
| 280 |
+
pitch_predictor_layers: 5
|
| 281 |
+
pitch_predictor_chans: 256
|
| 282 |
+
pitch_predictor_kernel_size: 5
|
| 283 |
+
pitch_predictor_dropout: 0.5
|
| 284 |
+
pitch_embed_kernel_size: 1
|
| 285 |
+
pitch_embed_dropout: 0.0
|
| 286 |
+
stop_gradient_from_pitch_predictor: true
|
| 287 |
+
energy_predictor_layers: 2
|
| 288 |
+
energy_predictor_chans: 256
|
| 289 |
+
energy_predictor_kernel_size: 3
|
| 290 |
+
energy_predictor_dropout: 0.5
|
| 291 |
+
energy_embed_kernel_size: 1
|
| 292 |
+
energy_embed_dropout: 0.0
|
| 293 |
+
stop_gradient_from_energy_predictor: false
|
| 294 |
+
pitch_extract: dio
|
| 295 |
+
pitch_extract_conf:
|
| 296 |
+
fs: 48000
|
| 297 |
+
n_fft: 8192
|
| 298 |
+
hop_length: 1024
|
| 299 |
+
f0max: 400
|
| 300 |
+
f0min: 80
|
| 301 |
+
reduction_factor: 1
|
| 302 |
+
pitch_normalize: global_mvn
|
| 303 |
+
pitch_normalize_conf:
|
| 304 |
+
stats_file: exp/tts_stats_raw_char_None/train/pitch_stats.npz
|
| 305 |
+
energy_extract: energy
|
| 306 |
+
energy_extract_conf:
|
| 307 |
+
fs: 48000
|
| 308 |
+
n_fft: 8192
|
| 309 |
+
hop_length: 1024
|
| 310 |
+
win_length: 4096
|
| 311 |
+
reduction_factor: 1
|
| 312 |
+
energy_normalize: global_mvn
|
| 313 |
+
energy_normalize_conf:
|
| 314 |
+
stats_file: exp/tts_stats_raw_char_None/train/energy_stats.npz
|
| 315 |
+
required:
|
| 316 |
+
- output_dir
|
| 317 |
+
- token_list
|
| 318 |
+
version: '202402'
|
| 319 |
+
distributed: true
|
assamese_latest/female/model/energy_stats.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:04e33101ff3538ca740f6c8fc35483fffab31722c9f0ae99adab07dd29c361de
|
| 3 |
+
size 770
|
assamese_latest/female/model/feats_stats.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2b9b6ee7475d00198e08ea5b675f2cb5e81239a5f0babf83866b37b51ef2e0a1
|
| 3 |
+
size 2042
|
assamese_latest/female/model/model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e5cd37cac859ad35acd2d0510fe3b4c5b388d167c9d70fb12efd1f5d0b03560
|
| 3 |
+
size 152129434
|
assamese_latest/female/model/pitch_stats.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3dbac0bea459888e39a56f5f04e150d35a21f966e6e04b1d027c354e9de99aab
|
| 3 |
+
size 770
|
assamese_latest/male/model/config.yaml
ADDED
|
@@ -0,0 +1,315 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
accum_grad: 8
|
| 2 |
+
adapter: lora
|
| 3 |
+
adapter_conf: {}
|
| 4 |
+
allow_multi_rates: false
|
| 5 |
+
allow_variable_data_keys: false
|
| 6 |
+
batch_bins: 3000000
|
| 7 |
+
batch_size: 20
|
| 8 |
+
batch_type: numel
|
| 9 |
+
best_model_criterion:
|
| 10 |
+
- - valid
|
| 11 |
+
- loss
|
| 12 |
+
- min
|
| 13 |
+
- - train
|
| 14 |
+
- loss
|
| 15 |
+
- min
|
| 16 |
+
bpemodel: null
|
| 17 |
+
chunk_default_fs: null
|
| 18 |
+
chunk_discard_short_samples: true
|
| 19 |
+
chunk_excluded_key_prefixes: []
|
| 20 |
+
chunk_length: 500
|
| 21 |
+
chunk_max_abs_length: null
|
| 22 |
+
chunk_shift_ratio: 0.5
|
| 23 |
+
cleaner: null
|
| 24 |
+
collect_stats: false
|
| 25 |
+
config: conf/tuning/train_fastspeech2.yaml
|
| 26 |
+
create_graph_in_tensorboard: false
|
| 27 |
+
cudnn_benchmark: false
|
| 28 |
+
cudnn_deterministic: true
|
| 29 |
+
cudnn_enabled: true
|
| 30 |
+
detect_anomaly: false
|
| 31 |
+
dist_backend: nccl
|
| 32 |
+
dist_init_method: env://
|
| 33 |
+
dist_launcher: null
|
| 34 |
+
dist_master_addr: localhost
|
| 35 |
+
dist_master_port: 44409
|
| 36 |
+
dist_rank: 0
|
| 37 |
+
dist_world_size: 2
|
| 38 |
+
distributed: true
|
| 39 |
+
drop_last_iter: false
|
| 40 |
+
dry_run: false
|
| 41 |
+
early_stopping_criterion:
|
| 42 |
+
- valid
|
| 43 |
+
- loss
|
| 44 |
+
- min
|
| 45 |
+
energy_extract: energy
|
| 46 |
+
energy_extract_conf:
|
| 47 |
+
fs: 48000
|
| 48 |
+
hop_length: 1024
|
| 49 |
+
n_fft: 8192
|
| 50 |
+
reduction_factor: 1
|
| 51 |
+
win_length: 4096
|
| 52 |
+
energy_normalize: global_mvn
|
| 53 |
+
energy_normalize_conf:
|
| 54 |
+
stats_file: /home/speech/Fastspeech2_HS/assamese_latest/male/model/energy_stats.npz
|
| 55 |
+
exclude_weight_decay: false
|
| 56 |
+
exclude_weight_decay_conf: {}
|
| 57 |
+
feats_extract: fbank
|
| 58 |
+
feats_extract_conf:
|
| 59 |
+
fmax: 24000
|
| 60 |
+
fmin: 0
|
| 61 |
+
fs: 48000
|
| 62 |
+
hop_length: 1024
|
| 63 |
+
n_fft: 8192
|
| 64 |
+
n_mels: 160
|
| 65 |
+
win_length: 4096
|
| 66 |
+
fold_length:
|
| 67 |
+
- 150
|
| 68 |
+
- 819200
|
| 69 |
+
freeze_param: []
|
| 70 |
+
g2p: null
|
| 71 |
+
grad_clip: 1.0
|
| 72 |
+
grad_clip_type: 2.0
|
| 73 |
+
grad_noise: false
|
| 74 |
+
ignore_init_mismatch: false
|
| 75 |
+
init_param: []
|
| 76 |
+
iterator_type: sequence
|
| 77 |
+
keep_nbest_models: 5
|
| 78 |
+
local_rank: 0
|
| 79 |
+
log_interval: null
|
| 80 |
+
log_level: INFO
|
| 81 |
+
max_cache_fd: 32
|
| 82 |
+
max_cache_size: 0.0
|
| 83 |
+
max_epoch: 1000
|
| 84 |
+
model_conf: {}
|
| 85 |
+
multiple_iterator: false
|
| 86 |
+
multiprocessing_distributed: true
|
| 87 |
+
nbest_averaging_interval: 0
|
| 88 |
+
ngpu: 1
|
| 89 |
+
no_forward_run: false
|
| 90 |
+
non_linguistic_symbols: null
|
| 91 |
+
normalize: global_mvn
|
| 92 |
+
normalize_conf:
|
| 93 |
+
stats_file: /home/speech/Fastspeech2_HS/assamese_latest/male/model/feats_stats.npz
|
| 94 |
+
num_att_plot: 3
|
| 95 |
+
num_cache_chunks: 1024
|
| 96 |
+
num_iters_per_epoch: 800
|
| 97 |
+
num_workers: 1
|
| 98 |
+
odim: null
|
| 99 |
+
optim: adam
|
| 100 |
+
optim_conf:
|
| 101 |
+
lr: 1.0
|
| 102 |
+
output_dir: exp/tts_train_fastspeech2_raw_char_None
|
| 103 |
+
patience: null
|
| 104 |
+
pitch_extract: dio
|
| 105 |
+
pitch_extract_conf:
|
| 106 |
+
f0max: 350
|
| 107 |
+
f0min: 40
|
| 108 |
+
fs: 48000
|
| 109 |
+
hop_length: 1024
|
| 110 |
+
n_fft: 8192
|
| 111 |
+
reduction_factor: 1
|
| 112 |
+
pitch_normalize: global_mvn
|
| 113 |
+
pitch_normalize_conf:
|
| 114 |
+
stats_file: /home/speech/Fastspeech2_HS/assamese_latest/male/model/pitch_stats.npz
|
| 115 |
+
pretrain_path: null
|
| 116 |
+
print_config: false
|
| 117 |
+
required:
|
| 118 |
+
- output_dir
|
| 119 |
+
- token_list
|
| 120 |
+
resume: true
|
| 121 |
+
save_strategy: all
|
| 122 |
+
scheduler: noamlr
|
| 123 |
+
scheduler_conf:
|
| 124 |
+
model_size: 384
|
| 125 |
+
warmup_steps: 4000
|
| 126 |
+
seed: 0
|
| 127 |
+
sharded_ddp: false
|
| 128 |
+
shuffle_within_batch: false
|
| 129 |
+
sort_batch: descending
|
| 130 |
+
sort_in_batch: descending
|
| 131 |
+
token_list:
|
| 132 |
+
- <blank>
|
| 133 |
+
- <unk>
|
| 134 |
+
- <space>
|
| 135 |
+
- $
|
| 136 |
+
- ','
|
| 137 |
+
- .
|
| 138 |
+
- M
|
| 139 |
+
- q
|
| 140 |
+
- H
|
| 141 |
+
- k
|
| 142 |
+
- "\u0916"
|
| 143 |
+
- g
|
| 144 |
+
- "\u0918"
|
| 145 |
+
- "\u0919"
|
| 146 |
+
- c
|
| 147 |
+
- C
|
| 148 |
+
- j
|
| 149 |
+
- J
|
| 150 |
+
- "\u091E"
|
| 151 |
+
- "\u091F"
|
| 152 |
+
- "\u0920"
|
| 153 |
+
- "\u0921"
|
| 154 |
+
- "\u0922"
|
| 155 |
+
- "\u0923"
|
| 156 |
+
- t
|
| 157 |
+
- "\u0925"
|
| 158 |
+
- d
|
| 159 |
+
- "\u0927"
|
| 160 |
+
- n
|
| 161 |
+
- "\u0929"
|
| 162 |
+
- p
|
| 163 |
+
- P
|
| 164 |
+
- b
|
| 165 |
+
- B
|
| 166 |
+
- m
|
| 167 |
+
- y
|
| 168 |
+
- r
|
| 169 |
+
- "\u0931"
|
| 170 |
+
- l
|
| 171 |
+
- "\u0D33"
|
| 172 |
+
- Z
|
| 173 |
+
- w
|
| 174 |
+
- "\u0936"
|
| 175 |
+
- "\u0937"
|
| 176 |
+
- s
|
| 177 |
+
- h
|
| 178 |
+
- Y
|
| 179 |
+
- "\u093D"
|
| 180 |
+
- "\u0915"
|
| 181 |
+
- K
|
| 182 |
+
- G
|
| 183 |
+
- z
|
| 184 |
+
- D
|
| 185 |
+
- T
|
| 186 |
+
- f
|
| 187 |
+
- "\u0960"
|
| 188 |
+
- "\u0D7A"
|
| 189 |
+
- N
|
| 190 |
+
- "\u0D7C"
|
| 191 |
+
- "\u0D7D"
|
| 192 |
+
- "\u0D7E"
|
| 193 |
+
- a
|
| 194 |
+
- A
|
| 195 |
+
- i
|
| 196 |
+
- I
|
| 197 |
+
- u
|
| 198 |
+
- U
|
| 199 |
+
- R
|
| 200 |
+
- "\u090D"
|
| 201 |
+
- e
|
| 202 |
+
- E
|
| 203 |
+
- "\u0910"
|
| 204 |
+
- "\u0911"
|
| 205 |
+
- o
|
| 206 |
+
- O
|
| 207 |
+
- "\u0914"
|
| 208 |
+
- "\u0B89"
|
| 209 |
+
- <sos/eos>
|
| 210 |
+
token_type: char
|
| 211 |
+
train_data_path_and_name_and_type:
|
| 212 |
+
- - dump/raw/tr_no_dev/text
|
| 213 |
+
- text
|
| 214 |
+
- text
|
| 215 |
+
- - duration_info/tr_no_dev/durations
|
| 216 |
+
- durations
|
| 217 |
+
- text_int
|
| 218 |
+
- - dump/raw/tr_no_dev/wav.scp
|
| 219 |
+
- speech
|
| 220 |
+
- sound
|
| 221 |
+
- - exp/tts_stats_raw_char_None/train/collect_feats/pitch.scp
|
| 222 |
+
- pitch
|
| 223 |
+
- npy
|
| 224 |
+
- - exp/tts_stats_raw_char_None/train/collect_feats/energy.scp
|
| 225 |
+
- energy
|
| 226 |
+
- npy
|
| 227 |
+
train_dtype: float32
|
| 228 |
+
train_shape_file:
|
| 229 |
+
- exp/tts_stats_raw_char_None/train/text_shape.char
|
| 230 |
+
- exp/tts_stats_raw_char_None/train/speech_shape
|
| 231 |
+
tts: fastspeech2
|
| 232 |
+
tts_conf:
|
| 233 |
+
adim: 384
|
| 234 |
+
aheads: 2
|
| 235 |
+
decoder_normalize_before: true
|
| 236 |
+
dlayers: 4
|
| 237 |
+
dunits: 1536
|
| 238 |
+
duration_predictor_chans: 256
|
| 239 |
+
duration_predictor_kernel_size: 3
|
| 240 |
+
duration_predictor_layers: 2
|
| 241 |
+
elayers: 4
|
| 242 |
+
encoder_normalize_before: true
|
| 243 |
+
energy_embed_dropout: 0.0
|
| 244 |
+
energy_embed_kernel_size: 1
|
| 245 |
+
energy_predictor_chans: 256
|
| 246 |
+
energy_predictor_dropout: 0.5
|
| 247 |
+
energy_predictor_kernel_size: 3
|
| 248 |
+
energy_predictor_layers: 2
|
| 249 |
+
eunits: 1536
|
| 250 |
+
init_dec_alpha: 1.0
|
| 251 |
+
init_enc_alpha: 1.0
|
| 252 |
+
init_type: xavier_uniform
|
| 253 |
+
pitch_embed_dropout: 0.0
|
| 254 |
+
pitch_embed_kernel_size: 1
|
| 255 |
+
pitch_predictor_chans: 256
|
| 256 |
+
pitch_predictor_dropout: 0.5
|
| 257 |
+
pitch_predictor_kernel_size: 5
|
| 258 |
+
pitch_predictor_layers: 5
|
| 259 |
+
positionwise_conv_kernel_size: 3
|
| 260 |
+
positionwise_layer_type: conv1d
|
| 261 |
+
postnet_chans: 256
|
| 262 |
+
postnet_filts: 5
|
| 263 |
+
postnet_layers: 5
|
| 264 |
+
reduction_factor: 1
|
| 265 |
+
stop_gradient_from_energy_predictor: false
|
| 266 |
+
stop_gradient_from_pitch_predictor: true
|
| 267 |
+
transformer_dec_attn_dropout_rate: 0.2
|
| 268 |
+
transformer_dec_dropout_rate: 0.2
|
| 269 |
+
transformer_dec_positional_dropout_rate: 0.2
|
| 270 |
+
transformer_enc_attn_dropout_rate: 0.2
|
| 271 |
+
transformer_enc_dropout_rate: 0.2
|
| 272 |
+
transformer_enc_positional_dropout_rate: 0.2
|
| 273 |
+
use_masking: true
|
| 274 |
+
use_scaled_pos_enc: true
|
| 275 |
+
unused_parameters: false
|
| 276 |
+
use_adapter: false
|
| 277 |
+
use_amp: false
|
| 278 |
+
use_matplotlib: true
|
| 279 |
+
use_preprocessor: true
|
| 280 |
+
use_tensorboard: true
|
| 281 |
+
use_wandb: false
|
| 282 |
+
val_scheduler_criterion:
|
| 283 |
+
- valid
|
| 284 |
+
- loss
|
| 285 |
+
valid_batch_bins: null
|
| 286 |
+
valid_batch_size: null
|
| 287 |
+
valid_batch_type: null
|
| 288 |
+
valid_data_path_and_name_and_type:
|
| 289 |
+
- - dump/raw/dev/text
|
| 290 |
+
- text
|
| 291 |
+
- text
|
| 292 |
+
- - duration_info/dev/durations
|
| 293 |
+
- durations
|
| 294 |
+
- text_int
|
| 295 |
+
- - dump/raw/dev/wav.scp
|
| 296 |
+
- speech
|
| 297 |
+
- sound
|
| 298 |
+
- - exp/tts_stats_raw_char_None/valid/collect_feats/pitch.scp
|
| 299 |
+
- pitch
|
| 300 |
+
- npy
|
| 301 |
+
- - exp/tts_stats_raw_char_None/valid/collect_feats/energy.scp
|
| 302 |
+
- energy
|
| 303 |
+
- npy
|
| 304 |
+
valid_iterator_type: null
|
| 305 |
+
valid_max_cache_size: null
|
| 306 |
+
valid_shape_file:
|
| 307 |
+
- exp/tts_stats_raw_char_None/valid/text_shape.char
|
| 308 |
+
- exp/tts_stats_raw_char_None/valid/speech_shape
|
| 309 |
+
version: '202402'
|
| 310 |
+
wandb_entity: null
|
| 311 |
+
wandb_id: null
|
| 312 |
+
wandb_model_log_interval: -1
|
| 313 |
+
wandb_name: null
|
| 314 |
+
wandb_project: null
|
| 315 |
+
write_collected_feats: false
|
assamese_latest/male/model/energy_stats.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a64d5dd4ee24ad1b403ad07911b9e30f4d482f97c331b844272725617fb941a6
|
| 3 |
+
size 770
|
assamese_latest/male/model/feats_stats.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ecbb77de18a76f7e991b256a042acc361aa338498daa52048978ea050a9fd528
|
| 3 |
+
size 2042
|
assamese_latest/male/model/feats_type
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
raw
|
assamese_latest/male/model/model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0f52c3b1c4edd258dbd9e46920896bc0215cfe5c78957e3ee2a25de6f3ef916b
|
| 3 |
+
size 152128410
|
assamese_latest/male/model/pitch_stats.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:47de3b8ee9c740a5f24ceafcbe9b3486dfd4b3676d95282d7ce97c1116d834fd
|
| 3 |
+
size 770
|
bengali_latest/male/model/config.yaml
ADDED
|
@@ -0,0 +1,315 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
accum_grad: 8
|
| 2 |
+
adapter: lora
|
| 3 |
+
adapter_conf: {}
|
| 4 |
+
allow_multi_rates: false
|
| 5 |
+
allow_variable_data_keys: false
|
| 6 |
+
batch_bins: 3000000
|
| 7 |
+
batch_size: 20
|
| 8 |
+
batch_type: numel
|
| 9 |
+
best_model_criterion:
|
| 10 |
+
- - valid
|
| 11 |
+
- loss
|
| 12 |
+
- min
|
| 13 |
+
- - train
|
| 14 |
+
- loss
|
| 15 |
+
- min
|
| 16 |
+
bpemodel: null
|
| 17 |
+
chunk_default_fs: null
|
| 18 |
+
chunk_discard_short_samples: true
|
| 19 |
+
chunk_excluded_key_prefixes: []
|
| 20 |
+
chunk_length: 500
|
| 21 |
+
chunk_max_abs_length: null
|
| 22 |
+
chunk_shift_ratio: 0.5
|
| 23 |
+
cleaner: null
|
| 24 |
+
collect_stats: false
|
| 25 |
+
config: conf/tuning/train_fastspeech2.yaml
|
| 26 |
+
create_graph_in_tensorboard: false
|
| 27 |
+
cudnn_benchmark: false
|
| 28 |
+
cudnn_deterministic: true
|
| 29 |
+
cudnn_enabled: true
|
| 30 |
+
detect_anomaly: false
|
| 31 |
+
dist_backend: nccl
|
| 32 |
+
dist_init_method: env://
|
| 33 |
+
dist_launcher: null
|
| 34 |
+
dist_master_addr: localhost
|
| 35 |
+
dist_master_port: 38255
|
| 36 |
+
dist_rank: 0
|
| 37 |
+
dist_world_size: 2
|
| 38 |
+
distributed: true
|
| 39 |
+
drop_last_iter: false
|
| 40 |
+
dry_run: false
|
| 41 |
+
early_stopping_criterion:
|
| 42 |
+
- valid
|
| 43 |
+
- loss
|
| 44 |
+
- min
|
| 45 |
+
energy_extract: energy
|
| 46 |
+
energy_extract_conf:
|
| 47 |
+
fs: 48000
|
| 48 |
+
hop_length: 1024
|
| 49 |
+
n_fft: 8192
|
| 50 |
+
reduction_factor: 1
|
| 51 |
+
win_length: 4096
|
| 52 |
+
energy_normalize: global_mvn
|
| 53 |
+
energy_normalize_conf:
|
| 54 |
+
stats_file: /home/speech/Fastspeech2_latest models/Fastspeech2_HS/bengali_latest/male/model/energy_stats.npz
|
| 55 |
+
exclude_weight_decay: false
|
| 56 |
+
exclude_weight_decay_conf: {}
|
| 57 |
+
feats_extract: fbank
|
| 58 |
+
feats_extract_conf:
|
| 59 |
+
fmax: 24000
|
| 60 |
+
fmin: 0
|
| 61 |
+
fs: 48000
|
| 62 |
+
hop_length: 1024
|
| 63 |
+
n_fft: 8192
|
| 64 |
+
n_mels: 160
|
| 65 |
+
win_length: 4096
|
| 66 |
+
fold_length:
|
| 67 |
+
- 150
|
| 68 |
+
- 819200
|
| 69 |
+
freeze_param: []
|
| 70 |
+
g2p: null
|
| 71 |
+
grad_clip: 1.0
|
| 72 |
+
grad_clip_type: 2.0
|
| 73 |
+
grad_noise: false
|
| 74 |
+
ignore_init_mismatch: false
|
| 75 |
+
init_param: []
|
| 76 |
+
iterator_type: sequence
|
| 77 |
+
keep_nbest_models: 5
|
| 78 |
+
local_rank: 0
|
| 79 |
+
log_interval: null
|
| 80 |
+
log_level: INFO
|
| 81 |
+
max_cache_fd: 32
|
| 82 |
+
max_cache_size: 0.0
|
| 83 |
+
max_epoch: 1000
|
| 84 |
+
model_conf: {}
|
| 85 |
+
multiple_iterator: false
|
| 86 |
+
multiprocessing_distributed: true
|
| 87 |
+
nbest_averaging_interval: 0
|
| 88 |
+
ngpu: 1
|
| 89 |
+
no_forward_run: false
|
| 90 |
+
non_linguistic_symbols: null
|
| 91 |
+
normalize: global_mvn
|
| 92 |
+
normalize_conf:
|
| 93 |
+
stats_file: /home/speech/Fastspeech2_latest models/Fastspeech2_HS/bengali_latest/male/model/feats_stats.npz
|
| 94 |
+
num_att_plot: 3
|
| 95 |
+
num_cache_chunks: 1024
|
| 96 |
+
num_iters_per_epoch: 800
|
| 97 |
+
num_workers: 1
|
| 98 |
+
odim: null
|
| 99 |
+
optim: adam
|
| 100 |
+
optim_conf:
|
| 101 |
+
lr: 1.0
|
| 102 |
+
output_dir: exp/tts_train_fastspeech2_raw_char_None
|
| 103 |
+
patience: null
|
| 104 |
+
pitch_extract: dio
|
| 105 |
+
pitch_extract_conf:
|
| 106 |
+
f0max: 350
|
| 107 |
+
f0min: 40
|
| 108 |
+
fs: 48000
|
| 109 |
+
hop_length: 1024
|
| 110 |
+
n_fft: 8192
|
| 111 |
+
reduction_factor: 1
|
| 112 |
+
pitch_normalize: global_mvn
|
| 113 |
+
pitch_normalize_conf:
|
| 114 |
+
stats_file: /home/speech/Fastspeech2_latest models/Fastspeech2_HS/bengali_latest/male/model/pitch_stats.npz
|
| 115 |
+
pretrain_path: null
|
| 116 |
+
print_config: false
|
| 117 |
+
required:
|
| 118 |
+
- output_dir
|
| 119 |
+
- token_list
|
| 120 |
+
resume: true
|
| 121 |
+
save_strategy: all
|
| 122 |
+
scheduler: noamlr
|
| 123 |
+
scheduler_conf:
|
| 124 |
+
model_size: 384
|
| 125 |
+
warmup_steps: 4000
|
| 126 |
+
seed: 0
|
| 127 |
+
sharded_ddp: false
|
| 128 |
+
shuffle_within_batch: false
|
| 129 |
+
sort_batch: descending
|
| 130 |
+
sort_in_batch: descending
|
| 131 |
+
token_list:
|
| 132 |
+
- <blank>
|
| 133 |
+
- <unk>
|
| 134 |
+
- <space>
|
| 135 |
+
- $
|
| 136 |
+
- ','
|
| 137 |
+
- .
|
| 138 |
+
- M
|
| 139 |
+
- q
|
| 140 |
+
- H
|
| 141 |
+
- k
|
| 142 |
+
- "\u0916"
|
| 143 |
+
- g
|
| 144 |
+
- "\u0918"
|
| 145 |
+
- "\u0919"
|
| 146 |
+
- c
|
| 147 |
+
- C
|
| 148 |
+
- j
|
| 149 |
+
- J
|
| 150 |
+
- "\u091E"
|
| 151 |
+
- "\u091F"
|
| 152 |
+
- "\u0920"
|
| 153 |
+
- "\u0921"
|
| 154 |
+
- "\u0922"
|
| 155 |
+
- "\u0923"
|
| 156 |
+
- t
|
| 157 |
+
- "\u0925"
|
| 158 |
+
- d
|
| 159 |
+
- "\u0927"
|
| 160 |
+
- n
|
| 161 |
+
- "\u0929"
|
| 162 |
+
- p
|
| 163 |
+
- P
|
| 164 |
+
- b
|
| 165 |
+
- B
|
| 166 |
+
- m
|
| 167 |
+
- y
|
| 168 |
+
- r
|
| 169 |
+
- "\u0931"
|
| 170 |
+
- l
|
| 171 |
+
- "\u0D33"
|
| 172 |
+
- Z
|
| 173 |
+
- w
|
| 174 |
+
- "\u0936"
|
| 175 |
+
- "\u0937"
|
| 176 |
+
- s
|
| 177 |
+
- h
|
| 178 |
+
- Y
|
| 179 |
+
- "\u093D"
|
| 180 |
+
- "\u0915"
|
| 181 |
+
- K
|
| 182 |
+
- G
|
| 183 |
+
- z
|
| 184 |
+
- D
|
| 185 |
+
- T
|
| 186 |
+
- f
|
| 187 |
+
- "\u0960"
|
| 188 |
+
- "\u0D7A"
|
| 189 |
+
- N
|
| 190 |
+
- "\u0D7C"
|
| 191 |
+
- "\u0D7D"
|
| 192 |
+
- "\u0D7E"
|
| 193 |
+
- a
|
| 194 |
+
- A
|
| 195 |
+
- i
|
| 196 |
+
- I
|
| 197 |
+
- u
|
| 198 |
+
- U
|
| 199 |
+
- R
|
| 200 |
+
- "\u090D"
|
| 201 |
+
- e
|
| 202 |
+
- E
|
| 203 |
+
- "\u0910"
|
| 204 |
+
- "\u0911"
|
| 205 |
+
- o
|
| 206 |
+
- O
|
| 207 |
+
- "\u0914"
|
| 208 |
+
- "\u0B89"
|
| 209 |
+
- <sos/eos>
|
| 210 |
+
token_type: char
|
| 211 |
+
train_data_path_and_name_and_type:
|
| 212 |
+
- - dump/raw/tr_no_dev/text
|
| 213 |
+
- text
|
| 214 |
+
- text
|
| 215 |
+
- - duration_info/tr_no_dev/durations
|
| 216 |
+
- durations
|
| 217 |
+
- text_int
|
| 218 |
+
- - dump/raw/tr_no_dev/wav.scp
|
| 219 |
+
- speech
|
| 220 |
+
- sound
|
| 221 |
+
- - exp/tts_stats_raw_char_None/train/collect_feats/pitch.scp
|
| 222 |
+
- pitch
|
| 223 |
+
- npy
|
| 224 |
+
- - exp/tts_stats_raw_char_None/train/collect_feats/energy.scp
|
| 225 |
+
- energy
|
| 226 |
+
- npy
|
| 227 |
+
train_dtype: float32
|
| 228 |
+
train_shape_file:
|
| 229 |
+
- exp/tts_stats_raw_char_None/train/text_shape.char
|
| 230 |
+
- exp/tts_stats_raw_char_None/train/speech_shape
|
| 231 |
+
tts: fastspeech2
|
| 232 |
+
tts_conf:
|
| 233 |
+
adim: 384
|
| 234 |
+
aheads: 2
|
| 235 |
+
decoder_normalize_before: true
|
| 236 |
+
dlayers: 4
|
| 237 |
+
dunits: 1536
|
| 238 |
+
duration_predictor_chans: 256
|
| 239 |
+
duration_predictor_kernel_size: 3
|
| 240 |
+
duration_predictor_layers: 2
|
| 241 |
+
elayers: 4
|
| 242 |
+
encoder_normalize_before: true
|
| 243 |
+
energy_embed_dropout: 0.0
|
| 244 |
+
energy_embed_kernel_size: 1
|
| 245 |
+
energy_predictor_chans: 256
|
| 246 |
+
energy_predictor_dropout: 0.5
|
| 247 |
+
energy_predictor_kernel_size: 3
|
| 248 |
+
energy_predictor_layers: 2
|
| 249 |
+
eunits: 1536
|
| 250 |
+
init_dec_alpha: 1.0
|
| 251 |
+
init_enc_alpha: 1.0
|
| 252 |
+
init_type: xavier_uniform
|
| 253 |
+
pitch_embed_dropout: 0.0
|
| 254 |
+
pitch_embed_kernel_size: 1
|
| 255 |
+
pitch_predictor_chans: 256
|
| 256 |
+
pitch_predictor_dropout: 0.5
|
| 257 |
+
pitch_predictor_kernel_size: 5
|
| 258 |
+
pitch_predictor_layers: 5
|
| 259 |
+
positionwise_conv_kernel_size: 3
|
| 260 |
+
positionwise_layer_type: conv1d
|
| 261 |
+
postnet_chans: 256
|
| 262 |
+
postnet_filts: 5
|
| 263 |
+
postnet_layers: 5
|
| 264 |
+
reduction_factor: 1
|
| 265 |
+
stop_gradient_from_energy_predictor: false
|
| 266 |
+
stop_gradient_from_pitch_predictor: true
|
| 267 |
+
transformer_dec_attn_dropout_rate: 0.2
|
| 268 |
+
transformer_dec_dropout_rate: 0.2
|
| 269 |
+
transformer_dec_positional_dropout_rate: 0.2
|
| 270 |
+
transformer_enc_attn_dropout_rate: 0.2
|
| 271 |
+
transformer_enc_dropout_rate: 0.2
|
| 272 |
+
transformer_enc_positional_dropout_rate: 0.2
|
| 273 |
+
use_masking: true
|
| 274 |
+
use_scaled_pos_enc: true
|
| 275 |
+
unused_parameters: false
|
| 276 |
+
use_adapter: false
|
| 277 |
+
use_amp: false
|
| 278 |
+
use_matplotlib: true
|
| 279 |
+
use_preprocessor: true
|
| 280 |
+
use_tensorboard: true
|
| 281 |
+
use_wandb: false
|
| 282 |
+
val_scheduler_criterion:
|
| 283 |
+
- valid
|
| 284 |
+
- loss
|
| 285 |
+
valid_batch_bins: null
|
| 286 |
+
valid_batch_size: null
|
| 287 |
+
valid_batch_type: null
|
| 288 |
+
valid_data_path_and_name_and_type:
|
| 289 |
+
- - dump/raw/dev/text
|
| 290 |
+
- text
|
| 291 |
+
- text
|
| 292 |
+
- - duration_info/dev/durations
|
| 293 |
+
- durations
|
| 294 |
+
- text_int
|
| 295 |
+
- - dump/raw/dev/wav.scp
|
| 296 |
+
- speech
|
| 297 |
+
- sound
|
| 298 |
+
- - exp/tts_stats_raw_char_None/valid/collect_feats/pitch.scp
|
| 299 |
+
- pitch
|
| 300 |
+
- npy
|
| 301 |
+
- - exp/tts_stats_raw_char_None/valid/collect_feats/energy.scp
|
| 302 |
+
- energy
|
| 303 |
+
- npy
|
| 304 |
+
valid_iterator_type: null
|
| 305 |
+
valid_max_cache_size: null
|
| 306 |
+
valid_shape_file:
|
| 307 |
+
- exp/tts_stats_raw_char_None/valid/text_shape.char
|
| 308 |
+
- exp/tts_stats_raw_char_None/valid/speech_shape
|
| 309 |
+
version: '202402'
|
| 310 |
+
wandb_entity: null
|
| 311 |
+
wandb_id: null
|
| 312 |
+
wandb_model_log_interval: -1
|
| 313 |
+
wandb_name: null
|
| 314 |
+
wandb_project: null
|
| 315 |
+
write_collected_feats: false
|
bengali_latest/male/model/energy_stats.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4e0ff72de15d28f934bf95054d8c82210dbfdbe9114780b92f536a4cfd908358
|
| 3 |
+
size 770
|
bengali_latest/male/model/feats_stats.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e63bfa54c96d7998cc22e479118fb7be8a5a9a1fae9508c210fd3f00065e0945
|
| 3 |
+
size 2042
|
bengali_latest/male/model/model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e131b107524777db0ae4f2578856b9baba42c2ed944433c7d5a086c56f0973e8
|
| 3 |
+
size 152128410
|
bengali_latest/male/model/pitch_stats.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:508206b876c66ec155e6473527155c24ed06d65f8a23963e5bec908a27be018f
|
| 3 |
+
size 770
|
bodo_latest/female/model/config.yaml
ADDED
|
@@ -0,0 +1,319 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
config: conf/tuning/train_fastspeech2.yaml
|
| 2 |
+
print_config: false
|
| 3 |
+
log_level: INFO
|
| 4 |
+
drop_last_iter: false
|
| 5 |
+
dry_run: false
|
| 6 |
+
iterator_type: sequence
|
| 7 |
+
valid_iterator_type: null
|
| 8 |
+
output_dir: exp/tts_train_fastspeech2_raw_char_None
|
| 9 |
+
ngpu: 1
|
| 10 |
+
seed: 0
|
| 11 |
+
num_workers: 1
|
| 12 |
+
num_att_plot: 3
|
| 13 |
+
dist_backend: nccl
|
| 14 |
+
dist_init_method: env://
|
| 15 |
+
dist_world_size: 2
|
| 16 |
+
dist_rank: 0
|
| 17 |
+
local_rank: 0
|
| 18 |
+
dist_master_addr: localhost
|
| 19 |
+
dist_master_port: 40847
|
| 20 |
+
dist_launcher: null
|
| 21 |
+
multiprocessing_distributed: true
|
| 22 |
+
unused_parameters: false
|
| 23 |
+
sharded_ddp: false
|
| 24 |
+
use_deepspeed: false
|
| 25 |
+
deepspeed_config: null
|
| 26 |
+
cudnn_enabled: true
|
| 27 |
+
cudnn_benchmark: false
|
| 28 |
+
cudnn_deterministic: true
|
| 29 |
+
use_tf32: false
|
| 30 |
+
collect_stats: false
|
| 31 |
+
write_collected_feats: false
|
| 32 |
+
max_epoch: 1000
|
| 33 |
+
patience: null
|
| 34 |
+
val_scheduler_criterion:
|
| 35 |
+
- valid
|
| 36 |
+
- loss
|
| 37 |
+
early_stopping_criterion:
|
| 38 |
+
- valid
|
| 39 |
+
- loss
|
| 40 |
+
- min
|
| 41 |
+
best_model_criterion:
|
| 42 |
+
- - valid
|
| 43 |
+
- loss
|
| 44 |
+
- min
|
| 45 |
+
- - train
|
| 46 |
+
- loss
|
| 47 |
+
- min
|
| 48 |
+
keep_nbest_models: 5
|
| 49 |
+
nbest_averaging_interval: 0
|
| 50 |
+
grad_clip: 1.0
|
| 51 |
+
grad_clip_type: 2.0
|
| 52 |
+
grad_noise: false
|
| 53 |
+
accum_grad: 8
|
| 54 |
+
no_forward_run: false
|
| 55 |
+
resume: true
|
| 56 |
+
train_dtype: float32
|
| 57 |
+
use_amp: false
|
| 58 |
+
log_interval: null
|
| 59 |
+
use_matplotlib: true
|
| 60 |
+
use_tensorboard: true
|
| 61 |
+
create_graph_in_tensorboard: false
|
| 62 |
+
use_wandb: false
|
| 63 |
+
wandb_project: null
|
| 64 |
+
wandb_id: null
|
| 65 |
+
wandb_entity: null
|
| 66 |
+
wandb_name: null
|
| 67 |
+
wandb_model_log_interval: -1
|
| 68 |
+
detect_anomaly: false
|
| 69 |
+
use_adapter: false
|
| 70 |
+
adapter: lora
|
| 71 |
+
save_strategy: all
|
| 72 |
+
adapter_conf: {}
|
| 73 |
+
pretrain_path: null
|
| 74 |
+
init_param: []
|
| 75 |
+
ignore_init_mismatch: false
|
| 76 |
+
freeze_param: []
|
| 77 |
+
num_iters_per_epoch: 800
|
| 78 |
+
batch_size: 20
|
| 79 |
+
valid_batch_size: null
|
| 80 |
+
batch_bins: 3000000
|
| 81 |
+
valid_batch_bins: null
|
| 82 |
+
train_shape_file:
|
| 83 |
+
- exp/tts_stats_raw_char_None/train/text_shape.char
|
| 84 |
+
- exp/tts_stats_raw_char_None/train/speech_shape
|
| 85 |
+
valid_shape_file:
|
| 86 |
+
- exp/tts_stats_raw_char_None/valid/text_shape.char
|
| 87 |
+
- exp/tts_stats_raw_char_None/valid/speech_shape
|
| 88 |
+
batch_type: numel
|
| 89 |
+
valid_batch_type: null
|
| 90 |
+
fold_length:
|
| 91 |
+
- 150
|
| 92 |
+
- 819200
|
| 93 |
+
sort_in_batch: descending
|
| 94 |
+
shuffle_within_batch: false
|
| 95 |
+
sort_batch: descending
|
| 96 |
+
multiple_iterator: false
|
| 97 |
+
chunk_length: 500
|
| 98 |
+
chunk_shift_ratio: 0.5
|
| 99 |
+
num_cache_chunks: 1024
|
| 100 |
+
chunk_excluded_key_prefixes: []
|
| 101 |
+
chunk_default_fs: null
|
| 102 |
+
chunk_max_abs_length: null
|
| 103 |
+
chunk_discard_short_samples: true
|
| 104 |
+
train_data_path_and_name_and_type:
|
| 105 |
+
- - dump/raw/tr_no_dev/text
|
| 106 |
+
- text
|
| 107 |
+
- text
|
| 108 |
+
- - duration_info/tr_no_dev/durations
|
| 109 |
+
- durations
|
| 110 |
+
- text_int
|
| 111 |
+
- - dump/raw/tr_no_dev/wav.scp
|
| 112 |
+
- speech
|
| 113 |
+
- sound
|
| 114 |
+
- - exp/tts_stats_raw_char_None/train/collect_feats/pitch.scp
|
| 115 |
+
- pitch
|
| 116 |
+
- npy
|
| 117 |
+
- - exp/tts_stats_raw_char_None/train/collect_feats/energy.scp
|
| 118 |
+
- energy
|
| 119 |
+
- npy
|
| 120 |
+
valid_data_path_and_name_and_type:
|
| 121 |
+
- - dump/raw/dev/text
|
| 122 |
+
- text
|
| 123 |
+
- text
|
| 124 |
+
- - duration_info/dev/durations
|
| 125 |
+
- durations
|
| 126 |
+
- text_int
|
| 127 |
+
- - dump/raw/dev/wav.scp
|
| 128 |
+
- speech
|
| 129 |
+
- sound
|
| 130 |
+
- - exp/tts_stats_raw_char_None/valid/collect_feats/pitch.scp
|
| 131 |
+
- pitch
|
| 132 |
+
- npy
|
| 133 |
+
- - exp/tts_stats_raw_char_None/valid/collect_feats/energy.scp
|
| 134 |
+
- energy
|
| 135 |
+
- npy
|
| 136 |
+
multi_task_dataset: false
|
| 137 |
+
allow_variable_data_keys: false
|
| 138 |
+
max_cache_size: 0.0
|
| 139 |
+
max_cache_fd: 32
|
| 140 |
+
allow_multi_rates: false
|
| 141 |
+
valid_max_cache_size: null
|
| 142 |
+
exclude_weight_decay: false
|
| 143 |
+
exclude_weight_decay_conf: {}
|
| 144 |
+
optim: adam
|
| 145 |
+
optim_conf:
|
| 146 |
+
lr: 1.0
|
| 147 |
+
scheduler: noamlr
|
| 148 |
+
scheduler_conf:
|
| 149 |
+
model_size: 384
|
| 150 |
+
warmup_steps: 4000
|
| 151 |
+
token_list:
|
| 152 |
+
- <blank>
|
| 153 |
+
- <unk>
|
| 154 |
+
- <space>
|
| 155 |
+
- $
|
| 156 |
+
- ','
|
| 157 |
+
- .
|
| 158 |
+
- M
|
| 159 |
+
- q
|
| 160 |
+
- H
|
| 161 |
+
- k
|
| 162 |
+
- ख
|
| 163 |
+
- g
|
| 164 |
+
- घ
|
| 165 |
+
- ङ
|
| 166 |
+
- c
|
| 167 |
+
- C
|
| 168 |
+
- j
|
| 169 |
+
- J
|
| 170 |
+
- ञ
|
| 171 |
+
- ट
|
| 172 |
+
- ठ
|
| 173 |
+
- ड
|
| 174 |
+
- ढ
|
| 175 |
+
- ण
|
| 176 |
+
- t
|
| 177 |
+
- थ
|
| 178 |
+
- d
|
| 179 |
+
- ध
|
| 180 |
+
- n
|
| 181 |
+
- ऩ
|
| 182 |
+
- p
|
| 183 |
+
- P
|
| 184 |
+
- b
|
| 185 |
+
- B
|
| 186 |
+
- m
|
| 187 |
+
- y
|
| 188 |
+
- r
|
| 189 |
+
- ऱ
|
| 190 |
+
- l
|
| 191 |
+
- ള
|
| 192 |
+
- Z
|
| 193 |
+
- w
|
| 194 |
+
- श
|
| 195 |
+
- ष
|
| 196 |
+
- s
|
| 197 |
+
- h
|
| 198 |
+
- Y
|
| 199 |
+
- ऽ
|
| 200 |
+
- क
|
| 201 |
+
- K
|
| 202 |
+
- G
|
| 203 |
+
- z
|
| 204 |
+
- D
|
| 205 |
+
- T
|
| 206 |
+
- f
|
| 207 |
+
- ॠ
|
| 208 |
+
- ൺ
|
| 209 |
+
- N
|
| 210 |
+
- ർ
|
| 211 |
+
- ൽ
|
| 212 |
+
- ൾ
|
| 213 |
+
- a
|
| 214 |
+
- A
|
| 215 |
+
- i
|
| 216 |
+
- I
|
| 217 |
+
- u
|
| 218 |
+
- U
|
| 219 |
+
- R
|
| 220 |
+
- ऍ
|
| 221 |
+
- e
|
| 222 |
+
- E
|
| 223 |
+
- ऐ
|
| 224 |
+
- ऑ
|
| 225 |
+
- o
|
| 226 |
+
- O
|
| 227 |
+
- औ
|
| 228 |
+
- உ
|
| 229 |
+
- <sos/eos>
|
| 230 |
+
odim: null
|
| 231 |
+
model_conf: {}
|
| 232 |
+
use_preprocessor: true
|
| 233 |
+
token_type: char
|
| 234 |
+
bpemodel: null
|
| 235 |
+
non_linguistic_symbols: null
|
| 236 |
+
cleaner: null
|
| 237 |
+
g2p: null
|
| 238 |
+
feats_extract: fbank
|
| 239 |
+
feats_extract_conf:
|
| 240 |
+
n_fft: 8192
|
| 241 |
+
hop_length: 1024
|
| 242 |
+
win_length: 4096
|
| 243 |
+
fs: 48000
|
| 244 |
+
fmin: 0
|
| 245 |
+
fmax: 24000
|
| 246 |
+
n_mels: 160
|
| 247 |
+
normalize: global_mvn
|
| 248 |
+
normalize_conf:
|
| 249 |
+
stats_file: exp/tts_stats_raw_char_None/train/feats_stats.npz
|
| 250 |
+
tts: fastspeech2
|
| 251 |
+
tts_conf:
|
| 252 |
+
adim: 384
|
| 253 |
+
aheads: 2
|
| 254 |
+
elayers: 4
|
| 255 |
+
eunits: 1536
|
| 256 |
+
dlayers: 4
|
| 257 |
+
dunits: 1536
|
| 258 |
+
positionwise_layer_type: conv1d
|
| 259 |
+
positionwise_conv_kernel_size: 3
|
| 260 |
+
duration_predictor_layers: 2
|
| 261 |
+
duration_predictor_chans: 256
|
| 262 |
+
duration_predictor_kernel_size: 3
|
| 263 |
+
postnet_layers: 5
|
| 264 |
+
postnet_filts: 5
|
| 265 |
+
postnet_chans: 256
|
| 266 |
+
use_masking: true
|
| 267 |
+
use_scaled_pos_enc: true
|
| 268 |
+
encoder_normalize_before: true
|
| 269 |
+
decoder_normalize_before: true
|
| 270 |
+
reduction_factor: 1
|
| 271 |
+
init_type: xavier_uniform
|
| 272 |
+
init_enc_alpha: 1.0
|
| 273 |
+
init_dec_alpha: 1.0
|
| 274 |
+
transformer_enc_dropout_rate: 0.2
|
| 275 |
+
transformer_enc_positional_dropout_rate: 0.2
|
| 276 |
+
transformer_enc_attn_dropout_rate: 0.2
|
| 277 |
+
transformer_dec_dropout_rate: 0.2
|
| 278 |
+
transformer_dec_positional_dropout_rate: 0.2
|
| 279 |
+
transformer_dec_attn_dropout_rate: 0.2
|
| 280 |
+
pitch_predictor_layers: 5
|
| 281 |
+
pitch_predictor_chans: 256
|
| 282 |
+
pitch_predictor_kernel_size: 5
|
| 283 |
+
pitch_predictor_dropout: 0.5
|
| 284 |
+
pitch_embed_kernel_size: 1
|
| 285 |
+
pitch_embed_dropout: 0.0
|
| 286 |
+
stop_gradient_from_pitch_predictor: true
|
| 287 |
+
energy_predictor_layers: 2
|
| 288 |
+
energy_predictor_chans: 256
|
| 289 |
+
energy_predictor_kernel_size: 3
|
| 290 |
+
energy_predictor_dropout: 0.5
|
| 291 |
+
energy_embed_kernel_size: 1
|
| 292 |
+
energy_embed_dropout: 0.0
|
| 293 |
+
stop_gradient_from_energy_predictor: false
|
| 294 |
+
pitch_extract: dio
|
| 295 |
+
pitch_extract_conf:
|
| 296 |
+
fs: 48000
|
| 297 |
+
n_fft: 8192
|
| 298 |
+
hop_length: 1024
|
| 299 |
+
f0max: 400
|
| 300 |
+
f0min: 80
|
| 301 |
+
reduction_factor: 1
|
| 302 |
+
pitch_normalize: global_mvn
|
| 303 |
+
pitch_normalize_conf:
|
| 304 |
+
stats_file: exp/tts_stats_raw_char_None/train/pitch_stats.npz
|
| 305 |
+
energy_extract: energy
|
| 306 |
+
energy_extract_conf:
|
| 307 |
+
fs: 48000
|
| 308 |
+
n_fft: 8192
|
| 309 |
+
hop_length: 1024
|
| 310 |
+
win_length: 4096
|
| 311 |
+
reduction_factor: 1
|
| 312 |
+
energy_normalize: global_mvn
|
| 313 |
+
energy_normalize_conf:
|
| 314 |
+
stats_file: exp/tts_stats_raw_char_None/train/energy_stats.npz
|
| 315 |
+
required:
|
| 316 |
+
- output_dir
|
| 317 |
+
- token_list
|
| 318 |
+
version: '202402'
|
| 319 |
+
distributed: true
|
bodo_latest/female/model/energy_stats.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f146e38995c250d297602ef8ae9a86ca151b5dbd85bd2a0c6d6fc480958825c6
|
| 3 |
+
size 770
|
bodo_latest/female/model/feats_stats.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5ac92ccb722a0ed041407e19bddde97f055e37d1108c2927c573f912b281e9f6
|
| 3 |
+
size 2042
|
bodo_latest/female/model/feats_type
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
raw
|
bodo_latest/female/model/model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3d7e1023281d3358bca078b2a218cddda8fc79aef7f0e3d47272331b8bf9645a
|
| 3 |
+
size 152129434
|
bodo_latest/female/model/pitch_stats.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:59051dd33e6f33a98737cbe4a5a220eb9af37c43d2b660f3d257f411f1128025
|
| 3 |
+
size 770
|
bodo_latest/male/model/config.yaml
ADDED
|
@@ -0,0 +1,319 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
config: conf/tuning/train_fastspeech2.yaml
|
| 2 |
+
print_config: false
|
| 3 |
+
log_level: INFO
|
| 4 |
+
drop_last_iter: false
|
| 5 |
+
dry_run: false
|
| 6 |
+
iterator_type: sequence
|
| 7 |
+
valid_iterator_type: null
|
| 8 |
+
output_dir: exp/tts_train_fastspeech2_raw_char_None
|
| 9 |
+
ngpu: 1
|
| 10 |
+
seed: 0
|
| 11 |
+
num_workers: 1
|
| 12 |
+
num_att_plot: 3
|
| 13 |
+
dist_backend: nccl
|
| 14 |
+
dist_init_method: env://
|
| 15 |
+
dist_world_size: 2
|
| 16 |
+
dist_rank: 0
|
| 17 |
+
local_rank: 0
|
| 18 |
+
dist_master_addr: localhost
|
| 19 |
+
dist_master_port: 53925
|
| 20 |
+
dist_launcher: null
|
| 21 |
+
multiprocessing_distributed: true
|
| 22 |
+
unused_parameters: false
|
| 23 |
+
sharded_ddp: false
|
| 24 |
+
use_deepspeed: false
|
| 25 |
+
deepspeed_config: null
|
| 26 |
+
cudnn_enabled: true
|
| 27 |
+
cudnn_benchmark: false
|
| 28 |
+
cudnn_deterministic: true
|
| 29 |
+
use_tf32: false
|
| 30 |
+
collect_stats: false
|
| 31 |
+
write_collected_feats: false
|
| 32 |
+
max_epoch: 1000
|
| 33 |
+
patience: null
|
| 34 |
+
val_scheduler_criterion:
|
| 35 |
+
- valid
|
| 36 |
+
- loss
|
| 37 |
+
early_stopping_criterion:
|
| 38 |
+
- valid
|
| 39 |
+
- loss
|
| 40 |
+
- min
|
| 41 |
+
best_model_criterion:
|
| 42 |
+
- - valid
|
| 43 |
+
- loss
|
| 44 |
+
- min
|
| 45 |
+
- - train
|
| 46 |
+
- loss
|
| 47 |
+
- min
|
| 48 |
+
keep_nbest_models: 5
|
| 49 |
+
nbest_averaging_interval: 0
|
| 50 |
+
grad_clip: 1.0
|
| 51 |
+
grad_clip_type: 2.0
|
| 52 |
+
grad_noise: false
|
| 53 |
+
accum_grad: 8
|
| 54 |
+
no_forward_run: false
|
| 55 |
+
resume: true
|
| 56 |
+
train_dtype: float32
|
| 57 |
+
use_amp: false
|
| 58 |
+
log_interval: null
|
| 59 |
+
use_matplotlib: true
|
| 60 |
+
use_tensorboard: true
|
| 61 |
+
create_graph_in_tensorboard: false
|
| 62 |
+
use_wandb: false
|
| 63 |
+
wandb_project: null
|
| 64 |
+
wandb_id: null
|
| 65 |
+
wandb_entity: null
|
| 66 |
+
wandb_name: null
|
| 67 |
+
wandb_model_log_interval: -1
|
| 68 |
+
detect_anomaly: false
|
| 69 |
+
use_adapter: false
|
| 70 |
+
adapter: lora
|
| 71 |
+
save_strategy: all
|
| 72 |
+
adapter_conf: {}
|
| 73 |
+
pretrain_path: null
|
| 74 |
+
init_param: []
|
| 75 |
+
ignore_init_mismatch: false
|
| 76 |
+
freeze_param: []
|
| 77 |
+
num_iters_per_epoch: 800
|
| 78 |
+
batch_size: 20
|
| 79 |
+
valid_batch_size: null
|
| 80 |
+
batch_bins: 3000000
|
| 81 |
+
valid_batch_bins: null
|
| 82 |
+
train_shape_file:
|
| 83 |
+
- exp/tts_stats_raw_char_None/train/text_shape.char
|
| 84 |
+
- exp/tts_stats_raw_char_None/train/speech_shape
|
| 85 |
+
valid_shape_file:
|
| 86 |
+
- exp/tts_stats_raw_char_None/valid/text_shape.char
|
| 87 |
+
- exp/tts_stats_raw_char_None/valid/speech_shape
|
| 88 |
+
batch_type: numel
|
| 89 |
+
valid_batch_type: null
|
| 90 |
+
fold_length:
|
| 91 |
+
- 150
|
| 92 |
+
- 819200
|
| 93 |
+
sort_in_batch: descending
|
| 94 |
+
shuffle_within_batch: false
|
| 95 |
+
sort_batch: descending
|
| 96 |
+
multiple_iterator: false
|
| 97 |
+
chunk_length: 500
|
| 98 |
+
chunk_shift_ratio: 0.5
|
| 99 |
+
num_cache_chunks: 1024
|
| 100 |
+
chunk_excluded_key_prefixes: []
|
| 101 |
+
chunk_default_fs: null
|
| 102 |
+
chunk_max_abs_length: null
|
| 103 |
+
chunk_discard_short_samples: true
|
| 104 |
+
train_data_path_and_name_and_type:
|
| 105 |
+
- - dump/raw/tr_no_dev/text
|
| 106 |
+
- text
|
| 107 |
+
- text
|
| 108 |
+
- - duration_info/tr_no_dev/durations
|
| 109 |
+
- durations
|
| 110 |
+
- text_int
|
| 111 |
+
- - dump/raw/tr_no_dev/wav.scp
|
| 112 |
+
- speech
|
| 113 |
+
- sound
|
| 114 |
+
- - exp/tts_stats_raw_char_None/train/collect_feats/pitch.scp
|
| 115 |
+
- pitch
|
| 116 |
+
- npy
|
| 117 |
+
- - exp/tts_stats_raw_char_None/train/collect_feats/energy.scp
|
| 118 |
+
- energy
|
| 119 |
+
- npy
|
| 120 |
+
valid_data_path_and_name_and_type:
|
| 121 |
+
- - dump/raw/dev/text
|
| 122 |
+
- text
|
| 123 |
+
- text
|
| 124 |
+
- - duration_info/dev/durations
|
| 125 |
+
- durations
|
| 126 |
+
- text_int
|
| 127 |
+
- - dump/raw/dev/wav.scp
|
| 128 |
+
- speech
|
| 129 |
+
- sound
|
| 130 |
+
- - exp/tts_stats_raw_char_None/valid/collect_feats/pitch.scp
|
| 131 |
+
- pitch
|
| 132 |
+
- npy
|
| 133 |
+
- - exp/tts_stats_raw_char_None/valid/collect_feats/energy.scp
|
| 134 |
+
- energy
|
| 135 |
+
- npy
|
| 136 |
+
multi_task_dataset: false
|
| 137 |
+
allow_variable_data_keys: false
|
| 138 |
+
max_cache_size: 0.0
|
| 139 |
+
max_cache_fd: 32
|
| 140 |
+
allow_multi_rates: false
|
| 141 |
+
valid_max_cache_size: null
|
| 142 |
+
exclude_weight_decay: false
|
| 143 |
+
exclude_weight_decay_conf: {}
|
| 144 |
+
optim: adam
|
| 145 |
+
optim_conf:
|
| 146 |
+
lr: 1.0
|
| 147 |
+
scheduler: noamlr
|
| 148 |
+
scheduler_conf:
|
| 149 |
+
model_size: 384
|
| 150 |
+
warmup_steps: 4000
|
| 151 |
+
token_list:
|
| 152 |
+
- <blank>
|
| 153 |
+
- <unk>
|
| 154 |
+
- <space>
|
| 155 |
+
- $
|
| 156 |
+
- ','
|
| 157 |
+
- .
|
| 158 |
+
- M
|
| 159 |
+
- q
|
| 160 |
+
- H
|
| 161 |
+
- k
|
| 162 |
+
- ख
|
| 163 |
+
- g
|
| 164 |
+
- घ
|
| 165 |
+
- ङ
|
| 166 |
+
- c
|
| 167 |
+
- C
|
| 168 |
+
- j
|
| 169 |
+
- J
|
| 170 |
+
- ञ
|
| 171 |
+
- ट
|
| 172 |
+
- ठ
|
| 173 |
+
- ड
|
| 174 |
+
- ढ
|
| 175 |
+
- ण
|
| 176 |
+
- t
|
| 177 |
+
- थ
|
| 178 |
+
- d
|
| 179 |
+
- ध
|
| 180 |
+
- n
|
| 181 |
+
- ऩ
|
| 182 |
+
- p
|
| 183 |
+
- P
|
| 184 |
+
- b
|
| 185 |
+
- B
|
| 186 |
+
- m
|
| 187 |
+
- y
|
| 188 |
+
- r
|
| 189 |
+
- ऱ
|
| 190 |
+
- l
|
| 191 |
+
- ള
|
| 192 |
+
- Z
|
| 193 |
+
- w
|
| 194 |
+
- श
|
| 195 |
+
- ष
|
| 196 |
+
- s
|
| 197 |
+
- h
|
| 198 |
+
- Y
|
| 199 |
+
- ऽ
|
| 200 |
+
- क
|
| 201 |
+
- K
|
| 202 |
+
- G
|
| 203 |
+
- z
|
| 204 |
+
- D
|
| 205 |
+
- T
|
| 206 |
+
- f
|
| 207 |
+
- ॠ
|
| 208 |
+
- ൺ
|
| 209 |
+
- N
|
| 210 |
+
- ർ
|
| 211 |
+
- ൽ
|
| 212 |
+
- ൾ
|
| 213 |
+
- a
|
| 214 |
+
- A
|
| 215 |
+
- i
|
| 216 |
+
- I
|
| 217 |
+
- u
|
| 218 |
+
- U
|
| 219 |
+
- R
|
| 220 |
+
- ऍ
|
| 221 |
+
- e
|
| 222 |
+
- E
|
| 223 |
+
- ऐ
|
| 224 |
+
- ऑ
|
| 225 |
+
- o
|
| 226 |
+
- O
|
| 227 |
+
- औ
|
| 228 |
+
- உ
|
| 229 |
+
- <sos/eos>
|
| 230 |
+
odim: null
|
| 231 |
+
model_conf: {}
|
| 232 |
+
use_preprocessor: true
|
| 233 |
+
token_type: char
|
| 234 |
+
bpemodel: null
|
| 235 |
+
non_linguistic_symbols: null
|
| 236 |
+
cleaner: null
|
| 237 |
+
g2p: null
|
| 238 |
+
feats_extract: fbank
|
| 239 |
+
feats_extract_conf:
|
| 240 |
+
n_fft: 8192
|
| 241 |
+
hop_length: 1024
|
| 242 |
+
win_length: 4096
|
| 243 |
+
fs: 48000
|
| 244 |
+
fmin: 0
|
| 245 |
+
fmax: 24000
|
| 246 |
+
n_mels: 160
|
| 247 |
+
normalize: global_mvn
|
| 248 |
+
normalize_conf:
|
| 249 |
+
stats_file: exp/tts_stats_raw_char_None/train/feats_stats.npz
|
| 250 |
+
tts: fastspeech2
|
| 251 |
+
tts_conf:
|
| 252 |
+
adim: 384
|
| 253 |
+
aheads: 2
|
| 254 |
+
elayers: 4
|
| 255 |
+
eunits: 1536
|
| 256 |
+
dlayers: 4
|
| 257 |
+
dunits: 1536
|
| 258 |
+
positionwise_layer_type: conv1d
|
| 259 |
+
positionwise_conv_kernel_size: 3
|
| 260 |
+
duration_predictor_layers: 2
|
| 261 |
+
duration_predictor_chans: 256
|
| 262 |
+
duration_predictor_kernel_size: 3
|
| 263 |
+
postnet_layers: 5
|
| 264 |
+
postnet_filts: 5
|
| 265 |
+
postnet_chans: 256
|
| 266 |
+
use_masking: true
|
| 267 |
+
use_scaled_pos_enc: true
|
| 268 |
+
encoder_normalize_before: true
|
| 269 |
+
decoder_normalize_before: true
|
| 270 |
+
reduction_factor: 1
|
| 271 |
+
init_type: xavier_uniform
|
| 272 |
+
init_enc_alpha: 1.0
|
| 273 |
+
init_dec_alpha: 1.0
|
| 274 |
+
transformer_enc_dropout_rate: 0.2
|
| 275 |
+
transformer_enc_positional_dropout_rate: 0.2
|
| 276 |
+
transformer_enc_attn_dropout_rate: 0.2
|
| 277 |
+
transformer_dec_dropout_rate: 0.2
|
| 278 |
+
transformer_dec_positional_dropout_rate: 0.2
|
| 279 |
+
transformer_dec_attn_dropout_rate: 0.2
|
| 280 |
+
pitch_predictor_layers: 5
|
| 281 |
+
pitch_predictor_chans: 256
|
| 282 |
+
pitch_predictor_kernel_size: 5
|
| 283 |
+
pitch_predictor_dropout: 0.5
|
| 284 |
+
pitch_embed_kernel_size: 1
|
| 285 |
+
pitch_embed_dropout: 0.0
|
| 286 |
+
stop_gradient_from_pitch_predictor: true
|
| 287 |
+
energy_predictor_layers: 2
|
| 288 |
+
energy_predictor_chans: 256
|
| 289 |
+
energy_predictor_kernel_size: 3
|
| 290 |
+
energy_predictor_dropout: 0.5
|
| 291 |
+
energy_embed_kernel_size: 1
|
| 292 |
+
energy_embed_dropout: 0.0
|
| 293 |
+
stop_gradient_from_energy_predictor: false
|
| 294 |
+
pitch_extract: dio
|
| 295 |
+
pitch_extract_conf:
|
| 296 |
+
fs: 48000
|
| 297 |
+
n_fft: 8192
|
| 298 |
+
hop_length: 1024
|
| 299 |
+
f0max: 350
|
| 300 |
+
f0min: 40
|
| 301 |
+
reduction_factor: 1
|
| 302 |
+
pitch_normalize: global_mvn
|
| 303 |
+
pitch_normalize_conf:
|
| 304 |
+
stats_file: exp/tts_stats_raw_char_None/train/pitch_stats.npz
|
| 305 |
+
energy_extract: energy
|
| 306 |
+
energy_extract_conf:
|
| 307 |
+
fs: 48000
|
| 308 |
+
n_fft: 8192
|
| 309 |
+
hop_length: 1024
|
| 310 |
+
win_length: 4096
|
| 311 |
+
reduction_factor: 1
|
| 312 |
+
energy_normalize: global_mvn
|
| 313 |
+
energy_normalize_conf:
|
| 314 |
+
stats_file: exp/tts_stats_raw_char_None/train/energy_stats.npz
|
| 315 |
+
required:
|
| 316 |
+
- output_dir
|
| 317 |
+
- token_list
|
| 318 |
+
version: '202402'
|
| 319 |
+
distributed: true
|
bodo_latest/male/model/energy_stats.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d2ccfd0ab92010376d6cecbf0d2d3e2e338ccb2cc1a4c44af9acd1f9bd569f9e
|
| 3 |
+
size 770
|
bodo_latest/male/model/feats_stats.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e0adb54c43f773f5c078a60c30cfba90f4b3cb02461ac3a4f9cbc638f91e2e82
|
| 3 |
+
size 2042
|
bodo_latest/male/model/feats_type
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
raw
|
bodo_latest/male/model/model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:742c513ae2866449704836faeeedb4c4e6c364a4e4d0f9ebc96f234efc084b8d
|
| 3 |
+
size 152129434
|
bodo_latest/male/model/pitch_stats.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:84a143913223f17d10f677a7b94e26ccf8d1251ff97d882fe65f33542a3d5722
|
| 3 |
+
size 770
|
charmap/Text_Cleaning.ipynb
ADDED
|
@@ -0,0 +1,332 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"cells": [
|
| 3 |
+
{
|
| 4 |
+
"cell_type": "code",
|
| 5 |
+
"execution_count": 2,
|
| 6 |
+
"metadata": {
|
| 7 |
+
"collapsed": true
|
| 8 |
+
},
|
| 9 |
+
"outputs": [],
|
| 10 |
+
"source": [
|
| 11 |
+
"############################################################\n",
|
| 12 |
+
"#Author : Bhagyashree\n",
|
| 13 |
+
"#Date : 1st Sept, 2020\n",
|
| 14 |
+
"#Purpose : Text Cleaning\n",
|
| 15 |
+
"#Input : Text file after timestamp removal\n",
|
| 16 |
+
"#Output : Text file after cleaning data\n",
|
| 17 |
+
"############################################################"
|
| 18 |
+
]
|
| 19 |
+
},
|
| 20 |
+
{
|
| 21 |
+
"cell_type": "code",
|
| 22 |
+
"execution_count": 3,
|
| 23 |
+
"metadata": {
|
| 24 |
+
"collapsed": true
|
| 25 |
+
},
|
| 26 |
+
"outputs": [],
|
| 27 |
+
"source": [
|
| 28 |
+
"import nltk\n",
|
| 29 |
+
"import numpy\n",
|
| 30 |
+
"import xlrd\n",
|
| 31 |
+
"import openpyxl \n",
|
| 32 |
+
"import re"
|
| 33 |
+
]
|
| 34 |
+
},
|
| 35 |
+
{
|
| 36 |
+
"cell_type": "code",
|
| 37 |
+
"execution_count": 21,
|
| 38 |
+
"metadata": {},
|
| 39 |
+
"outputs": [
|
| 40 |
+
{
|
| 41 |
+
"name": "stdout",
|
| 42 |
+
"output_type": "stream",
|
| 43 |
+
"text": [
|
| 44 |
+
"अब हम ऑलट्रेशन ऑफ मेमोरेंडम के बारे में बात करेंगे।\n",
|
| 45 |
+
" मेमोरेंडम के विषयों को बदल दिया जा सकता है।\n",
|
| 46 |
+
"कंपनी अधिनियम 1956 के तहत\n",
|
| 47 |
+
"निम्नलिखित प्रक्रिया के अनुसार\n",
|
| 48 |
+
"यदि कोई कंपनी अपना नाम बदलना चाहती है,\n",
|
| 49 |
+
"तो वे विशेष संकल्प में ऐसा कर सकती है।\n",
|
| 50 |
+
"और केंद्र सरकार की मंजूरी के साथ\n",
|
| 51 |
+
"लिखित में\n",
|
| 52 |
+
"हालाँकि, ऐसी किसी भी मंजूरी की आवश्यकता नहीं होती है\n",
|
| 53 |
+
"केवल कंपनी के नाम में परिवर्तन के लिए\n",
|
| 54 |
+
"बल्कि यह प्रक्रिया\n",
|
| 55 |
+
"पूरी तरह से निजी शब्द को हटाने के लिए होती है।\n",
|
| 56 |
+
"तो इस मामले में\n",
|
| 57 |
+
"एक सार्वजनिक कंपनी को एक निजी कंपनी के संबंध में,\n",
|
| 58 |
+
"या एक निजी कंपनी को एक सार्वजनिक कंपनी में परिवर्तित करने\n",
|
| 59 |
+
"दूसरी जगह पर पंजीकृत कार्यालय का दोबारा परिवर्तन किया जाना है\n",
|
| 60 |
+
"अगर एक ही शहर, कस्बे\n",
|
| 61 |
+
"या गाँव में एक जगह से\n",
|
| 62 |
+
"30 दिनों का नोटिस दिया जाना होता है।\n",
|
| 63 |
+
"यह रजिस्ट्रार द्वारा परिवर्तन की तिथि के बाद\n",
|
| 64 |
+
"होगा जो उसी को दर्ज करेगा।\n",
|
| 65 |
+
"पंजीकृत कार्यालय के परिवर्तन के मामले में\n",
|
| 66 |
+
"जबकि एक ही राज्य में 1 शहर से दूसरे शहर में,\n",
|
| 67 |
+
"विशेष प्रस्ताव पारित किया जाना आवश्यक है।\n",
|
| 68 |
+
"शेयरधारकों की आम बैठक में\n",
|
| 69 |
+
"और इसकी एक प्रति रजिस्ट्रार के पास कार्यालय को\n",
|
| 70 |
+
"30 दिनों के भीतर बदलने के दाखिल करनी होगी।\n",
|
| 71 |
+
"नोटिस देना होगा।\n",
|
| 72 |
+
"रजिस्ट्रार को कार्यालय के नये पते का\n",
|
| 73 |
+
"तब तक परिवर्तन प्रभावी नहीं होगा।\n",
|
| 74 |
+
"जब तक केंद्र सरकार द्वारा प्रस्ताव की पुष्टि नहीं हो जाती\n",
|
| 75 |
+
"कंपनी किसी भी आधार पर\n",
|
| 76 |
+
"उपधारा 1 से\n",
|
| 77 |
+
"उपधारा 7 में धारा 17 तक उल्लेखित है।\n",
|
| 78 |
+
"जैसा कि अधिनियम के बाद ही परिवर्तन प्रभावी होगा।\n",
|
| 79 |
+
"अपने उद्देश्यों में बदलाव कर सकती है\n",
|
| 80 |
+
"सामान्य बैठक में सदस्यों द्वारा\n",
|
| 81 |
+
"कंपनी संशोधन अधिनियम 1996 को मेमोरेंडम ऑफ एसोसिएशन के\n",
|
| 82 |
+
"केंद्र सरकार के प्रतिबंध के साथ समाप्त कर दिया गया है।\n",
|
| 83 |
+
"विशेष संकल्प के अनुरूप अनुमोदित किए जाने\n",
|
| 84 |
+
"ऑब्जेक्ट क्लॉज में परिवर्तन के प्रति शेयर पूंजी में\n",
|
| 85 |
+
"परिवर्तन की प्रक्रिया और ऐसे परिवर्तन करने के अधिकार।\n",
|
| 86 |
+
"समान्य पहलु को आर्टीकल ऑफ एसोसिएशन में रखा गया है।\n",
|
| 87 |
+
"यदि संबंधित विषय के\n",
|
| 88 |
+
" आर्टीकल ऑफ एसोसिएशन में पीछे की प्रक्रिया नहीं दी गई है।\n",
|
| 89 |
+
"कंपनी को पारित करके आर्टीकल ऑफ एसोसिएशन को बदलना होगा।\n",
|
| 90 |
+
"एक विशेष प्रस्ताव\n",
|
| 91 |
+
"अब, हम ऑलट्रेशन ऑफ पर चर्चा करेंगे।\n",
|
| 92 |
+
"कंपनी अधिनियम 2013 के तहत मेमोरेंडम\n",
|
| 93 |
+
"अधिनियम की धारा 16, 17, 18, 19,\n",
|
| 94 |
+
"1956 के कंपनी 21, 23 और 37 के अनुरूप।\n",
|
| 95 |
+
"कंपनी अधिनियम, 2013 की धारा 13 ने\n",
|
| 96 |
+
" ऑलट्रेशन ऑफ मेमोरेंडम के लिए मानदंड निर्धारित किए हैं।\n",
|
| 97 |
+
"यह वही वर्णन करता है कि जैसा कि धारा 61 में दिया गया है।\n",
|
| 98 |
+
"एक कंपनी विशेष संकल्प द्वारा\n",
|
| 99 |
+
"और प्रावधानों को बदल सकती है।\n",
|
| 100 |
+
"निर्दिष्ट प्रक्रिया के अनुपालन से मेमोरेंडम\n",
|
| 101 |
+
"नाम खंड के परिवर्तन के संबंध में,\n",
|
| 102 |
+
"कंपनी अपना नाम बदल सकती है।\n",
|
| 103 |
+
"अनुमोदन के बाद लिखित रूप में केंद्र सरकार द्वारा\n",
|
| 104 |
+
"इसलिए जब कंपनी के नाम में कोई बदलाव किया जाता है,\n",
|
| 105 |
+
"रजिस्टर में दर्ज करेगा।\n",
|
| 106 |
+
" तो रजिस्ट्रार कंपनी के नया नाम\n",
|
| 107 |
+
"पुराने नाम के स्थान पर\n",
|
| 108 |
+
"निगमन का एक नया प्रमाणपत्र जारी करेगा।\n",
|
| 109 |
+
"कंपनी के पंजीकृत कार्यालय के बारे में\n",
|
| 110 |
+
"जैसा कि पहले उल्लेख किया गया है,\n",
|
| 111 |
+
"तब तक कोई प्रभाव नहीं पड़ेगा जब तक कि वह केंद्र सरकार द्वारा अनुमोदित नहीं हो जाता।\n",
|
| 112 |
+
"ऑब्जेक्ट क्लॉज के किसी भी परिवर्तन के संबंध में,\n",
|
| 113 |
+
"किसी कंपनी के मेमोरेंडम के\n",
|
| 114 |
+
"रजिस्ट्रार को दाखिल करने की\n",
|
| 115 |
+
"30 दिनों की अवधि के भीतर\n",
|
| 116 |
+
"तारीख से पंजीकरण को प्रमाणित करना होता है।\n",
|
| 117 |
+
"इस विशेष प्रस्ताव खंड के उप खंड 6 के खंड A के अनुसार\n",
|
| 118 |
+
"चलिए फिर से संक्षेप में\n",
|
| 119 |
+
" ऑलट्रेशन ऑफ मेमोरेंडम के महत्व के बारे में चर्चा करते हैं\n",
|
| 120 |
+
" क्योंकि ये इस मॉड्यूल के अध्ययन का एक बहुत महत्वपूर्ण हिस्सा है।\n",
|
| 121 |
+
"पहला महत्व यह है\n",
|
| 122 |
+
"कि यह एक बहुत ही आवश्यक दस्तावेज है।\n",
|
| 123 |
+
"एक कंपनी के निगमन के लिए\n",
|
| 124 |
+
"दूसरा, यह कंपनी के पंजीकृत कार्यालय को निर्दिष्ट करते हुए\n",
|
| 125 |
+
"रजिस्ट्रार और अदालत के अधिकार क्षेत्र को निर्धारित करता है।\n",
|
| 126 |
+
"तीसरा, यह कंपनी के अधिकारों में उद्देश्यों को\n",
|
| 127 |
+
"जनता की जानकारी के लिए दर्ज करता है।\n",
|
| 128 |
+
"अगला, यह कंपनी को केवल उन कृत्यों को करने के लिए\n",
|
| 129 |
+
"बाध्य करता है जो कंपनी के ऑब्जेक्ट क्लॉज में शामिल हैं।\n",
|
| 130 |
+
"यह कंपनी की अधिकृत कैपिटल\n",
|
| 131 |
+
"और उसके विभाजन को निश्चित राशि के शेयरों में निर्दिष्ट करता है।\n",
|
| 132 |
+
"पर प्रकाश डालता है।\n",
|
| 133 |
+
"यह कंपनी के सदस्यों के लायबिलिटी\n",
|
| 134 |
+
"अंत में, संघ के नियमों को\n",
|
| 135 |
+
"यह एक कंपनी के भी नियंत्रित करता है।\n"
|
| 136 |
+
]
|
| 137 |
+
}
|
| 138 |
+
],
|
| 139 |
+
"source": [
|
| 140 |
+
"file1 = open(\"recent_deliverables_dec2020/Corporate_Law/Hindi/ankita objects 02_Hindi_new.txt\",\"r+\",encoding='utf-8') \n",
|
| 141 |
+
"data = file1.read()\n",
|
| 142 |
+
"print(data)\n",
|
| 143 |
+
"file1.close()"
|
| 144 |
+
]
|
| 145 |
+
},
|
| 146 |
+
{
|
| 147 |
+
"cell_type": "code",
|
| 148 |
+
"execution_count": 22,
|
| 149 |
+
"metadata": {},
|
| 150 |
+
"outputs": [
|
| 151 |
+
{
|
| 152 |
+
"name": "stdout",
|
| 153 |
+
"output_type": "stream",
|
| 154 |
+
"text": [
|
| 155 |
+
"अब हम ऑलट्रेशन ऑफ मेमोरेंडम के बारे में बात करेंगे\n",
|
| 156 |
+
" मेमोरेंडम के विषयों को बदल दिया जा सकता है\n",
|
| 157 |
+
"कंपनी अधिनियम वन नाइन फाइव सिक्स के तहत\n",
|
| 158 |
+
"निम्नलिखित प्रक्रिया के अनुसार\n",
|
| 159 |
+
"यदि कोई कंपनी अपना नाम बदलना चाहती है\n",
|
| 160 |
+
"तो वे विशेष संकल्प में ऐसा कर सकती है\n",
|
| 161 |
+
"और केंद्र सरकार की मंजूरी के साथ\n",
|
| 162 |
+
"लिखित में\n",
|
| 163 |
+
"हालाँकि ऐसी किसी भी मंजूरी की आवश्यकता नहीं होती है\n",
|
| 164 |
+
"केवल कंपनी के नाम में परिवर्तन के लिए\n",
|
| 165 |
+
"बल्कि यह प्रक्रिया\n",
|
| 166 |
+
"पूरी तरह से निजी शब्द को हटाने के लिए होती है\n",
|
| 167 |
+
"तो इस मामले में\n",
|
| 168 |
+
"एक सार्वजनिक कंपनी को एक निजी कंपनी के संबंध में\n",
|
| 169 |
+
"या एक निजी कंपनी को एक सार्वजनिक कंपनी में परिवर्तित करने\n",
|
| 170 |
+
"दूसरी जगह पर पंजीकृत कार्यालय का दोबारा परिवर्तन किया जाना है\n",
|
| 171 |
+
"अगर एक ही शहर कस्बे\n",
|
| 172 |
+
"या गाँव में एक जगह से\n",
|
| 173 |
+
" थ्री ज़ीरो दिनों का नोटिस दिया जाना होता है\n",
|
| 174 |
+
"यह रजिस्ट्रार द्वारा परिवर्तन की तिथि के बाद\n",
|
| 175 |
+
"होगा जो उसी को दर्ज करेगा\n",
|
| 176 |
+
"पंजीकृत कार्यालय के परिवर्तन के मामले में\n",
|
| 177 |
+
"जबकि एक ही राज्य में वन शहर से दूसरे शहर में\n",
|
| 178 |
+
"विशेष प्रस्ताव पारित किया जाना आवश्यक है\n",
|
| 179 |
+
"शेयरधारकों की आम बैठक में\n",
|
| 180 |
+
"और इसकी एक प्रति रजिस्ट्रार के पास कार्यालय को\n",
|
| 181 |
+
" थ्री ज़ीरो दिनों के भीतर बदलने के दाखिल करनी होगी\n",
|
| 182 |
+
"नोटिस देना होगा\n",
|
| 183 |
+
"रजिस्ट्रार को कार्यालय के नये पते का\n",
|
| 184 |
+
"तब तक परिवर्तन प्रभावी नहीं होगा\n",
|
| 185 |
+
"जब तक केंद्र सरकार द्वारा प्रस्ताव की पुष्टि नहीं हो जाती\n",
|
| 186 |
+
"कंपनी किसी भी आधार पर\n",
|
| 187 |
+
"उपधारा वन से\n",
|
| 188 |
+
"उपधारा सेवेन में धारा वन सेवेन तक उल्लेखित है\n",
|
| 189 |
+
"जैसा कि अधिनियम के बाद ही परिवर्तन प्रभावी होगा\n",
|
| 190 |
+
"अपने उद्देश्यों में बदलाव कर सकती है\n",
|
| 191 |
+
"सामान्य बैठक में सदस्यों द्वारा\n",
|
| 192 |
+
"कंपनी संशोधन अधिनियम वन नाइन नाइन सिक्स को मेमोरेंडम ऑफ एसोसिएशन के\n",
|
| 193 |
+
"केंद्र सरकार के प्रतिबंध के साथ समाप्त कर दिया गया है\n",
|
| 194 |
+
"विशेष संकल्प के अनुरूप अनुमोदित किए जाने\n",
|
| 195 |
+
"ऑब्जेक्ट क्लॉज में परिवर्तन के प्रति शेयर पूंजी में\n",
|
| 196 |
+
"परिवर्तन की प्रक्रिया और ऐसे परिवर्तन करने के अधिकार\n",
|
| 197 |
+
"समान्य पहलु को आर्टीकल ऑफ एसोसिएशन में रखा गया है\n",
|
| 198 |
+
"यदि संबंधित विषय के\n",
|
| 199 |
+
" आर्टीकल ऑफ एसोसिएशन में पीछे की प्रक्रिया नहीं दी गई है\n",
|
| 200 |
+
"कंपनी को पारित करके आर्टीकल ऑफ एसोसिएशन को बदलना होगा\n",
|
| 201 |
+
"एक विशेष प्रस्ताव\n",
|
| 202 |
+
"अब हम ऑलट्रेशन ऑफ पर चर्चा करेंगे\n",
|
| 203 |
+
"कंपनी अधिनियम टू ज़ीरो वन थ्री के तहत मेमोरेंडम\n",
|
| 204 |
+
"अधिनियम की धारा वन सिक्स वन सेवेन वन ऐइट वन नाइन \n",
|
| 205 |
+
" वन नाइन फाइव सिक्स के कंपनी टू वन टू थ्री और थ्री सेवेन के अनुरूप\n",
|
| 206 |
+
"कंपनी अधिनियम टू ज़ीरो वन थ्री की धारा वन थ्री ने\n",
|
| 207 |
+
" ऑलट्रेशन ऑफ मेमोरेंडम के लिए मानदंड निर्धारित किए हैं\n",
|
| 208 |
+
"यह वही वर्णन करता है कि जैसा कि धारा सिक्स वन में दिया गया है\n",
|
| 209 |
+
"एक कंपनी विशेष संकल्प द्वारा\n",
|
| 210 |
+
"और प्रावधानों को बदल सकती है\n",
|
| 211 |
+
"निर्दिष्ट प्रक्रिया के अनुपालन से मेमोरेंडम\n",
|
| 212 |
+
"नाम खंड के परिवर्तन के संबंध में\n",
|
| 213 |
+
"कंपनी अपना नाम बदल सकती है\n",
|
| 214 |
+
"अनुमोदन के बाद लिखित रूप में केंद्र सरकार द्वारा\n",
|
| 215 |
+
"इसलिए जब कंपनी के नाम में कोई बदलाव किया जाता है\n",
|
| 216 |
+
"रजिस्टर में दर्ज करेगा\n",
|
| 217 |
+
" तो रजिस्ट्रार कंपनी के नया नाम\n",
|
| 218 |
+
"पुराने नाम के स्थान पर\n",
|
| 219 |
+
"निगमन का एक नया प्रमाणपत्र जारी करेगा\n",
|
| 220 |
+
"कंपनी के पंजीकृत कार्यालय के बारे में\n",
|
| 221 |
+
"जैसा कि पहले उल्लेख किया गया है\n",
|
| 222 |
+
"तब तक कोई प्रभाव नहीं पड़ेगा जब तक कि वह केंद्र सरकार द्वारा अनुमोदित नहीं हो जाता\n",
|
| 223 |
+
"ऑब्जेक्ट क्लॉज के किसी भी परिवर्तन के संबंध में\n",
|
| 224 |
+
"किसी कंपनी के मेमोरेंडम के\n",
|
| 225 |
+
"रजिस्ट्रार को दाखिल करने की\n",
|
| 226 |
+
" थ्री ज़ीरो दिनों की अवधि के भीतर\n",
|
| 227 |
+
"तारीख से पंजीकरण को प्रमाणित करना होता है\n",
|
| 228 |
+
"इस विशेष प्रस्ताव खंड के उप खंड सिक्स के खंड ए के अनुसार\n",
|
| 229 |
+
"चलिए फिर से संक्षेप में\n",
|
| 230 |
+
" ऑलट्रेशन ऑफ मेमोरेंडम के महत्व के बारे में चर्चा करते हैं\n",
|
| 231 |
+
" क्योंकि ये इस मॉड्यूल के अध्ययन का एक बहुत महत्वपूर्ण हिस्सा है\n",
|
| 232 |
+
"पहला महत्व यह है\n",
|
| 233 |
+
"कि यह एक बहुत ही आवश्यक दस्तावेज है\n",
|
| 234 |
+
"एक कंपनी के निगमन के लिए\n",
|
| 235 |
+
"दूसरा यह कंपनी के पंजीकृत कार्यालय को निर्दिष्ट करते हुए\n",
|
| 236 |
+
"रजिस्ट्रार और अदालत के अधिकार क्षेत्र को निर्धारित करता है\n",
|
| 237 |
+
"तीसरा यह कंपनी के अधिकारों में उद्देश्यों को\n",
|
| 238 |
+
"जनता की जानकारी के लिए दर्ज करता है\n",
|
| 239 |
+
"अगला यह कंपनी को केवल उन कृत्यों को करने के लिए\n",
|
| 240 |
+
"बाध्य करता है जो कंपनी के ऑब्जेक्ट क्लॉज में शामिल हैं\n",
|
| 241 |
+
"यह कंपनी की अधिकृत कैपिटल\n",
|
| 242 |
+
"और उसके विभाजन को निश्चित राशि के शेयरों में निर्दिष्ट करता है\n",
|
| 243 |
+
"पर प्रकाश डालता है\n",
|
| 244 |
+
"यह कंपनी के सदस्यों के लायबिलिटी\n",
|
| 245 |
+
"अंत में संघ के नियमों को\n",
|
| 246 |
+
"यह एक कंपनी के भी नियंत्रित करता है\n"
|
| 247 |
+
]
|
| 248 |
+
}
|
| 249 |
+
],
|
| 250 |
+
"source": [
|
| 251 |
+
"\n",
|
| 252 |
+
"wb_obj = openpyxl.load_workbook(\"charmap_v2_new.xlsx\") \n",
|
| 253 |
+
"sheet_obj = wb_obj.active \n",
|
| 254 |
+
"\n",
|
| 255 |
+
"#data = re.sub('[A-Z]*', '',data)\n",
|
| 256 |
+
"#print(data)\n",
|
| 257 |
+
"data = data.replace('?','')\n",
|
| 258 |
+
"data = data.replace(' ',' ')\n",
|
| 259 |
+
"data = data.replace(';','')\n",
|
| 260 |
+
"data = data.replace(')','')\n",
|
| 261 |
+
"data = data.replace('(','')\n",
|
| 262 |
+
"data = data.replace('!','')\n",
|
| 263 |
+
"data = data.replace(' – ',' ')\n",
|
| 264 |
+
"data = data.replace('-',' ')\n",
|
| 265 |
+
"data = data.replace('।','')\n",
|
| 266 |
+
"data = data.replace('&','')\n",
|
| 267 |
+
"data = data.replace('’','')\n",
|
| 268 |
+
"data = data.replace('‘','')\n",
|
| 269 |
+
"data = data.replace(':','')\n",
|
| 270 |
+
"data = data.replace(',','')\n",
|
| 271 |
+
"data = data.replace('/','')\n",
|
| 272 |
+
"data = data.replace(',','')\n",
|
| 273 |
+
"data = data.replace('.','')\n",
|
| 274 |
+
"data = data.replace('|','')\n",
|
| 275 |
+
"m_row = sheet_obj.max_row \n",
|
| 276 |
+
"line = data\n",
|
| 277 |
+
"\n",
|
| 278 |
+
"for i in range(1,m_row+1):\n",
|
| 279 |
+
" num = sheet_obj.cell(row = i, column = 1).value \n",
|
| 280 |
+
" word = sheet_obj.cell(row = i, column = 2).value\n",
|
| 281 |
+
" #print(num)\n",
|
| 282 |
+
" #print(word)\n",
|
| 283 |
+
" line = line.replace(str(num), word)\n",
|
| 284 |
+
"#print(line)\n",
|
| 285 |
+
"#' '.join(line.split())\n",
|
| 286 |
+
"print(line) \n",
|
| 287 |
+
"file1 = open(\"recent_deliverables_dec2020/Corporate_Law/Hindi/ankita objects 02_Hindi.txt\",\"w+\",encoding='utf-8') \n",
|
| 288 |
+
"file1.write(line)\n",
|
| 289 |
+
"file1.close()"
|
| 290 |
+
]
|
| 291 |
+
},
|
| 292 |
+
{
|
| 293 |
+
"cell_type": "code",
|
| 294 |
+
"execution_count": null,
|
| 295 |
+
"metadata": {
|
| 296 |
+
"collapsed": true
|
| 297 |
+
},
|
| 298 |
+
"outputs": [],
|
| 299 |
+
"source": []
|
| 300 |
+
},
|
| 301 |
+
{
|
| 302 |
+
"cell_type": "code",
|
| 303 |
+
"execution_count": null,
|
| 304 |
+
"metadata": {
|
| 305 |
+
"collapsed": true
|
| 306 |
+
},
|
| 307 |
+
"outputs": [],
|
| 308 |
+
"source": []
|
| 309 |
+
}
|
| 310 |
+
],
|
| 311 |
+
"metadata": {
|
| 312 |
+
"kernelspec": {
|
| 313 |
+
"display_name": "Python 3",
|
| 314 |
+
"language": "python",
|
| 315 |
+
"name": "python3"
|
| 316 |
+
},
|
| 317 |
+
"language_info": {
|
| 318 |
+
"codemirror_mode": {
|
| 319 |
+
"name": "ipython",
|
| 320 |
+
"version": 3
|
| 321 |
+
},
|
| 322 |
+
"file_extension": ".py",
|
| 323 |
+
"mimetype": "text/x-python",
|
| 324 |
+
"name": "python",
|
| 325 |
+
"nbconvert_exporter": "python",
|
| 326 |
+
"pygments_lexer": "ipython3",
|
| 327 |
+
"version": "3.6.3"
|
| 328 |
+
}
|
| 329 |
+
},
|
| 330 |
+
"nbformat": 4,
|
| 331 |
+
"nbformat_minor": 2
|
| 332 |
+
}
|
charmap/Text_Cleaning.py
ADDED
|
@@ -0,0 +1,76 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
#!/usr/bin/env python
|
| 2 |
+
# coding: utf-8
|
| 3 |
+
|
| 4 |
+
# In[2]:
|
| 5 |
+
|
| 6 |
+
|
| 7 |
+
############################################################
|
| 8 |
+
#Author : Bhagyashree
|
| 9 |
+
#Date : 1st Sept, 2020
|
| 10 |
+
#Purpose : Text Cleaning
|
| 11 |
+
#Input   : Text file after timestamp removal (sys.argv[1]) and the charmap .xlsx workbook (sys.argv[2])
|
| 12 |
+
#Output  : Text file after cleaning data, written to the path given in sys.argv[3]
|
| 13 |
+
############################################################
|
| 14 |
+
|
| 15 |
+
|
| 16 |
+
# In[3]:
|
| 17 |
+
|
| 18 |
+
|
| 19 |
+
import nltk
|
| 20 |
+
import numpy
|
| 21 |
+
import xlrd
|
| 22 |
+
import openpyxl
|
| 23 |
+
import re
|
| 24 |
+
import sys
|
| 25 |
+
|
| 26 |
+
# In[21]:
|
| 27 |
+
|
| 28 |
+
#file1 = open("recent_deliverables_dec2020/Corporate_Law/Hindi/ankita objects 02_Hindi_new.txt","r+",encoding='utf-8')
|
| 29 |
+
# Usage: Text_Cleaning.py <input.txt> <charmap.xlsx> <output.txt>
#
# Read the whole input text. Read-only mode is sufficient because the input
# file is never written back, and the context manager closes the handle even
# if reading fails.
with open(sys.argv[1], "r", encoding='utf-8') as file1:
    data = file1.read()


# In[22]:

# Character-map workbook: column 1 holds the text to look for, column 2 the
# text that replaces it. Only the active sheet is consulted.
wb_obj = openpyxl.load_workbook(sys.argv[2])
sheet_obj = wb_obj.active

# Punctuation stripping. The stages are kept in their original order because
# the ' – ' pattern only matches while both of its surrounding spaces are
# still adjacent to the dash at that point in the pipeline.
data = data.replace('?','')
# NOTE(review): as written this swaps a single space for a single space and
# is therefore a no-op; presumably it was meant to collapse a double space.
# Confirm against the original notebook before changing it.
data = data.replace(' ',' ')
data = data.translate(str.maketrans('', '', ';)(!'))
data = data.replace(' – ',' ')
# Hyphens become spaces; the remaining punctuation marks are deleted outright.
data = data.translate(str.maketrans('-', ' ', '।&’‘:,/.|'))

m_row = sheet_obj.max_row
line = data

# Apply the character map row by row, in sheet order.
for i in range(1, m_row + 1):
    num = sheet_obj.cell(row=i, column=1).value
    word = sheet_obj.cell(row=i, column=2).value
    # max_row can include blank rows (or an entirely empty sheet); an empty
    # cell comes back as None, which would otherwise turn into the literal
    # key "None" or crash str.replace with a TypeError.
    if num is None or word is None:
        continue
    key = str(num)
    # Replacing the empty string would insert `word` between every character.
    if not key:
        continue
    # str() guards against numeric replacement cells.
    line = line.replace(key, str(word))

# Write the cleaned text to the output path; the context manager guarantees
# the data is flushed and the handle closed.
with open(sys.argv[3], "w", encoding='utf-8') as file1:
    file1.write(line)
|
| 76 |
+
|
charmap/charmap_Bengali.txt
ADDED
|
@@ -0,0 +1,62 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
0 জিরো
|
| 2 |
+
1 ওয়ান
|
| 3 |
+
2 টু
|
| 4 |
+
3 থ্রী
|
| 5 |
+
4 ফোর
|
| 6 |
+
5 ফাইভ
|
| 7 |
+
6 সিক্স
|
| 8 |
+
7 সেবন
|
| 9 |
+
8 এইট
|
| 10 |
+
9 নাইন
|
| 11 |
+
A এ
|
| 12 |
+
a এ
|
| 13 |
+
B বী
|
| 14 |
+
b বী
|
| 15 |
+
C সী
|
| 16 |
+
c সী
|
| 17 |
+
D ডি
|
| 18 |
+
d ডি
|
| 19 |
+
E ই
|
| 20 |
+
e ই
|
| 21 |
+
F এফ
|
| 22 |
+
f এফ
|
| 23 |
+
G জি
|
| 24 |
+
g জি
|
| 25 |
+
H এছ
|
| 26 |
+
h এছ
|
| 27 |
+
I আই
|
| 28 |
+
i আই
|
| 29 |
+
J জে
|
| 30 |
+
j জে
|
| 31 |
+
K কে
|
| 32 |
+
k কে
|
| 33 |
+
L এল
|
| 34 |
+
l এল
|
| 35 |
+
M এম
|
| 36 |
+
m এম
|
| 37 |
+
N এন
|
| 38 |
+
n এন
|
| 39 |
+
O ও
|
| 40 |
+
o ও
|
| 41 |
+
P পি
|
| 42 |
+
p পি
|
| 43 |
+
Q ক্যু
|
| 44 |
+
q ক্যু
|
| 45 |
+
R আর
|
| 46 |
+
r আর
|
| 47 |
+
S এস
|
| 48 |
+
s এস
|
| 49 |
+
T টি
|
| 50 |
+
t টি
|
| 51 |
+
U ইউ
|
| 52 |
+
u ইউ
|
| 53 |
+
V ভি
|
| 54 |
+
v ভি
|
| 55 |
+
W ডাবলু
|
| 56 |
+
w ডাবলু
|
| 57 |
+
X এক্স
|
| 58 |
+
x এক্স
|
| 59 |
+
Y উহাই
|
| 60 |
+
y উহাই
|
| 61 |
+
Z জেডঃ
|
| 62 |
+
z জেডঃ
|
charmap/charmap_Hindi.txt
ADDED
|
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
0 ज़ीरो
|
| 2 |
+
1 वन
|
| 3 |
+
2 टू
|
| 4 |
+
3 थ्री
|
| 5 |
+
4 फोर
|
| 6 |
+
5 फाइव
|
| 7 |
+
6 सिक्स
|
| 8 |
+
7 सेवेन
|
| 9 |
+
8 ऐइट
|
| 10 |
+
9 नाइन
|
| 11 |
+
० ज़ीरो
|
| 12 |
+
१ वन
|
| 13 |
+
२ टू
|
| 14 |
+
३ थ्री
|
| 15 |
+
४ फोर
|
| 16 |
+
५ फाइव
|
| 17 |
+
६ सिक्स
|
| 18 |
+
७ सेवेन
|
| 19 |
+
८ ऐइट
|
| 20 |
+
९ नाइन
|
| 21 |
+
A ए
|
| 22 |
+
a ए
|
| 23 |
+
B बी
|
| 24 |
+
b बी
|
| 25 |
+
C सी
|
| 26 |
+
c सी
|
| 27 |
+
D डी
|
| 28 |
+
d डी
|
| 29 |
+
E इ
|
| 30 |
+
e इ
|
| 31 |
+
F एफ
|
| 32 |
+
f एफ
|
| 33 |
+
G जी
|
| 34 |
+
g जी
|
| 35 |
+
H एच
|
| 36 |
+
h एच
|
| 37 |
+
I आई
|
| 38 |
+
i आई
|
| 39 |
+
J जे
|
| 40 |
+
j जे
|
| 41 |
+
K के
|
| 42 |
+
k के
|
| 43 |
+
L एल
|
| 44 |
+
l एल
|
| 45 |
+
M एम
|
| 46 |
+
m एम
|
| 47 |
+
N एन
|
| 48 |
+
n एन
|
| 49 |
+
O ओ
|
| 50 |
+
o ओ
|
| 51 |
+
P पी
|
| 52 |
+
p पी
|
| 53 |
+
Q क्यू
|
| 54 |
+
q क्यू
|
| 55 |
+
R आर
|
| 56 |
+
r आर
|
| 57 |
+
S एस
|
| 58 |
+
s एस
|
| 59 |
+
T टी
|
| 60 |
+
t टी
|
| 61 |
+
U यू
|
| 62 |
+
u यू
|
| 63 |
+
V वी
|
| 64 |
+
v वी
|
| 65 |
+
W डबलु
|
| 66 |
+
w डबलु
|
| 67 |
+
X एक्स
|
| 68 |
+
x एक्स
|
| 69 |
+
Y व्हाई
|
| 70 |
+
y व्हाई
|
| 71 |
+
Z ज़ेड
|
| 72 |
+
z ज़ेड
|
| 73 |
+
α अल्फा
|
| 74 |
+
φ फ़ाई
|
| 75 |
+
+ प्लस
|
| 76 |
+
= इक्वल
|
| 77 |
+
λ लैम्ब्डा
|
| 78 |
+
∅ नॉट
|
| 79 |
+
ϕ फ़ाई
|
| 80 |
+
𝝅 पाई
|
| 81 |
+
⇒ इम्प्लइज
|
charmap/charmap_Hindi.xlsx
ADDED
|
Binary file (10.8 kB). View file
|
|
|
charmap/charmap_Malayalam.txt
ADDED
|
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
0 സീറോ
|
| 2 |
+
1 വൺ
|
| 3 |
+
2 ടു
|
| 4 |
+
3 ത്രീ
|
| 5 |
+
4 ഫോർ
|
| 6 |
+
5 ഫൈവ്
|
| 7 |
+
6 സിക്സ്
|
| 8 |
+
7 സെവൻ
|
| 9 |
+
8 എയ്റ്റ്
|
| 10 |
+
9 നൈൻ
|
| 11 |
+
0 സീറോ
|
| 12 |
+
1 വൺ
|
| 13 |
+
2 ടു
|
| 14 |
+
3 ത്രീ
|
| 15 |
+
4 ഫോർ
|
| 16 |
+
5 ഫൈവ്
|
| 17 |
+
6 സിക്സ്
|
| 18 |
+
7 സെവൻ
|
| 19 |
+
8 എയ്റ്റ്
|
| 20 |
+
9 നൈൻ
|
| 21 |
+
A എ
|
| 22 |
+
a എ
|
| 23 |
+
B ബി
|
| 24 |
+
b ബി
|
| 25 |
+
C സി
|
| 26 |
+
c സി
|
| 27 |
+
D ഡി
|
| 28 |
+
d ഡി
|
| 29 |
+
E ഇ
|
| 30 |
+
e ഇ
|
| 31 |
+
F എഫ്
|
| 32 |
+
f എഫ്
|
| 33 |
+
G ജി
|
| 34 |
+
g ജി
|
| 35 |
+
H എഛ്
|
| 36 |
+
h എഛ്
|
| 37 |
+
I ഐ
|
| 38 |
+
i ഐ
|
| 39 |
+
J ജെ
|
| 40 |
+
j ജെ
|
| 41 |
+
K കെ
|
| 42 |
+
k കെ
|
| 43 |
+
L എൽ
|
| 44 |
+
l എൽ
|
| 45 |
+
M എം
|
| 46 |
+
m എം
|
| 47 |
+
N എൻ
|
| 48 |
+
n എൻ
|
| 49 |
+
O ഒ
|
| 50 |
+
o ഒ
|
| 51 |
+
P പി
|
| 52 |
+
p പി
|
| 53 |
+
Q ക്യു
|
| 54 |
+
q ക്യു
|
| 55 |
+
R ആർ
|
| 56 |
+
r ആർ
|
| 57 |
+
S എസ്
|
| 58 |
+
s എസ്
|
| 59 |
+
T ടി
|
| 60 |
+
t ടി
|
| 61 |
+
U യു
|
| 62 |
+
u യു
|
| 63 |
+
V വി
|
| 64 |
+
v വി
|
| 65 |
+
W ഡബ്ല്യൂ
|
| 66 |
+
w ഡബ്ല്യൂ
|
| 67 |
+
X എക്സ്
|
| 68 |
+
x എക്സ്
|
| 69 |
+
Y വൈ
|
| 70 |
+
y വൈ
|
| 71 |
+
Z സെഡ്
|
| 72 |
+
z സെഡ്
|
| 73 |
+
α ആൽഫ
|
| 74 |
+
φ ഫി
|
| 75 |
+
+ പ്ലസ്
|
| 76 |
+
= ഈക്വൽ
|
| 77 |
+
λ ലാംബ്ടാ
|
| 78 |
+
∅ നോട്ട്
|
| 79 |
+
ϕ സൈ
|
| 80 |
+
𝝅 പൈ
|
| 81 |
+
⇒ ഇമ്പ്ലെയ്സ്
|
charmap/charmap_Malayalam.xlsx
ADDED
|
Binary file (13.1 kB). View file
|
|
|
charmap/charmap_Marathi.txt
ADDED
|
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
0 ज़ीरो
|
| 2 |
+
1 वन
|
| 3 |
+
2 टू
|
| 4 |
+
3 थ्री
|
| 5 |
+
4 फोर
|
| 6 |
+
5 फाइव
|
| 7 |
+
6 सिक्स
|
| 8 |
+
7 सेवेन
|
| 9 |
+
8 ऐइट
|
| 10 |
+
9 नाइन
|
| 11 |
+
० ज़ीरो
|
| 12 |
+
१ वन
|
| 13 |
+
२ टू
|
| 14 |
+
३ थ्री
|
| 15 |
+
४ फोर
|
| 16 |
+
५ फाइव
|
| 17 |
+
६ सिक्स
|
| 18 |
+
७ सेवेन
|
| 19 |
+
८ ऐइट
|
| 20 |
+
९ नाइन
|
| 21 |
+
A ए
|
| 22 |
+
a ए
|
| 23 |
+
B बी
|
| 24 |
+
b बी
|
| 25 |
+
C सी
|
| 26 |
+
c सी
|
| 27 |
+
D डी
|
| 28 |
+
d डी
|
| 29 |
+
E इ
|
| 30 |
+
e इ
|
| 31 |
+
F एफ
|
| 32 |
+
f एफ
|
| 33 |
+
G जी
|
| 34 |
+
g जी
|
| 35 |
+
H एच
|
| 36 |
+
h एच
|
| 37 |
+
I आई
|
| 38 |
+
i आई
|
| 39 |
+
J जे
|
| 40 |
+
j जे
|
| 41 |
+
K के
|
| 42 |
+
k के
|
| 43 |
+
L एल
|
| 44 |
+
l एल
|
| 45 |
+
M एम
|
| 46 |
+
m एम
|
| 47 |
+
N एन
|
| 48 |
+
n एन
|
| 49 |
+
O ओ
|
| 50 |
+
o ओ
|
| 51 |
+
P पी
|
| 52 |
+
p पी
|
| 53 |
+
Q क्यू
|
| 54 |
+
q क्यू
|
| 55 |
+
R आर
|
| 56 |
+
r आर
|
| 57 |
+
S एस
|
| 58 |
+
s एस
|
| 59 |
+
T टी
|
| 60 |
+
t टी
|
| 61 |
+
U यू
|
| 62 |
+
u यू
|
| 63 |
+
V वी
|
| 64 |
+
v वी
|
| 65 |
+
W डबलु
|
| 66 |
+
w डबलु
|
| 67 |
+
X एक्स
|
| 68 |
+
x एक्स
|
| 69 |
+
Y व्हाई
|
| 70 |
+
y व्हाई
|
| 71 |
+
Z ज़ेड
|
| 72 |
+
z ज़ेड
|
| 73 |
+
α अल्फा
|
| 74 |
+
φ फ़ाई
|
| 75 |
+
+ प्लस
|
| 76 |
+
= इक्वल
|
| 77 |
+
λ लैम्ब्डा
|
| 78 |
+
∅ नॉट
|
| 79 |
+
ϕ फ़ाई
|
| 80 |
+
𝝅 पाई
|
| 81 |
+
⇒ इम्प्लइज
|
charmap/charmap_Marathi.xlsx
ADDED
|
Binary file (10.8 kB). View file
|
|
|
charmap/charmap_Tamil.disabled
ADDED
|
@@ -0,0 +1,76 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
0 ஸிரோ
|
| 2 |
+
1 ஒன்னு
|
| 3 |
+
2 டூ
|
| 4 |
+
3 த்ரீ
|
| 5 |
+
4 போர்
|
| 6 |
+
5 பைவ்
|
| 7 |
+
6 சீஸ்
|
| 8 |
+
7 செவென்
|
| 9 |
+
8 எயிட்
|
| 10 |
+
9 நயன்
|
| 11 |
+
A எ
|
| 12 |
+
a எ
|
| 13 |
+
B பி
|
| 14 |
+
b பி
|
| 15 |
+
C சி
|
| 16 |
+
c சி
|
| 17 |
+
D டி
|
| 18 |
+
d டி
|
| 19 |
+
E இ
|
| 20 |
+
e இ
|
| 21 |
+
F எப்
|
| 22 |
+
f எப்
|
| 23 |
+
G ஜி
|
| 24 |
+
g ஜி
|
| 25 |
+
H ஹ்
|
| 26 |
+
h ஹ்
|
| 27 |
+
I ஐ
|
| 28 |
+
i ஐ
|
| 29 |
+
J ஜே
|
| 30 |
+
j ஜே
|
| 31 |
+
K கே
|
| 32 |
+
k கே
|
| 33 |
+
L ல்
|
| 34 |
+
l ல்
|
| 35 |
+
M ம்
|
| 36 |
+
m ம்
|
| 37 |
+
N ன்
|
| 38 |
+
n ன்
|
| 39 |
+
O ஓ
|
| 40 |
+
o ஓ
|
| 41 |
+
P பி
|
| 42 |
+
p பி
|
| 43 |
+
Q கியூ
|
| 44 |
+
q கியூ
|
| 45 |
+
R ர்
|
| 46 |
+
r ர்
|
| 47 |
+
S ஸ்
|
| 48 |
+
s ஸ்
|
| 49 |
+
T டீ
|
| 50 |
+
t டீ
|
| 51 |
+
U யூ
|
| 52 |
+
u யூ
|
| 53 |
+
V வி
|
| 54 |
+
v வி
|
| 55 |
+
W டௌபிள்யூ
|
| 56 |
+
w டௌபிள்யூ
|
| 57 |
+
X எஸ்
|
| 58 |
+
x எஸ்
|
| 59 |
+
Y யை
|
| 60 |
+
y யை
|
| 61 |
+
Z செட்
|
| 62 |
+
z செட்
|
| 63 |
+
α ஆல்பா
|
| 64 |
+
φ பிய்
|
| 65 |
+
+ பிளஸ்
|
| 66 |
+
= ஏகுவாள்
|
| 67 |
+
λ லாம்டா
|
| 68 |
+
∅ நோட்
|
| 69 |
+
ϕ பிய்
|
| 70 |
+
𝝅 பை
|
| 71 |
+
⇒ இம்ப்ளிஸ்
|
| 72 |
+
. பாயிண்ட்
|
| 73 |
+
% பெர்ஸண்டாஜ்
|
| 74 |
+
°C டிகிரிசெல்சியஸ்
|
| 75 |
+
θ தீட்டா
|
| 76 |
+
* இண்டூ
|
charmap/charmap_Tamil.xlsx
ADDED
|
Binary file (11.1 kB). View file
|
|
|
charmap/charmap_Telugu.txt
ADDED
|
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
0 జీరొ
|
| 2 |
+
1 వన్
|
| 3 |
+
2 టు
|
| 4 |
+
3 త్రీ
|
| 5 |
+
4 ఫోర్
|
| 6 |
+
5 ఫైవ్
|
| 7 |
+
6 సిక్స్
|
| 8 |
+
7 సెవెన్
|
| 9 |
+
8 ఎఇట్
|
| 10 |
+
9 నైన్
|
| 11 |
+
० జీరొ
|
| 12 |
+
१ వన్
|
| 13 |
+
२ టు
|
| 14 |
+
३ త్రీ
|
| 15 |
+
४ ఫోర్
|
| 16 |
+
५ ఫైవ్
|
| 17 |
+
६ సిక్స్
|
| 18 |
+
७ సెవెన్
|
| 19 |
+
८ ఎఇట్
|
| 20 |
+
९ నైన్
|
| 21 |
+
A ఎ
|
| 22 |
+
a ఎ
|
| 23 |
+
B బి
|
| 24 |
+
b బి
|
| 25 |
+
C సి
|
| 26 |
+
c సి
|
| 27 |
+
D డి
|
| 28 |
+
d డి
|
| 29 |
+
E ఇ
|
| 30 |
+
e ఇ
|
| 31 |
+
F ఎఫ్
|
| 32 |
+
f ఎఫ్
|
| 33 |
+
G జి
|
| 34 |
+
g జి
|
| 35 |
+
H హెచ్
|
| 36 |
+
h హెచ్
|
| 37 |
+
I ఐ
|
| 38 |
+
i ఐ
|
| 39 |
+
J జె
|
| 40 |
+
j జె
|
| 41 |
+
K కె
|
| 42 |
+
k కె
|
| 43 |
+
L ఎల్
|
| 44 |
+
l ఎల్
|
| 45 |
+
M ఎమ్
|
| 46 |
+
m ఎమ్
|
| 47 |
+
N ఎన్
|
| 48 |
+
n ఎన్
|
| 49 |
+
O ఒ
|
| 50 |
+
o ఒ
|
| 51 |
+
P పి
|
| 52 |
+
p పి
|
| 53 |
+
Q క్యు
|
| 54 |
+
q క్యు
|
| 55 |
+
R ఆర్
|
| 56 |
+
r ఆర్
|
| 57 |
+
S ఎస్
|
| 58 |
+
s ఎస్
|
| 59 |
+
T టి
|
| 60 |
+
t టి
|
| 61 |
+
U యు
|
| 62 |
+
u యు
|
| 63 |
+
V వి
|
| 64 |
+
v వి
|
| 65 |
+
W డబ్లు
|
| 66 |
+
w డబ్లు
|
| 67 |
+
X ఎక్స్
|
| 68 |
+
x ఎక్స్
|
| 69 |
+
Y వై
|
| 70 |
+
y వై
|
| 71 |
+
Z జెడ్
|
| 72 |
+
z జెడ్
|
| 73 |
+
α ఆల్ఫ
|
| 74 |
+
φ ఫై
|
| 75 |
+
+ ప్లస్
|
| 76 |
+
= ఈక్వల్
|
| 77 |
+
λ లామ్బ్డ
|
| 78 |
+
∅ నల్
|
| 79 |
+
ϕ ఫై
|
| 80 |
+
𝝅 పై
|
| 81 |
+
⇒ ఇమ్ప్లైస్
|
charmap/charmap_Telugu.xlsx
ADDED
|
Binary file (10 kB). View file
|
|
|
dogri_latest/female/model/config.yaml
ADDED
|
@@ -0,0 +1,320 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
accum_grad: 8
|
| 2 |
+
adapter: lora
|
| 3 |
+
adapter_conf: {}
|
| 4 |
+
allow_multi_rates: false
|
| 5 |
+
allow_variable_data_keys: false
|
| 6 |
+
batch_bins: 3000000
|
| 7 |
+
batch_size: 20
|
| 8 |
+
batch_type: numel
|
| 9 |
+
best_model_criterion:
|
| 10 |
+
- - valid
|
| 11 |
+
- loss
|
| 12 |
+
- min
|
| 13 |
+
- - train
|
| 14 |
+
- loss
|
| 15 |
+
- min
|
| 16 |
+
bpemodel: null
|
| 17 |
+
category_sample_size: 10
|
| 18 |
+
chunk_default_fs: null
|
| 19 |
+
chunk_discard_short_samples: true
|
| 20 |
+
chunk_excluded_key_prefixes: []
|
| 21 |
+
chunk_length: 500
|
| 22 |
+
chunk_max_abs_length: null
|
| 23 |
+
chunk_shift_ratio: 0.5
|
| 24 |
+
cleaner: null
|
| 25 |
+
collect_stats: false
|
| 26 |
+
config: conf/tuning/train_fastspeech2.yaml
|
| 27 |
+
create_graph_in_tensorboard: false
|
| 28 |
+
cudnn_benchmark: false
|
| 29 |
+
cudnn_deterministic: true
|
| 30 |
+
cudnn_enabled: true
|
| 31 |
+
deepspeed_config: null
|
| 32 |
+
detect_anomaly: false
|
| 33 |
+
dist_backend: nccl
|
| 34 |
+
dist_init_method: env://
|
| 35 |
+
dist_launcher: null
|
| 36 |
+
dist_master_addr: localhost
|
| 37 |
+
dist_master_port: 33333
|
| 38 |
+
dist_rank: 0
|
| 39 |
+
dist_world_size: 2
|
| 40 |
+
distributed: true
|
| 41 |
+
drop_last_iter: false
|
| 42 |
+
dry_run: false
|
| 43 |
+
early_stopping_criterion:
|
| 44 |
+
- valid
|
| 45 |
+
- loss
|
| 46 |
+
- min
|
| 47 |
+
energy_extract: energy
|
| 48 |
+
energy_extract_conf:
|
| 49 |
+
fs: 48000
|
| 50 |
+
hop_length: 1024
|
| 51 |
+
n_fft: 8192
|
| 52 |
+
reduction_factor: 1
|
| 53 |
+
win_length: 4096
|
| 54 |
+
energy_normalize: global_mvn
|
| 55 |
+
energy_normalize_conf:
|
| 56 |
+
stats_file: /home/speech/Suji/FS2/Fastspeech2_HS/Models_ph3/Dogri_fem_mono/energy_stats.npz
|
| 57 |
+
exclude_weight_decay: false
|
| 58 |
+
exclude_weight_decay_conf: {}
|
| 59 |
+
feats_extract: fbank
|
| 60 |
+
feats_extract_conf:
|
| 61 |
+
fmax: 24000
|
| 62 |
+
fmin: 0
|
| 63 |
+
fs: 48000
|
| 64 |
+
hop_length: 1024
|
| 65 |
+
n_fft: 8192
|
| 66 |
+
n_mels: 160
|
| 67 |
+
win_length: 4096
|
| 68 |
+
fold_length:
|
| 69 |
+
- 150
|
| 70 |
+
- 819200
|
| 71 |
+
freeze_param: []
|
| 72 |
+
g2p: null
|
| 73 |
+
grad_clip: 1.0
|
| 74 |
+
grad_clip_type: 2.0
|
| 75 |
+
grad_noise: false
|
| 76 |
+
ignore_init_mismatch: false
|
| 77 |
+
init_param: []
|
| 78 |
+
iterator_type: sequence
|
| 79 |
+
keep_nbest_models: 5
|
| 80 |
+
local_rank: 0
|
| 81 |
+
log_interval: null
|
| 82 |
+
log_level: INFO
|
| 83 |
+
max_cache_fd: 32
|
| 84 |
+
max_cache_size: 0.0
|
| 85 |
+
max_epoch: 1000
|
| 86 |
+
model_conf: {}
|
| 87 |
+
multi_task_dataset: false
|
| 88 |
+
multiple_iterator: false
|
| 89 |
+
multiprocessing_distributed: true
|
| 90 |
+
nbest_averaging_interval: 0
|
| 91 |
+
ngpu: 1
|
| 92 |
+
no_forward_run: false
|
| 93 |
+
non_linguistic_symbols: null
|
| 94 |
+
normalize: global_mvn
|
| 95 |
+
normalize_conf:
|
| 96 |
+
stats_file: /home/speech/Suji/FS2/Fastspeech2_HS/Models_ph3/Dogri_fem_mono/feats_stats.npz
|
| 97 |
+
num_att_plot: 3
|
| 98 |
+
num_cache_chunks: 1024
|
| 99 |
+
num_iters_per_epoch: 800
|
| 100 |
+
num_workers: 1
|
| 101 |
+
odim: null
|
| 102 |
+
optim: adam
|
| 103 |
+
optim_conf:
|
| 104 |
+
lr: 1.0
|
| 105 |
+
output_dir: exp/tts_train_fastspeech2_raw_char_None
|
| 106 |
+
patience: null
|
| 107 |
+
pitch_extract: dio
|
| 108 |
+
pitch_extract_conf:
|
| 109 |
+
f0max: 400
|
| 110 |
+
f0min: 80
|
| 111 |
+
fs: 48000
|
| 112 |
+
hop_length: 1024
|
| 113 |
+
n_fft: 8192
|
| 114 |
+
reduction_factor: 1
|
| 115 |
+
pitch_normalize: global_mvn
|
| 116 |
+
pitch_normalize_conf:
|
| 117 |
+
stats_file: /home/speech/Suji/FS2/Fastspeech2_HS/Models_ph3/Dogri_fem_mono/pitch_stats.npz
|
| 118 |
+
pretrain_path: null
|
| 119 |
+
print_config: false
|
| 120 |
+
required:
|
| 121 |
+
- output_dir
|
| 122 |
+
- token_list
|
| 123 |
+
resume: true
|
| 124 |
+
save_strategy: all
|
| 125 |
+
scheduler: noamlr
|
| 126 |
+
scheduler_conf:
|
| 127 |
+
model_size: 384
|
| 128 |
+
warmup_steps: 4000
|
| 129 |
+
seed: 0
|
| 130 |
+
sharded_ddp: false
|
| 131 |
+
shuffle_within_batch: false
|
| 132 |
+
sort_batch: descending
|
| 133 |
+
sort_in_batch: descending
|
| 134 |
+
token_list:
|
| 135 |
+
- <blank>
|
| 136 |
+
- <unk>
|
| 137 |
+
- <space>
|
| 138 |
+
- $
|
| 139 |
+
- ','
|
| 140 |
+
- .
|
| 141 |
+
- M
|
| 142 |
+
- q
|
| 143 |
+
- H
|
| 144 |
+
- k
|
| 145 |
+
- "\u0916"
|
| 146 |
+
- g
|
| 147 |
+
- "\u0918"
|
| 148 |
+
- "\u0919"
|
| 149 |
+
- c
|
| 150 |
+
- C
|
| 151 |
+
- j
|
| 152 |
+
- J
|
| 153 |
+
- "\u091E"
|
| 154 |
+
- "\u091F"
|
| 155 |
+
- "\u0920"
|
| 156 |
+
- "\u0921"
|
| 157 |
+
- "\u0922"
|
| 158 |
+
- "\u0923"
|
| 159 |
+
- t
|
| 160 |
+
- "\u0925"
|
| 161 |
+
- d
|
| 162 |
+
- "\u0927"
|
| 163 |
+
- n
|
| 164 |
+
- "\u0929"
|
| 165 |
+
- p
|
| 166 |
+
- P
|
| 167 |
+
- b
|
| 168 |
+
- B
|
| 169 |
+
- m
|
| 170 |
+
- y
|
| 171 |
+
- r
|
| 172 |
+
- "\u0931"
|
| 173 |
+
- l
|
| 174 |
+
- "\u0D33"
|
| 175 |
+
- Z
|
| 176 |
+
- w
|
| 177 |
+
- "\u0936"
|
| 178 |
+
- "\u0937"
|
| 179 |
+
- s
|
| 180 |
+
- h
|
| 181 |
+
- Y
|
| 182 |
+
- "\u093D"
|
| 183 |
+
- "\u0915"
|
| 184 |
+
- K
|
| 185 |
+
- G
|
| 186 |
+
- z
|
| 187 |
+
- D
|
| 188 |
+
- T
|
| 189 |
+
- f
|
| 190 |
+
- "\u0960"
|
| 191 |
+
- "\u0D7A"
|
| 192 |
+
- N
|
| 193 |
+
- "\u0D7C"
|
| 194 |
+
- "\u0D7D"
|
| 195 |
+
- "\u0D7E"
|
| 196 |
+
- a
|
| 197 |
+
- A
|
| 198 |
+
- i
|
| 199 |
+
- I
|
| 200 |
+
- u
|
| 201 |
+
- U
|
| 202 |
+
- R
|
| 203 |
+
- "\u090D"
|
| 204 |
+
- e
|
| 205 |
+
- E
|
| 206 |
+
- "\u0910"
|
| 207 |
+
- "\u0911"
|
| 208 |
+
- o
|
| 209 |
+
- O
|
| 210 |
+
- "\u0914"
|
| 211 |
+
- "\u0B89"
|
| 212 |
+
- <sos/eos>
|
| 213 |
+
token_type: char
|
| 214 |
+
train_data_path_and_name_and_type:
|
| 215 |
+
- - dump/raw/tr_no_dev/text
|
| 216 |
+
- text
|
| 217 |
+
- text
|
| 218 |
+
- - duration_info/tr_no_dev/durations
|
| 219 |
+
- durations
|
| 220 |
+
- text_int
|
| 221 |
+
- - dump/raw/tr_no_dev/wav.scp
|
| 222 |
+
- speech
|
| 223 |
+
- sound
|
| 224 |
+
- - exp/tts_stats_raw_char_None/train/collect_feats/pitch.scp
|
| 225 |
+
- pitch
|
| 226 |
+
- npy
|
| 227 |
+
- - exp/tts_stats_raw_char_None/train/collect_feats/energy.scp
|
| 228 |
+
- energy
|
| 229 |
+
- npy
|
| 230 |
+
train_dtype: float32
|
| 231 |
+
train_shape_file:
|
| 232 |
+
- exp/tts_stats_raw_char_None/train/text_shape.char
|
| 233 |
+
- exp/tts_stats_raw_char_None/train/speech_shape
|
| 234 |
+
tts: fastspeech2
|
| 235 |
+
tts_conf:
|
| 236 |
+
adim: 384
|
| 237 |
+
aheads: 2
|
| 238 |
+
decoder_normalize_before: true
|
| 239 |
+
dlayers: 4
|
| 240 |
+
dunits: 1536
|
| 241 |
+
duration_predictor_chans: 256
|
| 242 |
+
duration_predictor_kernel_size: 3
|
| 243 |
+
duration_predictor_layers: 2
|
| 244 |
+
elayers: 4
|
| 245 |
+
encoder_normalize_before: true
|
| 246 |
+
energy_embed_dropout: 0.0
|
| 247 |
+
energy_embed_kernel_size: 1
|
| 248 |
+
energy_predictor_chans: 256
|
| 249 |
+
energy_predictor_dropout: 0.5
|
| 250 |
+
energy_predictor_kernel_size: 3
|
| 251 |
+
energy_predictor_layers: 2
|
| 252 |
+
eunits: 1536
|
| 253 |
+
init_dec_alpha: 1.0
|
| 254 |
+
init_enc_alpha: 1.0
|
| 255 |
+
init_type: xavier_uniform
|
| 256 |
+
pitch_embed_dropout: 0.0
|
| 257 |
+
pitch_embed_kernel_size: 1
|
| 258 |
+
pitch_predictor_chans: 256
|
| 259 |
+
pitch_predictor_dropout: 0.5
|
| 260 |
+
pitch_predictor_kernel_size: 5
|
| 261 |
+
pitch_predictor_layers: 5
|
| 262 |
+
positionwise_conv_kernel_size: 3
|
| 263 |
+
positionwise_layer_type: conv1d
|
| 264 |
+
postnet_chans: 256
|
| 265 |
+
postnet_filts: 5
|
| 266 |
+
postnet_layers: 5
|
| 267 |
+
reduction_factor: 1
|
| 268 |
+
stop_gradient_from_energy_predictor: false
|
| 269 |
+
stop_gradient_from_pitch_predictor: true
|
| 270 |
+
transformer_dec_attn_dropout_rate: 0.2
|
| 271 |
+
transformer_dec_dropout_rate: 0.2
|
| 272 |
+
transformer_dec_positional_dropout_rate: 0.2
|
| 273 |
+
transformer_enc_attn_dropout_rate: 0.2
|
| 274 |
+
transformer_enc_dropout_rate: 0.2
|
| 275 |
+
transformer_enc_positional_dropout_rate: 0.2
|
| 276 |
+
use_masking: true
|
| 277 |
+
use_scaled_pos_enc: true
|
| 278 |
+
unused_parameters: false
|
| 279 |
+
use_adapter: false
|
| 280 |
+
use_amp: false
|
| 281 |
+
use_deepspeed: false
|
| 282 |
+
use_matplotlib: true
|
| 283 |
+
use_preprocessor: true
|
| 284 |
+
use_tensorboard: true
|
| 285 |
+
use_tf32: false
|
| 286 |
+
use_wandb: false
|
| 287 |
+
val_scheduler_criterion:
|
| 288 |
+
- valid
|
| 289 |
+
- loss
|
| 290 |
+
valid_batch_bins: null
|
| 291 |
+
valid_batch_size: null
|
| 292 |
+
valid_batch_type: null
|
| 293 |
+
valid_data_path_and_name_and_type:
|
| 294 |
+
- - dump/raw/dev/text
|
| 295 |
+
- text
|
| 296 |
+
- text
|
| 297 |
+
- - duration_info/dev/durations
|
| 298 |
+
- durations
|
| 299 |
+
- text_int
|
| 300 |
+
- - dump/raw/dev/wav.scp
|
| 301 |
+
- speech
|
| 302 |
+
- sound
|
| 303 |
+
- - exp/tts_stats_raw_char_None/valid/collect_feats/pitch.scp
|
| 304 |
+
- pitch
|
| 305 |
+
- npy
|
| 306 |
+
- - exp/tts_stats_raw_char_None/valid/collect_feats/energy.scp
|
| 307 |
+
- energy
|
| 308 |
+
- npy
|
| 309 |
+
valid_iterator_type: null
|
| 310 |
+
valid_max_cache_size: null
|
| 311 |
+
valid_shape_file:
|
| 312 |
+
- exp/tts_stats_raw_char_None/valid/text_shape.char
|
| 313 |
+
- exp/tts_stats_raw_char_None/valid/speech_shape
|
| 314 |
+
version: '202412'
|
| 315 |
+
wandb_entity: null
|
| 316 |
+
wandb_id: null
|
| 317 |
+
wandb_model_log_interval: -1
|
| 318 |
+
wandb_name: null
|
| 319 |
+
wandb_project: null
|
| 320 |
+
write_collected_feats: false
|
dogri_latest/female/model/energy_stats.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0fb130c5668e5ed45e934c17a1538a8756c5eb9c68815ba5d32533e45852eb3a
|
| 3 |
+
size 770
|
dogri_latest/female/model/feats_stats.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b19d99c343e9d668bd1823dc2ca76ded554b799251ff82714836b467044f1f6b
|
| 3 |
+
size 2042
|