Add config/everyvoice-shared-text.yaml for Chichewa
Browse files
config/everyvoice-shared-text.yaml
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
cleaners: [everyvoice.utils.collapse_whitespace, everyvoice.utils.strip_text]
|
| 2 |
+
g2p_engines: {}
|
| 3 |
+
symbols:
|
| 4 |
+
open-bible-chichewa_characters: ['0', '1', '2', '3', '4', '5', '6', '7', '8', '9',
|
| 5 |
+
A, B, C, D, E, F, G, H, I, J, K, L, M, N, O, P, R, S, T, U, V, W, Y, Z, a, b,
|
| 6 |
+
c, d, e, f, g, h, i, j, k, l, m, n, o, p, r, s, t, u, v, w, y, z, , ʼ, ‘, ’]
|
| 7 |
+
open-bible-chichewa_phones: [a, b, d, e, f, h, i, j, k, l, m, n, o, p, r, s, t,
|
| 8 |
+
t͡ʃ, u, v, w, z, ɡ, ʒ, ʔ]
|
| 9 |
+
punctuation:
|
| 10 |
+
colons: [':']
|
| 11 |
+
commas: [',']
|
| 12 |
+
ellipses: […]
|
| 13 |
+
exclamations: ['!', ¡]
|
| 14 |
+
hyphens: ['-', —, '*']
|
| 15 |
+
parentheses: [(, ), '[', ']', '{', '}']
|
| 16 |
+
periods: [.]
|
| 17 |
+
question_symbols: ['?', ¿]
|
| 18 |
+
quotemarks: ['"', '''', “, ”, «, »]
|
| 19 |
+
semi_colons: [;]
|
| 20 |
+
silence: [<SIL>]
|
| 21 |
+
to_replace: {}
|