mattbonnell committed on
Commit
4a6c3ec
·
verified ·
1 Parent(s): a316a22

Upload tokenizer

Browse files
Files changed (2) hide show
  1. README.md +1 -1
  2. vocab.json +48 -48
README.md CHANGED
@@ -1,8 +1,8 @@
1
  ---
2
  license: apache-2.0
3
- base_model: mattbonnell/wav2vec2-base-wonders-phonemes
4
  tags:
5
  - generated_from_trainer
 
6
  datasets:
7
  - transcribed_calls
8
  model-index:
 
1
  ---
2
  license: apache-2.0
 
3
  tags:
4
  - generated_from_trainer
5
+ base_model: mattbonnell/wav2vec2-base-wonders-phonemes
6
  datasets:
7
  - transcribed_calls
8
  model-index:
vocab.json CHANGED
@@ -1,52 +1,52 @@
1
  {
2
  "[PAD]": 49,
3
  "[UNK]": 48,
4
- "a": 29,
5
- "b": 10,
6
- "c": 34,
7
- "d": 17,
8
- "e": 33,
9
- "f": 31,
10
- "h": 11,
11
- "i": 24,
12
- "j": 42,
13
- "k": 20,
14
- "l": 30,
15
- "m": 7,
16
- "n": 35,
17
- "o": 5,
18
- "p": 40,
19
- "r": 18,
20
- "s": 37,
21
- "t": 43,
22
- "u": 14,
23
- "v": 45,
24
- "w": 23,
25
- "y": 2,
26
- "z": 12,
27
- "|": 19,
28
- "æ": 47,
29
- "ð": 26,
30
- "ŋ": 27,
31
- "ɐ": 1,
32
- "ɑ": 38,
33
- "ɔ": 32,
34
- "ə": 44,
35
- "ɚ": 0,
36
- "ɛ": 41,
37
- "ɜ": 46,
38
- "ɡ": 36,
39
- "ɣ": 6,
40
- "ɪ": 25,
41
- "ɹ": 8,
42
- "ɾ": 3,
43
- "ʃ": 15,
44
- "ʊ": 13,
45
- "ʌ": 21,
46
- "ʒ": 39,
47
- "ʔ": 9,
48
- "ː": 22,
49
- "̩": 28,
50
- "θ": 16,
51
- "ᵻ": 4
52
  }
 
1
  {
2
  "[PAD]": 49,
3
  "[UNK]": 48,
4
+ "a": 0,
5
+ "b": 21,
6
+ "c": 43,
7
+ "d": 46,
8
+ "e": 7,
9
+ "f": 3,
10
+ "h": 27,
11
+ "i": 44,
12
+ "j": 31,
13
+ "k": 14,
14
+ "l": 29,
15
+ "m": 22,
16
+ "n": 24,
17
+ "o": 12,
18
+ "p": 9,
19
+ "r": 15,
20
+ "s": 17,
21
+ "t": 6,
22
+ "u": 33,
23
+ "v": 2,
24
+ "w": 8,
25
+ "y": 18,
26
+ "z": 1,
27
+ "|": 42,
28
+ "æ": 28,
29
+ "ð": 19,
30
+ "ŋ": 20,
31
+ "ɐ": 47,
32
+ "ɑ": 32,
33
+ "ɔ": 35,
34
+ "ə": 10,
35
+ "ɚ": 16,
36
+ "ɛ": 4,
37
+ "ɜ": 38,
38
+ "ɡ": 37,
39
+ "ɣ": 41,
40
+ "ɪ": 5,
41
+ "ɹ": 11,
42
+ "ɾ": 40,
43
+ "ʃ": 26,
44
+ "ʊ": 23,
45
+ "ʌ": 25,
46
+ "ʒ": 13,
47
+ "ʔ": 34,
48
+ "ː": 45,
49
+ "̩": 39,
50
+ "θ": 36,
51
+ "ᵻ": 30
52
  }