codebyzeb committed on
Commit
536c48c
·
verified ·
1 Parent(s): af683c0

Final model for experiment Serbian

Browse files
Files changed (6) hide show
  1. README.md +47 -47
  2. config.json +1 -1
  3. model.safetensors +2 -2
  4. tokenizer.json +30 -44
  5. training_args.bin +1 -1
  6. vocab.json +1 -1
README.md CHANGED
@@ -1,7 +1,7 @@
1
  ---
2
  library_name: transformers
3
  tags:
4
- - Welsh
5
  - generated_from_trainer
6
  model-index:
7
  - name: childes-segmentation-100k-gpt2_lm-model
@@ -16,53 +16,53 @@ should probably proofread and complete it, then remove this comment. -->
16
  This model is a fine-tuned version of [an unspecified base model](https://huggingface.co/) on an unknown dataset.
17
  It achieves the following results on the evaluation set:
18
  - epoch: 4000.0
19
- - eval_absolute_seg_boundary_fscore_Boundary Prediction: 0.5797
20
- - eval_absolute_seg_boundary_fscore_Entropy: 0.5438
21
- - eval_absolute_seg_boundary_fscore_Increase in Boundary Prediction: 0.6442
22
- - eval_absolute_seg_boundary_fscore_Increase in Entropy: 0.6066
23
- - eval_absolute_seg_boundary_fscore_Increase in Loss: 0.6391
24
- - eval_absolute_seg_boundary_fscore_Increase in Rank: 0.6575
25
- - eval_absolute_seg_boundary_fscore_Loss: 0.5624
26
- - eval_absolute_seg_boundary_fscore_Majority Vote Cutoff: 0.6868
27
- - eval_absolute_seg_boundary_fscore_Majority Vote Spike: 0.6908
28
- - eval_absolute_seg_boundary_fscore_Rank: 0.5692
29
- - eval_absolute_seg_type_fscore_Boundary Prediction: 0.1765
30
- - eval_absolute_seg_type_fscore_Entropy: 0.2690
31
- - eval_absolute_seg_type_fscore_Increase in Boundary Prediction: 0.1667
32
- - eval_absolute_seg_type_fscore_Increase in Entropy: 0.3180
33
- - eval_absolute_seg_type_fscore_Increase in Loss: 0.3435
34
- - eval_absolute_seg_type_fscore_Increase in Rank: 0.3938
35
- - eval_absolute_seg_type_fscore_Loss: 0.2270
36
- - eval_absolute_seg_type_fscore_Majority Vote Cutoff: 0.3964
37
- - eval_absolute_seg_type_fscore_Majority Vote Spike: 0.4137
38
- - eval_absolute_seg_type_fscore_Rank: 0.2869
39
- - eval_bpc: 4.3835
40
- - eval_loss: 3.0384
41
  - eval_model_preparation_time: 0.0008
42
- - eval_perplexity: 20.8724
43
- - eval_runtime: 7.5077
44
- - eval_samples_per_second: 21.711
45
- - eval_spike_seg_boundary_fscore_Boundary Prediction: 0.6793
46
- - eval_spike_seg_boundary_fscore_Entropy: 0.5896
47
- - eval_spike_seg_boundary_fscore_Increase in Boundary Prediction: 0.6781
48
- - eval_spike_seg_boundary_fscore_Increase in Entropy: 0.6219
49
- - eval_spike_seg_boundary_fscore_Increase in Loss: 0.6493
50
- - eval_spike_seg_boundary_fscore_Increase in Rank: 0.6472
51
- - eval_spike_seg_boundary_fscore_Loss: 0.5906
52
- - eval_spike_seg_boundary_fscore_Majority Vote Cutoff: 0.7049
53
- - eval_spike_seg_boundary_fscore_Majority Vote Spike: 0.6959
54
- - eval_spike_seg_boundary_fscore_Rank: 0.5967
55
- - eval_spike_seg_type_fscore_Boundary Prediction: 0.344
56
- - eval_spike_seg_type_fscore_Entropy: 0.2832
57
- - eval_spike_seg_type_fscore_Increase in Boundary Prediction: 0.3373
58
- - eval_spike_seg_type_fscore_Increase in Entropy: 0.2921
59
- - eval_spike_seg_type_fscore_Increase in Loss: 0.3162
60
- - eval_spike_seg_type_fscore_Increase in Rank: 0.3674
61
- - eval_spike_seg_type_fscore_Loss: 0.2706
62
- - eval_spike_seg_type_fscore_Majority Vote Cutoff: 0.3896
63
- - eval_spike_seg_type_fscore_Majority Vote Spike: 0.3279
64
- - eval_spike_seg_type_fscore_Rank: 0.3246
65
- - eval_steps_per_second: 0.799
66
  - step: 100000
67
 
68
  ## Model description
 
1
  ---
2
  library_name: transformers
3
  tags:
4
+ - Serbian
5
  - generated_from_trainer
6
  model-index:
7
  - name: childes-segmentation-100k-gpt2_lm-model
 
16
  This model is a fine-tuned version of [an unspecified base model](https://huggingface.co/) on an unknown dataset.
17
  It achieves the following results on the evaluation set:
18
  - epoch: 4000.0
19
+ - eval_absolute_seg_boundary_fscore_Boundary Prediction: 0.5470
20
+ - eval_absolute_seg_boundary_fscore_Entropy: 0.4522
21
+ - eval_absolute_seg_boundary_fscore_Increase in Boundary Prediction: 0.5803
22
+ - eval_absolute_seg_boundary_fscore_Increase in Entropy: 0.4833
23
+ - eval_absolute_seg_boundary_fscore_Increase in Loss: 0.5784
24
+ - eval_absolute_seg_boundary_fscore_Increase in Rank: 0.6139
25
+ - eval_absolute_seg_boundary_fscore_Loss: 0.4960
26
+ - eval_absolute_seg_boundary_fscore_Majority Vote Cutoff: 0.6259
27
+ - eval_absolute_seg_boundary_fscore_Majority Vote Spike: 0.6291
28
+ - eval_absolute_seg_boundary_fscore_Rank: 0.5341
29
+ - eval_absolute_seg_type_fscore_Boundary Prediction: 0.3005
30
+ - eval_absolute_seg_type_fscore_Entropy: 0.2714
31
+ - eval_absolute_seg_type_fscore_Increase in Boundary Prediction: 0.3422
32
+ - eval_absolute_seg_type_fscore_Increase in Entropy: 0.2764
33
+ - eval_absolute_seg_type_fscore_Increase in Loss: 0.3523
34
+ - eval_absolute_seg_type_fscore_Increase in Rank: 0.3931
35
+ - eval_absolute_seg_type_fscore_Loss: 0.2706
36
+ - eval_absolute_seg_type_fscore_Majority Vote Cutoff: 0.4061
37
+ - eval_absolute_seg_type_fscore_Majority Vote Spike: 0.3590
38
+ - eval_absolute_seg_type_fscore_Rank: 0.2985
39
+ - eval_bpc: 4.5128
40
+ - eval_loss: 3.1280
41
  - eval_model_preparation_time: 0.0008
42
+ - eval_perplexity: 22.8288
43
+ - eval_runtime: 12.2624
44
+ - eval_samples_per_second: 12.151
45
+ - eval_spike_seg_boundary_fscore_Boundary Prediction: 0.5811
46
+ - eval_spike_seg_boundary_fscore_Entropy: 0.4902
47
+ - eval_spike_seg_boundary_fscore_Increase in Boundary Prediction: 0.5768
48
+ - eval_spike_seg_boundary_fscore_Increase in Entropy: 0.4836
49
+ - eval_spike_seg_boundary_fscore_Increase in Loss: 0.5501
50
+ - eval_spike_seg_boundary_fscore_Increase in Rank: 0.5845
51
+ - eval_spike_seg_boundary_fscore_Loss: 0.5259
52
+ - eval_spike_seg_boundary_fscore_Majority Vote Cutoff: 0.6380
53
+ - eval_spike_seg_boundary_fscore_Majority Vote Spike: 0.6029
54
+ - eval_spike_seg_boundary_fscore_Rank: 0.5890
55
+ - eval_spike_seg_type_fscore_Boundary Prediction: 0.2831
56
+ - eval_spike_seg_type_fscore_Entropy: 0.2583
57
+ - eval_spike_seg_type_fscore_Increase in Boundary Prediction: 0.2799
58
+ - eval_spike_seg_type_fscore_Increase in Entropy: 0.2175
59
+ - eval_spike_seg_type_fscore_Increase in Loss: 0.2712
60
+ - eval_spike_seg_type_fscore_Increase in Rank: 0.3042
61
+ - eval_spike_seg_type_fscore_Loss: 0.2594
62
+ - eval_spike_seg_type_fscore_Majority Vote Cutoff: 0.3492
63
+ - eval_spike_seg_type_fscore_Majority Vote Spike: 0.2747
64
+ - eval_spike_seg_type_fscore_Rank: 0.3375
65
+ - eval_steps_per_second: 0.408
66
  - step: 100000
67
 
68
  ## Model description
config.json CHANGED
@@ -27,5 +27,5 @@
27
  "torch_dtype": "float32",
28
  "transformers_version": "4.44.2",
29
  "use_cache": true,
30
- "vocab_size": 48
31
  }
 
27
  "torch_dtype": "float32",
28
  "transformers_version": "4.44.2",
29
  "use_cache": true,
30
+ "vocab_size": 34
31
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:78f6926d87d45b54c7fa5fdcbca74dd73ac3ef421ef2beeb587acfa2ecb88b76
3
- size 2539800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efe533efbd0b31c095b2145cb7c348667d0ec3699e849cc3981aa0d82694b3c0
3
+ size 2532632
tokenizer.json CHANGED
@@ -115,50 +115,36 @@
115
  "PAD": 1,
116
  "WORD_BOUNDARY": 2,
117
  "UTT_BOUNDARY": 3,
118
- "ɔ": 4,
119
- "h": 5,
120
- "m": 6,
121
- "ai": 7,
122
- "ɛ": 8,
123
- "r": 9,
124
- "t": 10,
125
- "ɑː": 11,
126
- "p": 12,
127
- "d": 13,
128
- "": 14,
129
- "b": 15,
130
- "": 16,
131
- "f": 17,
132
- "": 18,
133
- "χ": 19,
134
- "w": 20,
135
- "a": 21,
136
- "n": 22,
137
- "ø": 23,
138
- "j": 24,
139
- "au": 25,
140
- "ə": 26,
141
- "ɔi": 27,
142
- "ð": 28,
143
- "ɪ": 29,
144
- "s": 30,
145
- "ɡ": 31,
146
- "ʊi": 32,
147
- "ʊ": 33,
148
- "əi": 34,
149
- "θ": 35,
150
- "l": 36,
151
- "ʌ": 37,
152
- "ŋ": 38,
153
- "v": 39,
154
- "k": 40,
155
- "ɬ": 41,
156
- "ɪu": 42,
157
- "uː": 43,
158
- "ʃ": 44,
159
- "ɛu": 45,
160
- "d̠ʒ": 46,
161
- "z": 47
162
  },
163
  "unk_token": "UNK"
164
  }
 
115
  "PAD": 1,
116
  "WORD_BOUNDARY": 2,
117
  "UTT_BOUNDARY": 3,
118
+ "j": 4,
119
+ "": 5,
120
+ "s̪̻": 6,
121
+ "t̪̻": 7,
122
+ "u": 8,
123
+ "l": 9,
124
+ "": 10,
125
+ "ʒ̺": 11,
126
+ "i": 12,
127
+ "ʋ": 13,
128
+ "d̪̻": 14,
129
+ "": 15,
130
+ "m": 16,
131
+ "n": 17,
132
+ "r": 18,
133
+ "k": 19,
134
+ "t̪̻s̪̻": 20,
135
+ "p": 21,
136
+ "ʃ̺": 22,
137
+ "x": 23,
138
+ "b": 24,
139
+ "ɡ": 25,
140
+ "t̻ʃ̻": 26,
141
+ "f": 27,
142
+ "z̪̻": 28,
143
+ "ɲ": 29,
144
+ "ʎ": 30,
145
+ "d̻ʒ̻": 31,
146
+ "y": 32,
147
+ "w": 33
 
 
 
 
 
 
 
 
 
 
 
 
 
 
148
  },
149
  "unk_token": "UNK"
150
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:193dccba324f20834b381484ac1135bae01184adac5a817a5c4fd3bb127ce078
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52482822ae0aead84723e50320eafa35fe04b4377ff02a99470964996e89b1f0
3
  size 5368
vocab.json CHANGED
@@ -1 +1 @@
1
- {"UNK":0,"PAD":1,"WORD_BOUNDARY":2,"UTT_BOUNDARY":3,"ɔ":4,"h":5,"m":6,"ai":7,"ɛ":8,"r":9,"t":10,"ɑː":11,"p":12,"d":13,"":14,"b":15,"":16,"f":17,"":18,"χ":19,"w":20,"a":21,"n":22,"ø":23,"j":24,"au":25,"ə":26,"ɔi":27,"ð":28,"ɪ":29,"s":30,"ɡ":31,"ʊi":32,"ʊ":33,"əi":34,"θ":35,"l":36,"ʌ":37,"ŋ":38,"v":39,"k":40,"ɬ":41,"ɪu":42,"uː":43,"ʃ":44,"ɛu":45,"d̠ʒ":46,"z":47}
 
1
+ {"UNK":0,"PAD":1,"WORD_BOUNDARY":2,"UTT_BOUNDARY":3,"j":4,"":5,"s̪̻":6,"t̪̻":7,"u":8,"l":9,"":10,"ʒ̺":11,"i":12,"ʋ":13,"d̪̻":14,"":15,"m":16,"n":17,"r":18,"k":19,"t̪̻s̪̻":20,"p":21,"ʃ̺":22,"x":23,"b":24,"ɡ":25,"t̻ʃ̻":26,"f":27,"z̪̻":28,"ɲ":29,"ʎ":30,"d̻ʒ̻":31,"y":32,"w":33}