codebyzeb committed on
Commit
cd1df9a
·
verified ·
1 Parent(s): 536c48c

Final model for experiment Indonesian

Browse files
Files changed (6) hide show
  1. README.md +47 -47
  2. config.json +1 -1
  3. model.safetensors +2 -2
  4. tokenizer.json +25 -28
  5. training_args.bin +1 -1
  6. vocab.json +1 -1
README.md CHANGED
@@ -1,7 +1,7 @@
1
  ---
2
  library_name: transformers
3
  tags:
4
- - Serbian
5
  - generated_from_trainer
6
  model-index:
7
  - name: childes-segmentation-100k-gpt2_lm-model
@@ -16,53 +16,53 @@ should probably proofread and complete it, then remove this comment. -->
16
  This model is a fine-tuned version of [](https://huggingface.co/) on an unknown dataset.
17
  It achieves the following results on the evaluation set:
18
  - epoch: 4000.0
19
- - eval_absolute_seg_boundary_fscore_Boundary Prediction: 0.5470
20
- - eval_absolute_seg_boundary_fscore_Entropy: 0.4522
21
- - eval_absolute_seg_boundary_fscore_Increase in Boundary Prediction: 0.5803
22
- - eval_absolute_seg_boundary_fscore_Increase in Entropy: 0.4833
23
- - eval_absolute_seg_boundary_fscore_Increase in Loss: 0.5784
24
- - eval_absolute_seg_boundary_fscore_Increase in Rank: 0.6139
25
- - eval_absolute_seg_boundary_fscore_Loss: 0.4960
26
- - eval_absolute_seg_boundary_fscore_Majority Vote Cutoff: 0.6259
27
- - eval_absolute_seg_boundary_fscore_Majority Vote Spike: 0.6291
28
- - eval_absolute_seg_boundary_fscore_Rank: 0.5341
29
- - eval_absolute_seg_type_fscore_Boundary Prediction: 0.3005
30
- - eval_absolute_seg_type_fscore_Entropy: 0.2714
31
- - eval_absolute_seg_type_fscore_Increase in Boundary Prediction: 0.3422
32
- - eval_absolute_seg_type_fscore_Increase in Entropy: 0.2764
33
- - eval_absolute_seg_type_fscore_Increase in Loss: 0.3523
34
- - eval_absolute_seg_type_fscore_Increase in Rank: 0.3931
35
- - eval_absolute_seg_type_fscore_Loss: 0.2706
36
- - eval_absolute_seg_type_fscore_Majority Vote Cutoff: 0.4061
37
- - eval_absolute_seg_type_fscore_Majority Vote Spike: 0.3590
38
- - eval_absolute_seg_type_fscore_Rank: 0.2985
39
- - eval_bpc: 4.5128
40
- - eval_loss: 3.1280
41
  - eval_model_preparation_time: 0.0008
42
- - eval_perplexity: 22.8288
43
- - eval_runtime: 12.2624
44
- - eval_samples_per_second: 12.151
45
- - eval_spike_seg_boundary_fscore_Boundary Prediction: 0.5811
46
- - eval_spike_seg_boundary_fscore_Entropy: 0.4902
47
- - eval_spike_seg_boundary_fscore_Increase in Boundary Prediction: 0.5768
48
- - eval_spike_seg_boundary_fscore_Increase in Entropy: 0.4836
49
- - eval_spike_seg_boundary_fscore_Increase in Loss: 0.5501
50
- - eval_spike_seg_boundary_fscore_Increase in Rank: 0.5845
51
- - eval_spike_seg_boundary_fscore_Loss: 0.5259
52
- - eval_spike_seg_boundary_fscore_Majority Vote Cutoff: 0.6380
53
- - eval_spike_seg_boundary_fscore_Majority Vote Spike: 0.6029
54
- - eval_spike_seg_boundary_fscore_Rank: 0.5890
55
- - eval_spike_seg_type_fscore_Boundary Prediction: 0.2831
56
- - eval_spike_seg_type_fscore_Entropy: 0.2583
57
- - eval_spike_seg_type_fscore_Increase in Boundary Prediction: 0.2799
58
- - eval_spike_seg_type_fscore_Increase in Entropy: 0.2175
59
- - eval_spike_seg_type_fscore_Increase in Loss: 0.2712
60
- - eval_spike_seg_type_fscore_Increase in Rank: 0.3042
61
- - eval_spike_seg_type_fscore_Loss: 0.2594
62
- - eval_spike_seg_type_fscore_Majority Vote Cutoff: 0.3492
63
- - eval_spike_seg_type_fscore_Majority Vote Spike: 0.2747
64
- - eval_spike_seg_type_fscore_Rank: 0.3375
65
- - eval_steps_per_second: 0.408
66
  - step: 100000
67
 
68
  ## Model description
 
1
  ---
2
  library_name: transformers
3
  tags:
4
+ - Indonesian
5
  - generated_from_trainer
6
  model-index:
7
  - name: childes-segmentation-100k-gpt2_lm-model
 
16
  This model is a fine-tuned version of [](https://huggingface.co/) on an unknown dataset.
17
  It achieves the following results on the evaluation set:
18
  - epoch: 4000.0
19
+ - eval_absolute_seg_boundary_fscore_Boundary Prediction: 0.5187
20
+ - eval_absolute_seg_boundary_fscore_Entropy: 0.4017
21
+ - eval_absolute_seg_boundary_fscore_Increase in Boundary Prediction: 0.5413
22
+ - eval_absolute_seg_boundary_fscore_Increase in Entropy: 0.4616
23
+ - eval_absolute_seg_boundary_fscore_Increase in Loss: 0.5806
24
+ - eval_absolute_seg_boundary_fscore_Increase in Rank: 0.6071
25
+ - eval_absolute_seg_boundary_fscore_Loss: 0.4839
26
+ - eval_absolute_seg_boundary_fscore_Majority Vote Cutoff: 0.6298
27
+ - eval_absolute_seg_boundary_fscore_Majority Vote Spike: 0.6048
28
+ - eval_absolute_seg_boundary_fscore_Rank: 0.5122
29
+ - eval_absolute_seg_type_fscore_Boundary Prediction: 0.3513
30
+ - eval_absolute_seg_type_fscore_Entropy: 0.2802
31
+ - eval_absolute_seg_type_fscore_Increase in Boundary Prediction: 0.3813
32
+ - eval_absolute_seg_type_fscore_Increase in Entropy: 0.3222
33
+ - eval_absolute_seg_type_fscore_Increase in Loss: 0.3824
34
+ - eval_absolute_seg_type_fscore_Increase in Rank: 0.4208
35
+ - eval_absolute_seg_type_fscore_Loss: 0.3151
36
+ - eval_absolute_seg_type_fscore_Majority Vote Cutoff: 0.4692
37
+ - eval_absolute_seg_type_fscore_Majority Vote Spike: 0.4276
38
+ - eval_absolute_seg_type_fscore_Rank: 0.3621
39
+ - eval_bpc: 4.2803
40
+ - eval_loss: 2.9669
41
  - eval_model_preparation_time: 0.0008
42
+ - eval_perplexity: 19.4309
43
+ - eval_runtime: 23.9581
44
+ - eval_samples_per_second: 5.426
45
+ - eval_spike_seg_boundary_fscore_Boundary Prediction: 0.5220
46
+ - eval_spike_seg_boundary_fscore_Entropy: 0.4477
47
+ - eval_spike_seg_boundary_fscore_Increase in Boundary Prediction: 0.5144
48
+ - eval_spike_seg_boundary_fscore_Increase in Entropy: 0.4307
49
+ - eval_spike_seg_boundary_fscore_Increase in Loss: 0.5371
50
+ - eval_spike_seg_boundary_fscore_Increase in Rank: 0.5614
51
+ - eval_spike_seg_boundary_fscore_Loss: 0.5245
52
+ - eval_spike_seg_boundary_fscore_Majority Vote Cutoff: 0.5996
53
+ - eval_spike_seg_boundary_fscore_Majority Vote Spike: 0.5457
54
+ - eval_spike_seg_boundary_fscore_Rank: 0.5726
55
+ - eval_spike_seg_type_fscore_Boundary Prediction: 0.2919
56
+ - eval_spike_seg_type_fscore_Entropy: 0.2635
57
+ - eval_spike_seg_type_fscore_Increase in Boundary Prediction: 0.2716
58
+ - eval_spike_seg_type_fscore_Increase in Entropy: 0.2197
59
+ - eval_spike_seg_type_fscore_Increase in Loss: 0.2948
60
+ - eval_spike_seg_type_fscore_Increase in Rank: 0.3411
61
+ - eval_spike_seg_type_fscore_Loss: 0.2883
62
+ - eval_spike_seg_type_fscore_Majority Vote Cutoff: 0.4045
63
+ - eval_spike_seg_type_fscore_Majority Vote Spike: 0.2782
64
+ - eval_spike_seg_type_fscore_Rank: 0.3612
65
+ - eval_steps_per_second: 0.209
66
  - step: 100000
67
 
68
  ## Model description
config.json CHANGED
@@ -27,5 +27,5 @@
27
  "torch_dtype": "float32",
28
  "transformers_version": "4.44.2",
29
  "use_cache": true,
30
- "vocab_size": 34
31
  }
 
27
  "torch_dtype": "float32",
28
  "transformers_version": "4.44.2",
29
  "use_cache": true,
30
+ "vocab_size": 31
31
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:efe533efbd0b31c095b2145cb7c348667d0ec3699e849cc3981aa0d82694b3c0
3
- size 2532632
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84fe774c468a033f724e41b8a5406299e48e82cccf7326ca4da90e906360fbcc
3
+ size 2531096
tokenizer.json CHANGED
@@ -115,36 +115,33 @@
115
  "PAD": 1,
116
  "WORD_BOUNDARY": 2,
117
  "UTT_BOUNDARY": 3,
118
- "j": 4,
119
- "": 5,
120
- "s̪̻": 6,
121
- "t̪̻": 7,
122
- "u": 8,
123
- "l": 9,
124
- "": 10,
125
- "ʒ̺": 11,
126
- "i": 12,
127
- "ʋ": 13,
128
- "d̪̻": 14,
129
- "": 15,
130
- "m": 16,
131
- "n": 17,
132
- "r": 18,
133
- "k": 19,
134
- "t̪̻s̪̻": 20,
135
  "p": 21,
136
- "ʃ̺": 22,
137
- "x": 23,
138
- "b": 24,
139
- "ɡ": 25,
140
- "t̻ʃ̻": 26,
141
  "f": 27,
142
- "z̪̻": 28,
143
- "ɲ": 29,
144
- "ʎ": 30,
145
- "d̻ʒ̻": 31,
146
- "y": 32,
147
- "w": 33
148
  },
149
  "unk_token": "UNK"
150
  }
 
115
  "PAD": 1,
116
  "WORD_BOUNDARY": 2,
117
  "UTT_BOUNDARY": 3,
118
+ "s": 4,
119
+ "i": 5,
120
+ "n": 6,
121
+ "m": 7,
122
+ "a": 8,
123
+ "j": 9,
124
+ "u": 10,
125
+ "k": 11,
126
+ "o": 12,
127
+ "h": 13,
128
+ "l": 14,
129
+ "t": 15,
130
+ "w": 16,
131
+ "d̠ʒ": 17,
132
+ "ŋ": 18,
133
+ "ə": 19,
134
+ "d": 20,
135
  "p": 21,
136
+ "ɡ": 22,
137
+ "b": 23,
138
+ "r": 24,
139
+ "ɲ": 25,
140
+ "t̠ʃ": 26,
141
  "f": 27,
142
+ "z": 28,
143
+ "ʃ": 29,
144
+ "x": 30
 
 
 
145
  },
146
  "unk_token": "UNK"
147
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52482822ae0aead84723e50320eafa35fe04b4377ff02a99470964996e89b1f0
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0948cb11c8ef3cbbac150d6b065e41c48eafcb71430ca203d424013a0dc9d431
3
  size 5368
vocab.json CHANGED
@@ -1 +1 @@
1
- {"UNK":0,"PAD":1,"WORD_BOUNDARY":2,"UTT_BOUNDARY":3,"j":4,"":5,"s̪̻":6,"t̪̻":7,"u":8,"l":9,"":10,"ʒ̺":11,"i":12,"ʋ":13,"d̪̻":14,"":15,"m":16,"n":17,"r":18,"k":19,"t̪̻s̪̻":20,"p":21,"ʃ̺":22,"x":23,"b":24,"ɡ":25,"t̻ʃ̻":26,"f":27,"z̪̻":28,"ɲ":29,"ʎ":30,"d̻ʒ̻":31,"y":32,"w":33}
 
1
+ {"UNK":0,"PAD":1,"WORD_BOUNDARY":2,"UTT_BOUNDARY":3,"s":4,"i":5,"n":6,"m":7,"a":8,"j":9,"u":10,"k":11,"o":12,"h":13,"l":14,"t":15,"w":16,"d̠ʒ":17,"ŋ":18,"ə":19,"d":20,"p":21,"ɡ":22,"b":23,"r":24,"ɲ":25,"t̠ʃ":26,"f":27,"z":28,"ʃ":29,"x":30}