End of training

Browse files

Files changed (11) hide show

.gitattributes +1 -0
README.md +76 -0
config.json +160 -0
model.safetensors +3 -0
runs/Mar06_01-39-41_dgx10/events.out.tfevents.1741221586.dgx10.2696097.0 +3 -0
runs/Mar06_01-55-57_dgx10/events.out.tfevents.1741222561.dgx10.2700023.0 +3 -0
runs/Mar06_01-55-57_dgx10/events.out.tfevents.1741297853.dgx10.2700023.1 +3 -0
special_tokens_map.json +52 -0
tokenizer.json +3 -0
tokenizer_config.json +102 -0
training_args.bin +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text

README.md ADDED Viewed

	@@ -0,0 +1,76 @@

+---
+library_name: transformers
+license: mit
+base_model: xlm-roberta-large
+tags:
+- generated_from_trainer
+datasets:
+- generator
+metrics:
+- accuracy
+model-index:
+- name: XLM-RoBERTa-1
+  results: []
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# XLM-RoBERTa-1
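+This model is a fine-tuned version of [xlm-roberta-large](https://huggingface.co/xlm-roberta-large) on a dataset that the Trainer recorded only as `generator` (presumably because it was built from a Python generator; the underlying corpus is not named in this card).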
+It achieves the following results on the evaluation set:
+- Loss: 0.4935
+- Accuracy: 0.9044
+- Micro Precision: 0.9044
+- Micro Recall: 0.9044
+- Micro F1: 0.9044
+- Macro Precision: 0.8822
+- Macro Recall: 0.8527
+- Macro F1: 0.8599
+## Model description
+More information needed
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 1e-05
+- train_batch_size: 12
+- eval_batch_size: 12
+- seed: 42
+- gradient_accumulation_steps: 2
+- total_train_batch_size: 24
+- optimizer: adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 (no additional optimizer arguments)
+- lr_scheduler_type: linear
+- lr_scheduler_warmup_steps: 500
+- num_epochs: 5
+### Training results
+| Training Loss | Epoch  | Step   | Validation Loss | Accuracy | Micro Precision | Micro Recall | Micro F1 | Macro Precision | Macro Recall | Macro F1 |
+|:-------------:|:------:|:------:|:---------------:|:--------:|:---------------:|:------------:|:--------:|:---------------:|:------------:|:--------:|
+| 0.3304        | 1.0000 | 40166  | 0.3911          | 0.8883   | 0.8883          | 0.8883       | 0.8883   | 0.8651          | 0.8285       | 0.8359   |
+| 0.2376        | 2.0    | 80333  | 0.3998          | 0.9014   | 0.9014          | 0.9014       | 0.9014   | 0.8714          | 0.8480       | 0.8523   |
+| 0.1733        | 3.0000 | 120499 | 0.4297          | 0.9059   | 0.9059          | 0.9059       | 0.9059   | 0.8718          | 0.8607       | 0.8610   |
+| 0.1268        | 4.0    | 160666 | 0.4822          | 0.9088   | 0.9088          | 0.9088       | 0.9088   | 0.8807          | 0.8608       | 0.8649   |
+| 0.1038        | 4.9999 | 200830 | 0.5242          | 0.9087   | 0.9087          | 0.9087       | 0.9087   | 0.8753          | 0.8646       | 0.8660   |
+### Framework versions
+- Transformers 4.46.2
+- Pytorch 2.5.1+cu124
+- Datasets 3.1.0
+- Tokenizers 0.20.3

config.json ADDED Viewed

	@@ -0,0 +1,160 @@

+{
+  "_name_or_path": "xlm-roberta-large",
+  "architectures": [
+    "RelationExtractionModel"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 0,
+  "classifier_dropout": null,
+  "eos_token_id": 2,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 1024,
+  "id2label": {
+    "0": "P0 other",
+    "1": "P19 m\u00edsto narozen\u00ed",
+    "2": "P20 m\u00edsto \u00famrt\u00ed",
+    "3": "P21 pohlav\u00ed",
+    "4": "P22 otec",
+    "5": "P25 matka",
+    "6": "P26 cho\u0165",
+    "7": "P27 st\u00e1tn\u00ed ob\u010danstv\u00ed",
+    "8": "P36 hlavn\u00ed m\u011bsto",
+    "9": "P39 ve funkci",
+    "10": "P47 hrani\u010d\u00ed s",
+    "11": "P50 autor",
+    "12": "P53 rodina",
+    "13": "P54 \u010dlen sportovn\u00edho dru\u017estva",
+    "14": "P97 \u0161lechtick\u00fd titul",
+    "15": "P101 zam\u011b\u0159en\u00ed",
+    "16": "P102 stranick\u00e1 p\u0159\u00edslu\u0161nost",
+    "17": "P105 taxonomick\u00e9 za\u0159azen\u00ed",
+    "18": "P106 povol\u00e1n\u00ed",
+    "19": "P118 liga",
+    "20": "P131 nach\u00e1z\u00ed se v administrativn\u00ed jednotce",
+    "21": "P136 \u017e\u00e1nr",
+    "22": "P137 oper\u00e1tor",
+    "23": "P138 pojmenov\u00e1no po",
+    "24": "P140 vyzn\u00e1n\u00ed",
+    "25": "P150 ni\u017e\u0161\u00ed spr\u00e1vn\u00ed celky",
+    "26": "P155 p\u0159edchoz\u00ed",
+    "27": "P159 s\u00eddlo",
+    "28": "P161 hraje",
+    "29": "P171 nad\u0159azen\u00fd taxon",
+    "30": "P175 interpret",
+    "31": "P176 v\u00fdrobce",
+    "32": "P179 s\u00e9rie",
+    "33": "P206 u vodn\u00ed plochy",
+    "34": "P264 hudebn\u00ed vydavatelstv\u00ed",
+    "35": "P276 m\u00edsto",
+    "36": "P279 nadt\u0159\u00edda",
+    "37": "P360 seznam (\u010deho)",
+    "38": "P361 \u010d\u00e1st (\u010deho)",
+    "39": "P413 pozice hr\u00e1\u010de",
+    "40": "P425 obor tohoto povol\u00e1n\u00ed",
+    "41": "P460 \u00fadajn\u011b tot\u00e9\u017e co",
+    "42": "P461 protiklad",
+    "43": "P463 \u010dlen (\u010deho)",
+    "44": "P495 zem\u011b p\u016fvodu",
+    "45": "P527 skl\u00e1d\u00e1 se z",
+    "46": "P530 diplomatick\u00fd vztah",
+    "47": "P641 sport",
+    "48": "P669 ulice",
+    "49": "P706 oblast",
+    "50": "P708 diec\u00e9ze",
+    "51": "P734 p\u0159\u00edjmen\u00ed",
+    "52": "P735 rodn\u00e9 jm\u00e9no",
+    "53": "P740 m\u00edsto vzniku",
+    "54": "P800 d\u00edlo",
+    "55": "P921 hlavn\u00ed t\u00e9ma d\u00edla",
+    "56": "P974 p\u0159\u00edtok",
+    "57": "P1056 produkuje",
+    "58": "P1303 hudebn\u00ed n\u00e1stroj",
+    "59": "P1376 hlavn\u00ed s\u00eddlo \u010deho",
+    "60": "P1383 zahrnuje s\u00eddlo",
+    "61": "P1889 rozd\u00edln\u00e9 od",
+    "62": "P3373 sourozenec",
+    "63": "P4552 poho\u0159\u00ed"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 4096,
+  "label2id": {
+    "P0 other": 0,
+    "P101 zam\u011b\u0159en\u00ed": 15,
+    "P102 stranick\u00e1 p\u0159\u00edslu\u0161nost": 16,
+    "P105 taxonomick\u00e9 za\u0159azen\u00ed": 17,
+    "P1056 produkuje": 57,
+    "P106 povol\u00e1n\u00ed": 18,
+    "P118 liga": 19,
+    "P1303 hudebn\u00ed n\u00e1stroj": 58,
+    "P131 nach\u00e1z\u00ed se v administrativn\u00ed jednotce": 20,
+    "P136 \u017e\u00e1nr": 21,
+    "P137 oper\u00e1tor": 22,
+    "P1376 hlavn\u00ed s\u00eddlo \u010deho": 59,
+    "P138 pojmenov\u00e1no po": 23,
+    "P1383 zahrnuje s\u00eddlo": 60,
+    "P140 vyzn\u00e1n\u00ed": 24,
+    "P150 ni\u017e\u0161\u00ed spr\u00e1vn\u00ed celky": 25,
+    "P155 p\u0159edchoz\u00ed": 26,
+    "P159 s\u00eddlo": 27,
+    "P161 hraje": 28,
+    "P171 nad\u0159azen\u00fd taxon": 29,
+    "P175 interpret": 30,
+    "P176 v\u00fdrobce": 31,
+    "P179 s\u00e9rie": 32,
+    "P1889 rozd\u00edln\u00e9 od": 61,
+    "P19 m\u00edsto narozen\u00ed": 1,
+    "P20 m\u00edsto \u00famrt\u00ed": 2,
+    "P206 u vodn\u00ed plochy": 33,
+    "P21 pohlav\u00ed": 3,
+    "P22 otec": 4,
+    "P25 matka": 5,
+    "P26 cho\u0165": 6,
+    "P264 hudebn\u00ed vydavatelstv\u00ed": 34,
+    "P27 st\u00e1tn\u00ed ob\u010danstv\u00ed": 7,
+    "P276 m\u00edsto": 35,
+    "P279 nadt\u0159\u00edda": 36,
+    "P3373 sourozenec": 62,
+    "P36 hlavn\u00ed m\u011bsto": 8,
+    "P360 seznam (\u010deho)": 37,
+    "P361 \u010d\u00e1st (\u010deho)": 38,
+    "P39 ve funkci": 9,
+    "P413 pozice hr\u00e1\u010de": 39,
+    "P425 obor tohoto povol\u00e1n\u00ed": 40,
+    "P4552 poho\u0159\u00ed": 63,
+    "P460 \u00fadajn\u011b tot\u00e9\u017e co": 41,
+    "P461 protiklad": 42,
+    "P463 \u010dlen (\u010deho)": 43,
+    "P47 hrani\u010d\u00ed s": 10,
+    "P495 zem\u011b p\u016fvodu": 44,
+    "P50 autor": 11,
+    "P527 skl\u00e1d\u00e1 se z": 45,
+    "P53 rodina": 12,
+    "P530 diplomatick\u00fd vztah": 46,
+    "P54 \u010dlen sportovn\u00edho dru\u017estva": 13,
+    "P641 sport": 47,
+    "P669 ulice": 48,
+    "P706 oblast": 49,
+    "P708 diec\u00e9ze": 50,
+    "P734 p\u0159\u00edjmen\u00ed": 51,
+    "P735 rodn\u00e9 jm\u00e9no": 52,
+    "P740 m\u00edsto vzniku": 53,
+    "P800 d\u00edlo": 54,
+    "P921 hlavn\u00ed t\u00e9ma d\u00edla": 55,
+    "P97 \u0161lechtick\u00fd titul": 14,
+    "P974 p\u0159\u00edtok": 56
+  },
+  "layer_norm_eps": 1e-05,
+  "max_position_embeddings": 514,
+  "model_type": "xlm-roberta",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 24,
+  "output_past": true,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
+  "torch_dtype": "float32",
+  "transformers_version": "4.46.2",
+  "type_vocab_size": 1,
+  "use_cache": true,
+  "vocab_size": 250002
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:beb92342efa5ce3788ec5a2100c32f556cd32c6fea6e76ae777474e01fed902b
+size 2240416848

runs/Mar06_01-39-41_dgx10/events.out.tfevents.1741221586.dgx10.2696097.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4bd472cd03ceafab66d9b213213d3df0a94df23c6f8016b1d310158c5bd6504a
+size 9852

runs/Mar06_01-55-57_dgx10/events.out.tfevents.1741222561.dgx10.2700023.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:159acffbfb143f476b468d225d25e8c54e0bd9170c5d8b8629f330f57d46ed57
+size 99643

runs/Mar06_01-55-57_dgx10/events.out.tfevents.1741297853.dgx10.2700023.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3b86b858d7334c092fcf94d4709237688bc7924a14e9e320ba716bfff8bf88d4
+size 757

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,52 @@

+{
+  "additional_special_tokens": [
+    {
+      "content": "[unused1]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "[unused2]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "[unused3]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "[unused4]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "[unused5]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    }
+  ],
+  "bos_token": "<s>",
+  "cls_token": "<s>",
+  "eos_token": "</s>",
+  "mask_token": {
+    "content": "<mask>",
+    "lstrip": true,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": "<pad>",
+  "sep_token": "</s>",
+  "unk_token": "<unk>"
+}

tokenizer.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cd1ed561533c9d74649ec70d231aaad68ec693dd3e1821c5da8a69e59ce6a56e
+size 17083762

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,102 @@

+{
+  "add_prefix_space": true,
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<pad>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "250001": {
+      "content": "<mask>",
+      "lstrip": true,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "250002": {
+      "content": "[unused1]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "250003": {
+      "content": "[unused2]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "250004": {
+      "content": "[unused3]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "250005": {
+      "content": "[unused4]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "250006": {
+      "content": "[unused5]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "additional_special_tokens": [
+    "[unused1]",
+    "[unused2]",
+    "[unused3]",
+    "[unused4]",
+    "[unused5]"
+  ],
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "<s>",
+  "eos_token": "</s>",
+  "mask_token": "<mask>",
+  "model_max_length": 512,
+  "pad_token": "<pad>",
+  "sep_token": "</s>",
+  "tokenizer_class": "XLMRobertaTokenizer",
+  "unk_token": "<unk>"
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b2476dc9ac594194dc0989969d790e0761fea836a1e19e5e237763dbf6ff5f5b
+size 5304