cedricbonhomme committed on
Commit
1f4c42f
·
verified ·
1 Parent(s): c268e0d

Upload folder using huggingface_hub

Browse files
Files changed (6) hide show
  1. README.md +77 -0
  2. config.json +43 -0
  3. model.safetensors +3 -0
  4. tokenizer.json +0 -0
  5. tokenizer_config.json +16 -0
  6. training_args.bin +3 -0
README.md ADDED
@@ -0,0 +1,77 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: transformers
3
+ base_model: ai-forever/ruRoberta-large
4
+ tags:
5
+ - generated_from_trainer
6
+ metrics:
7
+ - accuracy
8
+ model-index:
9
+ - name: vulnerability-severity-classification-russian-ruRoberta-large
10
+ results: []
11
+ ---
12
+
13
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
14
+ should probably proofread and complete it, then remove this comment. -->
15
+
16
+ # vulnerability-severity-classification-russian-ruRoberta-large
17
+
18
+ This model is a fine-tuned version of [ai-forever/ruRoberta-large](https://huggingface.co/ai-forever/ruRoberta-large) on an unknown dataset.
19
+ It achieves the following results on the evaluation set:
20
+ - Loss: 2.6495
21
+ - Accuracy: 0.7417
22
+ - F1 Macro: 0.6650
23
+ - Low Precision: 0.6154
24
+ - Low Recall: 0.3380
25
+ - Low F1: 0.4364
26
+ - Medium Precision: 0.7619
27
+ - Medium Recall: 0.8312
28
+ - Medium F1: 0.7951
29
+ - High Precision: 0.6869
30
+ - High Recall: 0.6080
31
+ - High F1: 0.6450
32
+ - Critical Precision: 0.7678
33
+ - Critical Recall: 0.7996
34
+ - Critical F1: 0.7834
35
+
36
+ ## Model description
37
+
38
+ More information needed
39
+
40
+ ## Intended uses & limitations
41
+
42
+ More information needed
43
+
44
+ ## Training and evaluation data
45
+
46
+ More information needed
47
+
48
+ ## Training procedure
49
+
50
+ ### Training hyperparameters
51
+
52
+ The following hyperparameters were used during training:
53
+ - learning_rate: 3e-05
54
+ - train_batch_size: 64
55
+ - eval_batch_size: 64
56
+ - seed: 42
57
+ - optimizer: OptimizerNames.ADAMW_TORCH_FUSED with betas=(0.9, 0.999), epsilon=1e-08, and no additional optimizer arguments
58
+ - lr_scheduler_type: linear
59
+ - num_epochs: 5
60
+
61
+ ### Training results
62
+
63
+ | Training Loss | Epoch | Step | Validation Loss | Accuracy | F1 Macro | Low Precision | Low Recall | Low F1 | Medium Precision | Medium Recall | Medium F1 | High Precision | High Recall | High F1 | Critical Precision | Critical Recall | Critical F1 |
64
+ |:-------------:|:-----:|:----:|:---------------:|:--------:|:--------:|:-------------:|:----------:|:------:|:----------------:|:-------------:|:---------:|:--------------:|:-----------:|:-------:|:------------------:|:---------------:|:-----------:|
65
+ | 3.0373 | 1.0 | 1167 | 3.0503 | 0.6895 | 0.5626 | 0.7959 | 0.1099 | 0.1931 | 0.7233 | 0.7958 | 0.7578 | 0.6083 | 0.5152 | 0.5579 | 0.6947 | 0.7954 | 0.7416 |
66
+ | 2.9084 | 2.0 | 2334 | 2.8601 | 0.7142 | 0.6048 | 0.8 | 0.1803 | 0.2943 | 0.7523 | 0.8001 | 0.7754 | 0.6923 | 0.5156 | 0.5910 | 0.6660 | 0.8807 | 0.7584 |
67
+ | 2.5937 | 3.0 | 3501 | 2.6529 | 0.7335 | 0.6349 | 0.6967 | 0.2394 | 0.3564 | 0.7565 | 0.8379 | 0.7952 | 0.7126 | 0.5411 | 0.6152 | 0.7092 | 0.8488 | 0.7727 |
68
+ | 2.5230 | 4.0 | 4668 | 2.6348 | 0.7365 | 0.6549 | 0.6170 | 0.3268 | 0.4273 | 0.7403 | 0.8568 | 0.7943 | 0.7208 | 0.5451 | 0.6207 | 0.7526 | 0.8038 | 0.7773 |
69
+ | 2.0599 | 5.0 | 5835 | 2.6495 | 0.7417 | 0.6650 | 0.6154 | 0.3380 | 0.4364 | 0.7619 | 0.8312 | 0.7951 | 0.6869 | 0.6080 | 0.6450 | 0.7678 | 0.7996 | 0.7834 |
70
+
71
+
72
+ ### Framework versions
73
+
74
+ - Transformers 5.5.0
75
+ - Pytorch 2.11.0+cu130
76
+ - Datasets 4.8.4
77
+ - Tokenizers 0.22.2
config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_cross_attention": false,
3
+ "architectures": [
4
+ "RobertaForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 1,
8
+ "classifier_dropout": null,
9
+ "dtype": "float32",
10
+ "eos_token_id": 2,
11
+ "gradient_checkpointing": false,
12
+ "hidden_act": "gelu",
13
+ "hidden_dropout_prob": 0.1,
14
+ "hidden_size": 1024,
15
+ "id2label": {
16
+ "0": "Low",
17
+ "1": "Medium",
18
+ "2": "High",
19
+ "3": "Critical"
20
+ },
21
+ "initializer_range": 0.02,
22
+ "intermediate_size": 4096,
23
+ "is_decoder": false,
24
+ "label2id": {
25
+ "Critical": 3,
26
+ "High": 2,
27
+ "Low": 0,
28
+ "Medium": 1
29
+ },
30
+ "layer_norm_eps": 1e-05,
31
+ "max_position_embeddings": 514,
32
+ "model_type": "roberta",
33
+ "num_attention_heads": 16,
34
+ "num_hidden_layers": 24,
35
+ "pad_token_id": 1,
36
+ "position_embedding_type": "absolute",
37
+ "problem_type": "single_label_classification",
38
+ "tie_word_embeddings": true,
39
+ "transformers_version": "5.5.0",
40
+ "type_vocab_size": 1,
41
+ "use_cache": true,
42
+ "vocab_size": 50265
43
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5c58c51fa174a8225d4337aa54dc87073bec8a5a0933544fe3a406b341e8923
3
+ size 1421503560
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "backend": "tokenizers",
4
+ "bos_token": "<s>",
5
+ "cls_token": "<s>",
6
+ "eos_token": "</s>",
7
+ "errors": "replace",
8
+ "is_local": false,
9
+ "mask_token": "<mask>",
10
+ "model_max_length": 1000000000000000019884624838656,
11
+ "pad_token": "<pad>",
12
+ "sep_token": "</s>",
13
+ "tokenizer_class": "RobertaTokenizer",
14
+ "trim_offsets": true,
15
+ "unk_token": "<unk>"
16
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2da8bcf496a32af15208b36b8293f6626aaf4cd3f1122beaa520bc59a105491
3
+ size 5265
Free AI Image Generator No sign-up. Instant results. Open Now