Upload CASSANDRA cassandra-asl-tram2 weights and metadata (anonymous CCS 2026 artifact)
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- seeds/seed-123/DONE +1 -0
- seeds/seed-123/config.json +59 -0
- seeds/seed-123/eval.json +15 -0
- seeds/seed-123/model.safetensors +3 -0
- seeds/seed-123/seed.txt +1 -0
- seeds/seed-123/seed_probs.npz +3 -0
- seeds/seed-123/special_tokens_map.json +37 -0
- seeds/seed-123/tokenizer.json +0 -0
- seeds/seed-123/tokenizer_config.json +55 -0
- seeds/seed-123/train_config.json +19 -0
- seeds/seed-123/vocab.txt +0 -0
- seeds/seed-2024/DONE +1 -0
- seeds/seed-2024/config.json +59 -0
- seeds/seed-2024/eval.json +15 -0
- seeds/seed-2024/model.safetensors +3 -0
- seeds/seed-2024/seed.txt +1 -0
- seeds/seed-2024/seed_probs.npz +3 -0
- seeds/seed-2024/special_tokens_map.json +37 -0
- seeds/seed-2024/tokenizer.json +0 -0
- seeds/seed-2024/tokenizer_config.json +55 -0
- seeds/seed-2024/train_config.json +19 -0
- seeds/seed-2024/vocab.txt +0 -0
- seeds/seed-3141/DONE +1 -0
- seeds/seed-3141/config.json +59 -0
- seeds/seed-3141/eval.json +15 -0
- seeds/seed-3141/model.safetensors +3 -0
- seeds/seed-3141/seed.txt +1 -0
- seeds/seed-3141/seed_probs.npz +3 -0
- seeds/seed-3141/special_tokens_map.json +37 -0
- seeds/seed-3141/tokenizer.json +0 -0
- seeds/seed-3141/tokenizer_config.json +55 -0
- seeds/seed-3141/train_config.json +19 -0
- seeds/seed-3141/vocab.txt +0 -0
- seeds/seed-42/DONE +1 -0
- seeds/seed-42/config.json +59 -0
- seeds/seed-42/eval.json +15 -0
- seeds/seed-42/model.safetensors +3 -0
- seeds/seed-42/seed.txt +1 -0
- seeds/seed-42/seed_probs.npz +3 -0
- seeds/seed-42/special_tokens_map.json +37 -0
- seeds/seed-42/tokenizer.json +0 -0
- seeds/seed-42/tokenizer_config.json +55 -0
- seeds/seed-42/train_config.json +19 -0
- seeds/seed-42/vocab.txt +0 -0
- seeds/seed-456/DONE +1 -0
- seeds/seed-456/config.json +59 -0
- seeds/seed-456/eval.json +15 -0
- seeds/seed-456/model.safetensors +3 -0
- seeds/seed-456/seed.txt +1 -0
- seeds/seed-456/seed_probs.npz +3 -0
seeds/seed-123/DONE
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
123
|
seeds/seed-123/config.json
ADDED
|
@@ -0,0 +1,59 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architecture": "LabelAttentionClassifier",
|
| 3 |
+
"encoder_model_name": "ibm-research/CTI-BERT",
|
| 4 |
+
"num_labels": 50,
|
| 5 |
+
"hidden_size": 768,
|
| 6 |
+
"labels": [
|
| 7 |
+
"T1003.001",
|
| 8 |
+
"T1005",
|
| 9 |
+
"T1012",
|
| 10 |
+
"T1016",
|
| 11 |
+
"T1021.001",
|
| 12 |
+
"T1027",
|
| 13 |
+
"T1033",
|
| 14 |
+
"T1036.005",
|
| 15 |
+
"T1041",
|
| 16 |
+
"T1047",
|
| 17 |
+
"T1053.005",
|
| 18 |
+
"T1055",
|
| 19 |
+
"T1056.001",
|
| 20 |
+
"T1057",
|
| 21 |
+
"T1059.003",
|
| 22 |
+
"T1068",
|
| 23 |
+
"T1070.004",
|
| 24 |
+
"T1071.001",
|
| 25 |
+
"T1072",
|
| 26 |
+
"T1074.001",
|
| 27 |
+
"T1078",
|
| 28 |
+
"T1082",
|
| 29 |
+
"T1083",
|
| 30 |
+
"T1090",
|
| 31 |
+
"T1095",
|
| 32 |
+
"T1105",
|
| 33 |
+
"T1106",
|
| 34 |
+
"T1110",
|
| 35 |
+
"T1112",
|
| 36 |
+
"T1113",
|
| 37 |
+
"T1140",
|
| 38 |
+
"T1190",
|
| 39 |
+
"T1204.002",
|
| 40 |
+
"T1210",
|
| 41 |
+
"T1218.011",
|
| 42 |
+
"T1219",
|
| 43 |
+
"T1484.001",
|
| 44 |
+
"T1518.001",
|
| 45 |
+
"T1543.003",
|
| 46 |
+
"T1547.001",
|
| 47 |
+
"T1548.002",
|
| 48 |
+
"T1552.001",
|
| 49 |
+
"T1557.001",
|
| 50 |
+
"T1562.001",
|
| 51 |
+
"T1564.001",
|
| 52 |
+
"T1566.001",
|
| 53 |
+
"T1569.002",
|
| 54 |
+
"T1570",
|
| 55 |
+
"T1573.001",
|
| 56 |
+
"T1574.002"
|
| 57 |
+
],
|
| 58 |
+
"dropout": 0.1
|
| 59 |
+
}
|
seeds/seed-123/eval.json
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"chose": "ema",
|
| 3 |
+
"dev_macro_f1": {
|
| 4 |
+
"base": 0.5447683478808304,
|
| 5 |
+
"ema": 0.5450964644737616,
|
| 6 |
+
"swa": 0.5405556130113931
|
| 7 |
+
},
|
| 8 |
+
"tau_0.5": {
|
| 9 |
+
"doc_f1": 0.7436287853187492,
|
| 10 |
+
"macro_f1": 0.5701923642028678,
|
| 11 |
+
"n_scored_docs": 30,
|
| 12 |
+
"n_skipped_empty_docs": 1
|
| 13 |
+
},
|
| 14 |
+
"n_swa_snapshots": 9
|
| 15 |
+
}
|
seeds/seed-123/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:12a589f51035a61bebb602e164b26970ab2cc8d4445721e2d2012edf9bf58c67
|
| 3 |
+
size 497946220
|
seeds/seed-123/seed.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
123
|
seeds/seed-123/seed_probs.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1aa1625d9809aa250871fff55fb785879ed7c0235f346408c29888e7ac2423fe
|
| 3 |
+
size 1282290
|
seeds/seed-123/special_tokens_map.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"cls_token": {
|
| 3 |
+
"content": "[CLS]",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"mask_token": {
|
| 10 |
+
"content": "[MASK]",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"pad_token": {
|
| 17 |
+
"content": "[PAD]",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
+
"sep_token": {
|
| 24 |
+
"content": "[SEP]",
|
| 25 |
+
"lstrip": false,
|
| 26 |
+
"normalized": false,
|
| 27 |
+
"rstrip": false,
|
| 28 |
+
"single_word": false
|
| 29 |
+
},
|
| 30 |
+
"unk_token": {
|
| 31 |
+
"content": "[UNK]",
|
| 32 |
+
"lstrip": false,
|
| 33 |
+
"normalized": false,
|
| 34 |
+
"rstrip": false,
|
| 35 |
+
"single_word": false
|
| 36 |
+
}
|
| 37 |
+
}
|
seeds/seed-123/tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
seeds/seed-123/tokenizer_config.json
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"added_tokens_decoder": {
|
| 3 |
+
"0": {
|
| 4 |
+
"content": "[PAD]",
|
| 5 |
+
"lstrip": false,
|
| 6 |
+
"normalized": false,
|
| 7 |
+
"rstrip": false,
|
| 8 |
+
"single_word": false,
|
| 9 |
+
"special": true
|
| 10 |
+
},
|
| 11 |
+
"1": {
|
| 12 |
+
"content": "[UNK]",
|
| 13 |
+
"lstrip": false,
|
| 14 |
+
"normalized": false,
|
| 15 |
+
"rstrip": false,
|
| 16 |
+
"single_word": false,
|
| 17 |
+
"special": true
|
| 18 |
+
},
|
| 19 |
+
"2": {
|
| 20 |
+
"content": "[CLS]",
|
| 21 |
+
"lstrip": false,
|
| 22 |
+
"normalized": false,
|
| 23 |
+
"rstrip": false,
|
| 24 |
+
"single_word": false,
|
| 25 |
+
"special": true
|
| 26 |
+
},
|
| 27 |
+
"3": {
|
| 28 |
+
"content": "[SEP]",
|
| 29 |
+
"lstrip": false,
|
| 30 |
+
"normalized": false,
|
| 31 |
+
"rstrip": false,
|
| 32 |
+
"single_word": false,
|
| 33 |
+
"special": true
|
| 34 |
+
},
|
| 35 |
+
"4": {
|
| 36 |
+
"content": "[MASK]",
|
| 37 |
+
"lstrip": false,
|
| 38 |
+
"normalized": false,
|
| 39 |
+
"rstrip": false,
|
| 40 |
+
"single_word": false,
|
| 41 |
+
"special": true
|
| 42 |
+
}
|
| 43 |
+
},
|
| 44 |
+
"clean_up_tokenization_spaces": true,
|
| 45 |
+
"cls_token": "[CLS]",
|
| 46 |
+
"do_lower_case": true,
|
| 47 |
+
"mask_token": "[MASK]",
|
| 48 |
+
"model_max_length": 512,
|
| 49 |
+
"pad_token": "[PAD]",
|
| 50 |
+
"sep_token": "[SEP]",
|
| 51 |
+
"strip_accents": null,
|
| 52 |
+
"tokenize_chinese_chars": true,
|
| 53 |
+
"tokenizer_class": "BertTokenizer",
|
| 54 |
+
"unk_token": "[UNK]"
|
| 55 |
+
}
|
seeds/seed-123/train_config.json
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"recipe": "asl",
|
| 3 |
+
"dataset": "tram2",
|
| 4 |
+
"tag": "orig",
|
| 5 |
+
"encoder": "ibm-research/CTI-BERT",
|
| 6 |
+
"max_len": 512,
|
| 7 |
+
"lr": 2e-05,
|
| 8 |
+
"batch_size": 16,
|
| 9 |
+
"epochs": 30,
|
| 10 |
+
"val_size": 0.2,
|
| 11 |
+
"asl_gamma_neg": 4,
|
| 12 |
+
"asl_gamma_pos": 0,
|
| 13 |
+
"asl_clip": 0.05,
|
| 14 |
+
"swa_start_fraction": 0.75,
|
| 15 |
+
"min_positives_per_class": 10,
|
| 16 |
+
"llrd_decay": 0.85,
|
| 17 |
+
"ema_decay": 0.999,
|
| 18 |
+
"fp16": true
|
| 19 |
+
}
|
seeds/seed-123/vocab.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
seeds/seed-2024/DONE
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
2024
|
seeds/seed-2024/config.json
ADDED
|
@@ -0,0 +1,59 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architecture": "LabelAttentionClassifier",
|
| 3 |
+
"encoder_model_name": "ibm-research/CTI-BERT",
|
| 4 |
+
"num_labels": 50,
|
| 5 |
+
"hidden_size": 768,
|
| 6 |
+
"labels": [
|
| 7 |
+
"T1003.001",
|
| 8 |
+
"T1005",
|
| 9 |
+
"T1012",
|
| 10 |
+
"T1016",
|
| 11 |
+
"T1021.001",
|
| 12 |
+
"T1027",
|
| 13 |
+
"T1033",
|
| 14 |
+
"T1036.005",
|
| 15 |
+
"T1041",
|
| 16 |
+
"T1047",
|
| 17 |
+
"T1053.005",
|
| 18 |
+
"T1055",
|
| 19 |
+
"T1056.001",
|
| 20 |
+
"T1057",
|
| 21 |
+
"T1059.003",
|
| 22 |
+
"T1068",
|
| 23 |
+
"T1070.004",
|
| 24 |
+
"T1071.001",
|
| 25 |
+
"T1072",
|
| 26 |
+
"T1074.001",
|
| 27 |
+
"T1078",
|
| 28 |
+
"T1082",
|
| 29 |
+
"T1083",
|
| 30 |
+
"T1090",
|
| 31 |
+
"T1095",
|
| 32 |
+
"T1105",
|
| 33 |
+
"T1106",
|
| 34 |
+
"T1110",
|
| 35 |
+
"T1112",
|
| 36 |
+
"T1113",
|
| 37 |
+
"T1140",
|
| 38 |
+
"T1190",
|
| 39 |
+
"T1204.002",
|
| 40 |
+
"T1210",
|
| 41 |
+
"T1218.011",
|
| 42 |
+
"T1219",
|
| 43 |
+
"T1484.001",
|
| 44 |
+
"T1518.001",
|
| 45 |
+
"T1543.003",
|
| 46 |
+
"T1547.001",
|
| 47 |
+
"T1548.002",
|
| 48 |
+
"T1552.001",
|
| 49 |
+
"T1557.001",
|
| 50 |
+
"T1562.001",
|
| 51 |
+
"T1564.001",
|
| 52 |
+
"T1566.001",
|
| 53 |
+
"T1569.002",
|
| 54 |
+
"T1570",
|
| 55 |
+
"T1573.001",
|
| 56 |
+
"T1574.002"
|
| 57 |
+
],
|
| 58 |
+
"dropout": 0.1
|
| 59 |
+
}
|
seeds/seed-2024/eval.json
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"chose": "swa",
|
| 3 |
+
"dev_macro_f1": {
|
| 4 |
+
"base": 0.5439013990885383,
|
| 5 |
+
"ema": 0.543554249784528,
|
| 6 |
+
"swa": 0.5475546922893236
|
| 7 |
+
},
|
| 8 |
+
"tau_0.5": {
|
| 9 |
+
"doc_f1": 0.703092004352701,
|
| 10 |
+
"macro_f1": 0.5492939798102902,
|
| 11 |
+
"n_scored_docs": 30,
|
| 12 |
+
"n_skipped_empty_docs": 1
|
| 13 |
+
},
|
| 14 |
+
"n_swa_snapshots": 9
|
| 15 |
+
}
|
seeds/seed-2024/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:159c63dd01083a770248174c04e767b0e2c00c9514e6f9a7a9193636ce1cb7ce
|
| 3 |
+
size 497946220
|
seeds/seed-2024/seed.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
2024
|
seeds/seed-2024/seed_probs.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d912d060e95fc8dc46cd65b513f9f0f7e46f6fe7c570d9cb5b2c1b53a18bcca5
|
| 3 |
+
size 1270124
|
seeds/seed-2024/special_tokens_map.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"cls_token": {
|
| 3 |
+
"content": "[CLS]",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"mask_token": {
|
| 10 |
+
"content": "[MASK]",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"pad_token": {
|
| 17 |
+
"content": "[PAD]",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
+
"sep_token": {
|
| 24 |
+
"content": "[SEP]",
|
| 25 |
+
"lstrip": false,
|
| 26 |
+
"normalized": false,
|
| 27 |
+
"rstrip": false,
|
| 28 |
+
"single_word": false
|
| 29 |
+
},
|
| 30 |
+
"unk_token": {
|
| 31 |
+
"content": "[UNK]",
|
| 32 |
+
"lstrip": false,
|
| 33 |
+
"normalized": false,
|
| 34 |
+
"rstrip": false,
|
| 35 |
+
"single_word": false
|
| 36 |
+
}
|
| 37 |
+
}
|
seeds/seed-2024/tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
seeds/seed-2024/tokenizer_config.json
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"added_tokens_decoder": {
|
| 3 |
+
"0": {
|
| 4 |
+
"content": "[PAD]",
|
| 5 |
+
"lstrip": false,
|
| 6 |
+
"normalized": false,
|
| 7 |
+
"rstrip": false,
|
| 8 |
+
"single_word": false,
|
| 9 |
+
"special": true
|
| 10 |
+
},
|
| 11 |
+
"1": {
|
| 12 |
+
"content": "[UNK]",
|
| 13 |
+
"lstrip": false,
|
| 14 |
+
"normalized": false,
|
| 15 |
+
"rstrip": false,
|
| 16 |
+
"single_word": false,
|
| 17 |
+
"special": true
|
| 18 |
+
},
|
| 19 |
+
"2": {
|
| 20 |
+
"content": "[CLS]",
|
| 21 |
+
"lstrip": false,
|
| 22 |
+
"normalized": false,
|
| 23 |
+
"rstrip": false,
|
| 24 |
+
"single_word": false,
|
| 25 |
+
"special": true
|
| 26 |
+
},
|
| 27 |
+
"3": {
|
| 28 |
+
"content": "[SEP]",
|
| 29 |
+
"lstrip": false,
|
| 30 |
+
"normalized": false,
|
| 31 |
+
"rstrip": false,
|
| 32 |
+
"single_word": false,
|
| 33 |
+
"special": true
|
| 34 |
+
},
|
| 35 |
+
"4": {
|
| 36 |
+
"content": "[MASK]",
|
| 37 |
+
"lstrip": false,
|
| 38 |
+
"normalized": false,
|
| 39 |
+
"rstrip": false,
|
| 40 |
+
"single_word": false,
|
| 41 |
+
"special": true
|
| 42 |
+
}
|
| 43 |
+
},
|
| 44 |
+
"clean_up_tokenization_spaces": true,
|
| 45 |
+
"cls_token": "[CLS]",
|
| 46 |
+
"do_lower_case": true,
|
| 47 |
+
"mask_token": "[MASK]",
|
| 48 |
+
"model_max_length": 512,
|
| 49 |
+
"pad_token": "[PAD]",
|
| 50 |
+
"sep_token": "[SEP]",
|
| 51 |
+
"strip_accents": null,
|
| 52 |
+
"tokenize_chinese_chars": true,
|
| 53 |
+
"tokenizer_class": "BertTokenizer",
|
| 54 |
+
"unk_token": "[UNK]"
|
| 55 |
+
}
|
seeds/seed-2024/train_config.json
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"recipe": "asl",
|
| 3 |
+
"dataset": "tram2",
|
| 4 |
+
"tag": "repl",
|
| 5 |
+
"encoder": "ibm-research/CTI-BERT",
|
| 6 |
+
"max_len": 512,
|
| 7 |
+
"lr": 2e-05,
|
| 8 |
+
"batch_size": 16,
|
| 9 |
+
"epochs": 30,
|
| 10 |
+
"val_size": 0.2,
|
| 11 |
+
"asl_gamma_neg": 4,
|
| 12 |
+
"asl_gamma_pos": 0,
|
| 13 |
+
"asl_clip": 0.05,
|
| 14 |
+
"swa_start_fraction": 0.75,
|
| 15 |
+
"min_positives_per_class": 10,
|
| 16 |
+
"llrd_decay": 0.85,
|
| 17 |
+
"ema_decay": 0.999,
|
| 18 |
+
"fp16": true
|
| 19 |
+
}
|
seeds/seed-2024/vocab.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
seeds/seed-3141/DONE
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
3141
|
seeds/seed-3141/config.json
ADDED
|
@@ -0,0 +1,59 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architecture": "LabelAttentionClassifier",
|
| 3 |
+
"encoder_model_name": "ibm-research/CTI-BERT",
|
| 4 |
+
"num_labels": 50,
|
| 5 |
+
"hidden_size": 768,
|
| 6 |
+
"labels": [
|
| 7 |
+
"T1003.001",
|
| 8 |
+
"T1005",
|
| 9 |
+
"T1012",
|
| 10 |
+
"T1016",
|
| 11 |
+
"T1021.001",
|
| 12 |
+
"T1027",
|
| 13 |
+
"T1033",
|
| 14 |
+
"T1036.005",
|
| 15 |
+
"T1041",
|
| 16 |
+
"T1047",
|
| 17 |
+
"T1053.005",
|
| 18 |
+
"T1055",
|
| 19 |
+
"T1056.001",
|
| 20 |
+
"T1057",
|
| 21 |
+
"T1059.003",
|
| 22 |
+
"T1068",
|
| 23 |
+
"T1070.004",
|
| 24 |
+
"T1071.001",
|
| 25 |
+
"T1072",
|
| 26 |
+
"T1074.001",
|
| 27 |
+
"T1078",
|
| 28 |
+
"T1082",
|
| 29 |
+
"T1083",
|
| 30 |
+
"T1090",
|
| 31 |
+
"T1095",
|
| 32 |
+
"T1105",
|
| 33 |
+
"T1106",
|
| 34 |
+
"T1110",
|
| 35 |
+
"T1112",
|
| 36 |
+
"T1113",
|
| 37 |
+
"T1140",
|
| 38 |
+
"T1190",
|
| 39 |
+
"T1204.002",
|
| 40 |
+
"T1210",
|
| 41 |
+
"T1218.011",
|
| 42 |
+
"T1219",
|
| 43 |
+
"T1484.001",
|
| 44 |
+
"T1518.001",
|
| 45 |
+
"T1543.003",
|
| 46 |
+
"T1547.001",
|
| 47 |
+
"T1548.002",
|
| 48 |
+
"T1552.001",
|
| 49 |
+
"T1557.001",
|
| 50 |
+
"T1562.001",
|
| 51 |
+
"T1564.001",
|
| 52 |
+
"T1566.001",
|
| 53 |
+
"T1569.002",
|
| 54 |
+
"T1570",
|
| 55 |
+
"T1573.001",
|
| 56 |
+
"T1574.002"
|
| 57 |
+
],
|
| 58 |
+
"dropout": 0.1
|
| 59 |
+
}
|
seeds/seed-3141/eval.json
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"chose": "ema",
|
| 3 |
+
"dev_macro_f1": {
|
| 4 |
+
"base": 0.5417992408181854,
|
| 5 |
+
"ema": 0.5432634899722102,
|
| 6 |
+
"swa": 0.5401762405323272
|
| 7 |
+
},
|
| 8 |
+
"tau_0.5": {
|
| 9 |
+
"doc_f1": 0.6962908440035396,
|
| 10 |
+
"macro_f1": 0.5171692881057236,
|
| 11 |
+
"n_scored_docs": 30,
|
| 12 |
+
"n_skipped_empty_docs": 1
|
| 13 |
+
},
|
| 14 |
+
"n_swa_snapshots": 9
|
| 15 |
+
}
|
seeds/seed-3141/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6fa2822845cb70a773a62136eeee0ad278bd53c6934d02c04b125c8df53ab662
|
| 3 |
+
size 497946220
|
seeds/seed-3141/seed.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
3141
|
seeds/seed-3141/seed_probs.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bc90fa21dd786e6cd0c269c8ae0b50779895f6ccdd934d499d77a571ba7234c2
|
| 3 |
+
size 1279508
|
seeds/seed-3141/special_tokens_map.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"cls_token": {
|
| 3 |
+
"content": "[CLS]",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"mask_token": {
|
| 10 |
+
"content": "[MASK]",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"pad_token": {
|
| 17 |
+
"content": "[PAD]",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
+
"sep_token": {
|
| 24 |
+
"content": "[SEP]",
|
| 25 |
+
"lstrip": false,
|
| 26 |
+
"normalized": false,
|
| 27 |
+
"rstrip": false,
|
| 28 |
+
"single_word": false
|
| 29 |
+
},
|
| 30 |
+
"unk_token": {
|
| 31 |
+
"content": "[UNK]",
|
| 32 |
+
"lstrip": false,
|
| 33 |
+
"normalized": false,
|
| 34 |
+
"rstrip": false,
|
| 35 |
+
"single_word": false
|
| 36 |
+
}
|
| 37 |
+
}
|
seeds/seed-3141/tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
seeds/seed-3141/tokenizer_config.json
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"added_tokens_decoder": {
|
| 3 |
+
"0": {
|
| 4 |
+
"content": "[PAD]",
|
| 5 |
+
"lstrip": false,
|
| 6 |
+
"normalized": false,
|
| 7 |
+
"rstrip": false,
|
| 8 |
+
"single_word": false,
|
| 9 |
+
"special": true
|
| 10 |
+
},
|
| 11 |
+
"1": {
|
| 12 |
+
"content": "[UNK]",
|
| 13 |
+
"lstrip": false,
|
| 14 |
+
"normalized": false,
|
| 15 |
+
"rstrip": false,
|
| 16 |
+
"single_word": false,
|
| 17 |
+
"special": true
|
| 18 |
+
},
|
| 19 |
+
"2": {
|
| 20 |
+
"content": "[CLS]",
|
| 21 |
+
"lstrip": false,
|
| 22 |
+
"normalized": false,
|
| 23 |
+
"rstrip": false,
|
| 24 |
+
"single_word": false,
|
| 25 |
+
"special": true
|
| 26 |
+
},
|
| 27 |
+
"3": {
|
| 28 |
+
"content": "[SEP]",
|
| 29 |
+
"lstrip": false,
|
| 30 |
+
"normalized": false,
|
| 31 |
+
"rstrip": false,
|
| 32 |
+
"single_word": false,
|
| 33 |
+
"special": true
|
| 34 |
+
},
|
| 35 |
+
"4": {
|
| 36 |
+
"content": "[MASK]",
|
| 37 |
+
"lstrip": false,
|
| 38 |
+
"normalized": false,
|
| 39 |
+
"rstrip": false,
|
| 40 |
+
"single_word": false,
|
| 41 |
+
"special": true
|
| 42 |
+
}
|
| 43 |
+
},
|
| 44 |
+
"clean_up_tokenization_spaces": true,
|
| 45 |
+
"cls_token": "[CLS]",
|
| 46 |
+
"do_lower_case": true,
|
| 47 |
+
"mask_token": "[MASK]",
|
| 48 |
+
"model_max_length": 512,
|
| 49 |
+
"pad_token": "[PAD]",
|
| 50 |
+
"sep_token": "[SEP]",
|
| 51 |
+
"strip_accents": null,
|
| 52 |
+
"tokenize_chinese_chars": true,
|
| 53 |
+
"tokenizer_class": "BertTokenizer",
|
| 54 |
+
"unk_token": "[UNK]"
|
| 55 |
+
}
|
seeds/seed-3141/train_config.json
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"recipe": "asl",
|
| 3 |
+
"dataset": "tram2",
|
| 4 |
+
"tag": "repl",
|
| 5 |
+
"encoder": "ibm-research/CTI-BERT",
|
| 6 |
+
"max_len": 512,
|
| 7 |
+
"lr": 2e-05,
|
| 8 |
+
"batch_size": 16,
|
| 9 |
+
"epochs": 30,
|
| 10 |
+
"val_size": 0.2,
|
| 11 |
+
"asl_gamma_neg": 4,
|
| 12 |
+
"asl_gamma_pos": 0,
|
| 13 |
+
"asl_clip": 0.05,
|
| 14 |
+
"swa_start_fraction": 0.75,
|
| 15 |
+
"min_positives_per_class": 10,
|
| 16 |
+
"llrd_decay": 0.85,
|
| 17 |
+
"ema_decay": 0.999,
|
| 18 |
+
"fp16": true
|
| 19 |
+
}
|
seeds/seed-3141/vocab.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
seeds/seed-42/DONE
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
42
|
seeds/seed-42/config.json
ADDED
|
@@ -0,0 +1,59 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architecture": "LabelAttentionClassifier",
|
| 3 |
+
"encoder_model_name": "ibm-research/CTI-BERT",
|
| 4 |
+
"num_labels": 50,
|
| 5 |
+
"hidden_size": 768,
|
| 6 |
+
"labels": [
|
| 7 |
+
"T1003.001",
|
| 8 |
+
"T1005",
|
| 9 |
+
"T1012",
|
| 10 |
+
"T1016",
|
| 11 |
+
"T1021.001",
|
| 12 |
+
"T1027",
|
| 13 |
+
"T1033",
|
| 14 |
+
"T1036.005",
|
| 15 |
+
"T1041",
|
| 16 |
+
"T1047",
|
| 17 |
+
"T1053.005",
|
| 18 |
+
"T1055",
|
| 19 |
+
"T1056.001",
|
| 20 |
+
"T1057",
|
| 21 |
+
"T1059.003",
|
| 22 |
+
"T1068",
|
| 23 |
+
"T1070.004",
|
| 24 |
+
"T1071.001",
|
| 25 |
+
"T1072",
|
| 26 |
+
"T1074.001",
|
| 27 |
+
"T1078",
|
| 28 |
+
"T1082",
|
| 29 |
+
"T1083",
|
| 30 |
+
"T1090",
|
| 31 |
+
"T1095",
|
| 32 |
+
"T1105",
|
| 33 |
+
"T1106",
|
| 34 |
+
"T1110",
|
| 35 |
+
"T1112",
|
| 36 |
+
"T1113",
|
| 37 |
+
"T1140",
|
| 38 |
+
"T1190",
|
| 39 |
+
"T1204.002",
|
| 40 |
+
"T1210",
|
| 41 |
+
"T1218.011",
|
| 42 |
+
"T1219",
|
| 43 |
+
"T1484.001",
|
| 44 |
+
"T1518.001",
|
| 45 |
+
"T1543.003",
|
| 46 |
+
"T1547.001",
|
| 47 |
+
"T1548.002",
|
| 48 |
+
"T1552.001",
|
| 49 |
+
"T1557.001",
|
| 50 |
+
"T1562.001",
|
| 51 |
+
"T1564.001",
|
| 52 |
+
"T1566.001",
|
| 53 |
+
"T1569.002",
|
| 54 |
+
"T1570",
|
| 55 |
+
"T1573.001",
|
| 56 |
+
"T1574.002"
|
| 57 |
+
],
|
| 58 |
+
"dropout": 0.1
|
| 59 |
+
}
|
seeds/seed-42/eval.json
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"chose": "swa",
|
| 3 |
+
"dev_macro_f1": {
|
| 4 |
+
"base": 0.5383158873383864,
|
| 5 |
+
"ema": 0.53580089596625,
|
| 6 |
+
"swa": 0.5414597211784158
|
| 7 |
+
},
|
| 8 |
+
"tau_0.5": {
|
| 9 |
+
"doc_f1": 0.7292129677362525,
|
| 10 |
+
"macro_f1": 0.5504301683233094,
|
| 11 |
+
"n_scored_docs": 30,
|
| 12 |
+
"n_skipped_empty_docs": 1
|
| 13 |
+
},
|
| 14 |
+
"n_swa_snapshots": 9
|
| 15 |
+
}
|
seeds/seed-42/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3854abd4e100caf629e1d5f30ec42aeb308015e57b21fbd4eb871f3680c557cc
|
| 3 |
+
size 497946220
|
seeds/seed-42/seed.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
42
|
seeds/seed-42/seed_probs.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c1d9f8f124a67f9ff1854b4442b27b6b473df0fd09b08791458fefb835ecd2fe
|
| 3 |
+
size 1284401
|
seeds/seed-42/special_tokens_map.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"cls_token": {
|
| 3 |
+
"content": "[CLS]",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"mask_token": {
|
| 10 |
+
"content": "[MASK]",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"pad_token": {
|
| 17 |
+
"content": "[PAD]",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
+
"sep_token": {
|
| 24 |
+
"content": "[SEP]",
|
| 25 |
+
"lstrip": false,
|
| 26 |
+
"normalized": false,
|
| 27 |
+
"rstrip": false,
|
| 28 |
+
"single_word": false
|
| 29 |
+
},
|
| 30 |
+
"unk_token": {
|
| 31 |
+
"content": "[UNK]",
|
| 32 |
+
"lstrip": false,
|
| 33 |
+
"normalized": false,
|
| 34 |
+
"rstrip": false,
|
| 35 |
+
"single_word": false
|
| 36 |
+
}
|
| 37 |
+
}
|
seeds/seed-42/tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
seeds/seed-42/tokenizer_config.json
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"added_tokens_decoder": {
|
| 3 |
+
"0": {
|
| 4 |
+
"content": "[PAD]",
|
| 5 |
+
"lstrip": false,
|
| 6 |
+
"normalized": false,
|
| 7 |
+
"rstrip": false,
|
| 8 |
+
"single_word": false,
|
| 9 |
+
"special": true
|
| 10 |
+
},
|
| 11 |
+
"1": {
|
| 12 |
+
"content": "[UNK]",
|
| 13 |
+
"lstrip": false,
|
| 14 |
+
"normalized": false,
|
| 15 |
+
"rstrip": false,
|
| 16 |
+
"single_word": false,
|
| 17 |
+
"special": true
|
| 18 |
+
},
|
| 19 |
+
"2": {
|
| 20 |
+
"content": "[CLS]",
|
| 21 |
+
"lstrip": false,
|
| 22 |
+
"normalized": false,
|
| 23 |
+
"rstrip": false,
|
| 24 |
+
"single_word": false,
|
| 25 |
+
"special": true
|
| 26 |
+
},
|
| 27 |
+
"3": {
|
| 28 |
+
"content": "[SEP]",
|
| 29 |
+
"lstrip": false,
|
| 30 |
+
"normalized": false,
|
| 31 |
+
"rstrip": false,
|
| 32 |
+
"single_word": false,
|
| 33 |
+
"special": true
|
| 34 |
+
},
|
| 35 |
+
"4": {
|
| 36 |
+
"content": "[MASK]",
|
| 37 |
+
"lstrip": false,
|
| 38 |
+
"normalized": false,
|
| 39 |
+
"rstrip": false,
|
| 40 |
+
"single_word": false,
|
| 41 |
+
"special": true
|
| 42 |
+
}
|
| 43 |
+
},
|
| 44 |
+
"clean_up_tokenization_spaces": true,
|
| 45 |
+
"cls_token": "[CLS]",
|
| 46 |
+
"do_lower_case": true,
|
| 47 |
+
"mask_token": "[MASK]",
|
| 48 |
+
"model_max_length": 512,
|
| 49 |
+
"pad_token": "[PAD]",
|
| 50 |
+
"sep_token": "[SEP]",
|
| 51 |
+
"strip_accents": null,
|
| 52 |
+
"tokenize_chinese_chars": true,
|
| 53 |
+
"tokenizer_class": "BertTokenizer",
|
| 54 |
+
"unk_token": "[UNK]"
|
| 55 |
+
}
|
seeds/seed-42/train_config.json
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"recipe": "asl",
|
| 3 |
+
"dataset": "tram2",
|
| 4 |
+
"tag": "orig",
|
| 5 |
+
"encoder": "ibm-research/CTI-BERT",
|
| 6 |
+
"max_len": 512,
|
| 7 |
+
"lr": 2e-05,
|
| 8 |
+
"batch_size": 16,
|
| 9 |
+
"epochs": 30,
|
| 10 |
+
"val_size": 0.2,
|
| 11 |
+
"asl_gamma_neg": 4,
|
| 12 |
+
"asl_gamma_pos": 0,
|
| 13 |
+
"asl_clip": 0.05,
|
| 14 |
+
"swa_start_fraction": 0.75,
|
| 15 |
+
"min_positives_per_class": 10,
|
| 16 |
+
"llrd_decay": 0.85,
|
| 17 |
+
"ema_decay": 0.999,
|
| 18 |
+
"fp16": true
|
| 19 |
+
}
|
seeds/seed-42/vocab.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
seeds/seed-456/DONE
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
456
|
seeds/seed-456/config.json
ADDED
|
@@ -0,0 +1,59 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architecture": "LabelAttentionClassifier",
|
| 3 |
+
"encoder_model_name": "ibm-research/CTI-BERT",
|
| 4 |
+
"num_labels": 50,
|
| 5 |
+
"hidden_size": 768,
|
| 6 |
+
"labels": [
|
| 7 |
+
"T1003.001",
|
| 8 |
+
"T1005",
|
| 9 |
+
"T1012",
|
| 10 |
+
"T1016",
|
| 11 |
+
"T1021.001",
|
| 12 |
+
"T1027",
|
| 13 |
+
"T1033",
|
| 14 |
+
"T1036.005",
|
| 15 |
+
"T1041",
|
| 16 |
+
"T1047",
|
| 17 |
+
"T1053.005",
|
| 18 |
+
"T1055",
|
| 19 |
+
"T1056.001",
|
| 20 |
+
"T1057",
|
| 21 |
+
"T1059.003",
|
| 22 |
+
"T1068",
|
| 23 |
+
"T1070.004",
|
| 24 |
+
"T1071.001",
|
| 25 |
+
"T1072",
|
| 26 |
+
"T1074.001",
|
| 27 |
+
"T1078",
|
| 28 |
+
"T1082",
|
| 29 |
+
"T1083",
|
| 30 |
+
"T1090",
|
| 31 |
+
"T1095",
|
| 32 |
+
"T1105",
|
| 33 |
+
"T1106",
|
| 34 |
+
"T1110",
|
| 35 |
+
"T1112",
|
| 36 |
+
"T1113",
|
| 37 |
+
"T1140",
|
| 38 |
+
"T1190",
|
| 39 |
+
"T1204.002",
|
| 40 |
+
"T1210",
|
| 41 |
+
"T1218.011",
|
| 42 |
+
"T1219",
|
| 43 |
+
"T1484.001",
|
| 44 |
+
"T1518.001",
|
| 45 |
+
"T1543.003",
|
| 46 |
+
"T1547.001",
|
| 47 |
+
"T1548.002",
|
| 48 |
+
"T1552.001",
|
| 49 |
+
"T1557.001",
|
| 50 |
+
"T1562.001",
|
| 51 |
+
"T1564.001",
|
| 52 |
+
"T1566.001",
|
| 53 |
+
"T1569.002",
|
| 54 |
+
"T1570",
|
| 55 |
+
"T1573.001",
|
| 56 |
+
"T1574.002"
|
| 57 |
+
],
|
| 58 |
+
"dropout": 0.1
|
| 59 |
+
}
|
seeds/seed-456/eval.json
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"chose": "base",
|
| 3 |
+
"dev_macro_f1": {
|
| 4 |
+
"base": 0.5368901292861008,
|
| 5 |
+
"ema": 0.5359361185807793,
|
| 6 |
+
"swa": 0.5310670323478536
|
| 7 |
+
},
|
| 8 |
+
"tau_0.5": {
|
| 9 |
+
"doc_f1": 0.7333488198828281,
|
| 10 |
+
"macro_f1": 0.5704794001767052,
|
| 11 |
+
"n_scored_docs": 30,
|
| 12 |
+
"n_skipped_empty_docs": 1
|
| 13 |
+
},
|
| 14 |
+
"n_swa_snapshots": 9
|
| 15 |
+
}
|
seeds/seed-456/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7f86cb76a634ba0499b6c86af3598689890e8137d70da1b4a495dde10e939506
|
| 3 |
+
size 497946220
|
seeds/seed-456/seed.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
456
|
seeds/seed-456/seed_probs.npz
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:396c6ee757167a33a5bca92f58cb006bf917f466b9fbaefdd80ada654d1daac2
|
| 3 |
+
size 1285535
|