End of training
Browse files
- README.md +11 -11
- config.json +2 -66
- model.safetensors +2 -2
- runs/Feb26_08-25-13_4bf9424f0cf5/events.out.tfevents.1708935914.4bf9424f0cf5.4637.1 +3 -0
- training_args.bin +1 -1
README.md
CHANGED
@@ -17,7 +17,7 @@ should probably proofread and complete it, then remove this comment. -->
|
|
17 |
|
18 |
This model is a fine-tuned version of [distilbert-base-cased](https://huggingface.co/distilbert-base-cased) on the None dataset.
|
19 |
It achieves the following results on the evaluation set:
|
20 |
-
- Loss: 4.
|
21 |
- Accuracy: 0.0
|
22 |
|
23 |
## Model description
|
@@ -49,16 +49,16 @@ The following hyperparameters were used during training:
|
|
49 |
|
50 |
| Training Loss | Epoch | Step | Validation Loss | Accuracy |
|
51 |
|:-------------:|:-----:|:----:|:---------------:|:--------:|
|
52 |
-
| 4.
|
53 |
-
| 4.
|
54 |
-
| 4.
|
55 |
-
| 4.
|
56 |
-
| 4.
|
57 |
-
| 4.
|
58 |
-
| 4.
|
59 |
-
| 4.
|
60 |
-
| 4.
|
61 |
-
| 4.
|
62 |
|
63 |
|
64 |
### Framework versions
|
|
|
17 |
|
18 |
This model is a fine-tuned version of [distilbert-base-cased](https://huggingface.co/distilbert-base-cased) on the None dataset.
|
19 |
It achieves the following results on the evaluation set:
|
20 |
+
- Loss: 4.6439
|
21 |
- Accuracy: 0.0
|
22 |
|
23 |
## Model description
|
|
|
49 |
|
50 |
| Training Loss | Epoch | Step | Validation Loss | Accuracy |
|
51 |
|:-------------:|:-----:|:----:|:---------------:|:--------:|
|
52 |
+
| 4.4693 | 1.0 | 33 | 4.4433 | 0.0 |
|
53 |
+
| 4.4849 | 2.0 | 66 | 4.5026 | 0.0 |
|
54 |
+
| 4.4433 | 3.0 | 99 | 4.5717 | 0.0 |
|
55 |
+
| 4.4234 | 4.0 | 132 | 4.5887 | 0.0 |
|
56 |
+
| 4.4015 | 5.0 | 165 | 4.6163 | 0.0 |
|
57 |
+
| 4.3956 | 6.0 | 198 | 4.6046 | 0.0 |
|
58 |
+
| 4.3878 | 7.0 | 231 | 4.6354 | 0.0 |
|
59 |
+
| 4.3759 | 8.0 | 264 | 4.6372 | 0.0 |
|
60 |
+
| 4.3787 | 9.0 | 297 | 4.6405 | 0.0 |
|
61 |
+
| 4.3678 | 10.0 | 330 | 4.6439 | 0.0 |
|
62 |
|
63 |
|
64 |
### Framework versions
|
config.json
CHANGED
@@ -89,59 +89,14 @@
|
|
89 |
"77": "LABEL_77",
|
90 |
"78": "LABEL_78",
|
91 |
"79": "LABEL_79",
|
92 |
-
"80": "LABEL_80",
|
93 |
-
"81": "LABEL_81",
|
94 |
-
"82": "LABEL_82",
|
95 |
-
"83": "LABEL_83",
|
96 |
-
"84": "LABEL_84",
|
97 |
-
"85": "LABEL_85",
|
98 |
-
"86": "LABEL_86",
|
99 |
-
"87": "LABEL_87",
|
100 |
-
"88": "LABEL_88",
|
101 |
-
"89": "LABEL_89",
|
102 |
-
"90": "LABEL_90",
|
103 |
-
"91": "LABEL_91",
|
104 |
-
"92": "LABEL_92",
|
105 |
-
"93": "LABEL_93",
|
106 |
-
"94": "LABEL_94",
|
107 |
-
"95": "LABEL_95",
|
108 |
-
"96": "LABEL_96",
|
109 |
-
"97": "LABEL_97",
|
110 |
-
"98": "LABEL_98",
|
111 |
-
"99": "LABEL_99",
|
112 |
-
"100": "LABEL_100",
|
113 |
-
"101": "LABEL_101",
|
114 |
-
"102": "LABEL_102",
|
115 |
-
"103": "LABEL_103",
|
116 |
-
"104": "LABEL_104",
|
117 |
-
"105": "LABEL_105",
|
118 |
-
"106": "LABEL_106",
|
119 |
-
"107": "LABEL_107",
|
120 |
-
"108": "LABEL_108",
|
121 |
-
"109": "LABEL_109",
|
122 |
-
"110": "LABEL_110",
|
123 |
-
"111": "LABEL_111",
|
124 |
-
"112": "LABEL_112"
|
125 |
},
|
126 |
"initializer_range": 0.02,
|
127 |
"label2id": {
|
128 |
"LABEL_0": 0,
|
129 |
"LABEL_1": 1,
|
130 |
"LABEL_10": 10,
|
131 |
-
"LABEL_100": 100,
|
132 |
-
"LABEL_101": 101,
|
133 |
-
"LABEL_102": 102,
|
134 |
-
"LABEL_103": 103,
|
135 |
-
"LABEL_104": 104,
|
136 |
-
"LABEL_105": 105,
|
137 |
-
"LABEL_106": 106,
|
138 |
-
"LABEL_107": 107,
|
139 |
-
"LABEL_108": 108,
|
140 |
-
"LABEL_109": 109,
|
141 |
"LABEL_11": 11,
|
142 |
-
"LABEL_110": 110,
|
143 |
-
"LABEL_111": 111,
|
144 |
-
"LABEL_112": 112,
|
145 |
"LABEL_12": 12,
|
146 |
"LABEL_13": 13,
|
147 |
"LABEL_14": 14,
|
@@ -218,26 +173,7 @@
|
|
218 |
"LABEL_79": 79,
|
219 |
"LABEL_8": 8,
|
220 |
"LABEL_80": 80,
|
221 |
-
"LABEL_81": 81,
|
222 |
-
"LABEL_82": 82,
|
223 |
-
"LABEL_83": 83,
|
224 |
-
"LABEL_84": 84,
|
225 |
-
"LABEL_85": 85,
|
226 |
-
"LABEL_86": 86,
|
227 |
-
"LABEL_87": 87,
|
228 |
-
"LABEL_88": 88,
|
229 |
-
"LABEL_89": 89,
|
230 |
-
"LABEL_9": 9,
|
231 |
-
"LABEL_90": 90,
|
232 |
-
"LABEL_91": 91,
|
233 |
-
"LABEL_92": 92,
|
234 |
-
"LABEL_93": 93,
|
235 |
-
"LABEL_94": 94,
|
236 |
-
"LABEL_95": 95,
|
237 |
-
"LABEL_96": 96,
|
238 |
-
"LABEL_97": 97,
|
239 |
-
"LABEL_98": 98,
|
240 |
-
"LABEL_99": 99
|
241 |
},
|
242 |
"max_position_embeddings": 512,
|
243 |
"model_type": "distilbert",
|
|
|
89 |
"77": "LABEL_77",
|
90 |
"78": "LABEL_78",
|
91 |
"79": "LABEL_79",
|
92 |
+
"80": "LABEL_80"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
93 |
},
|
94 |
"initializer_range": 0.02,
|
95 |
"label2id": {
|
96 |
"LABEL_0": 0,
|
97 |
"LABEL_1": 1,
|
98 |
"LABEL_10": 10,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
99 |
"LABEL_11": 11,
|
|
|
|
|
|
|
100 |
"LABEL_12": 12,
|
101 |
"LABEL_13": 13,
|
102 |
"LABEL_14": 14,
|
|
|
173 |
"LABEL_79": 79,
|
174 |
"LABEL_8": 8,
|
175 |
"LABEL_80": 80,
|
176 |
+
"LABEL_9": 9
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
177 |
},
|
178 |
"max_position_embeddings": 512,
|
179 |
"model_type": "distilbert",
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89196b0951d881816ae97e5782db86a5a1aef25353df45cae29080501da56c9a
|
3 |
+
size 263387700
|
runs/Feb26_08-25-13_4bf9424f0cf5/events.out.tfevents.1708935914.4bf9424f0cf5.4637.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd495ca7897673218530a4749c42543e9aa6d856dc782f8f9f0b89a289b6717f
|
3 |
+
size 13527
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4856
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:684aa349da091b0dd2c977f7036b5bddc13e9f83696bf84a862a8feab74f6c45
|
3 |
size 4856
|