Update model for torch 2.0
Browse files- loss.tsv +150 -150
- pytorch_model.bin +2 -2
- training.log +0 -0
loss.tsv
CHANGED
|
@@ -1,151 +1,151 @@
|
|
| 1 |
EPOCH TIMESTAMP BAD_EPOCHS LEARNING_RATE TRAIN_LOSS
|
| 2 |
-
|
| 3 |
-
|
| 4 |
-
|
| 5 |
-
|
| 6 |
-
|
| 7 |
-
|
| 8 |
-
|
| 9 |
-
|
| 10 |
-
|
| 11 |
-
|
| 12 |
-
|
| 13 |
-
|
| 14 |
-
|
| 15 |
-
|
| 16 |
-
|
| 17 |
-
|
| 18 |
-
|
| 19 |
-
|
| 20 |
-
|
| 21 |
-
|
| 22 |
-
|
| 23 |
-
|
| 24 |
-
|
| 25 |
-
23
|
| 26 |
-
|
| 27 |
-
|
| 28 |
-
|
| 29 |
-
|
| 30 |
-
|
| 31 |
-
|
| 32 |
-
|
| 33 |
-
|
| 34 |
-
|
| 35 |
-
|
| 36 |
-
|
| 37 |
-
|
| 38 |
-
|
| 39 |
-
|
| 40 |
-
|
| 41 |
-
|
| 42 |
-
|
| 43 |
-
|
| 44 |
-
|
| 45 |
-
|
| 46 |
-
|
| 47 |
-
|
| 48 |
-
|
| 49 |
-
|
| 50 |
-
|
| 51 |
-
|
| 52 |
-
|
| 53 |
-
|
| 54 |
-
|
| 55 |
-
|
| 56 |
-
|
| 57 |
-
|
| 58 |
-
|
| 59 |
-
|
| 60 |
-
|
| 61 |
-
|
| 62 |
-
|
| 63 |
-
|
| 64 |
-
|
| 65 |
-
|
| 66 |
-
|
| 67 |
-
|
| 68 |
-
|
| 69 |
-
|
| 70 |
-
|
| 71 |
-
|
| 72 |
-
|
| 73 |
-
|
| 74 |
-
|
| 75 |
-
|
| 76 |
-
|
| 77 |
-
|
| 78 |
-
|
| 79 |
-
|
| 80 |
-
|
| 81 |
-
|
| 82 |
-
|
| 83 |
-
|
| 84 |
-
|
| 85 |
-
|
| 86 |
-
|
| 87 |
-
|
| 88 |
-
|
| 89 |
-
|
| 90 |
-
|
| 91 |
-
|
| 92 |
-
|
| 93 |
-
|
| 94 |
-
|
| 95 |
-
|
| 96 |
-
|
| 97 |
-
|
| 98 |
-
|
| 99 |
-
|
| 100 |
-
|
| 101 |
-
|
| 102 |
-
|
| 103 |
-
|
| 104 |
-
|
| 105 |
-
|
| 106 |
-
|
| 107 |
-
|
| 108 |
-
|
| 109 |
-
|
| 110 |
-
|
| 111 |
-
|
| 112 |
-
|
| 113 |
-
|
| 114 |
-
|
| 115 |
-
|
| 116 |
-
|
| 117 |
-
|
| 118 |
-
|
| 119 |
-
|
| 120 |
-
|
| 121 |
-
|
| 122 |
-
|
| 123 |
-
|
| 124 |
-
|
| 125 |
-
|
| 126 |
-
|
| 127 |
-
|
| 128 |
-
|
| 129 |
-
|
| 130 |
-
|
| 131 |
-
|
| 132 |
-
|
| 133 |
-
|
| 134 |
-
|
| 135 |
-
|
| 136 |
-
|
| 137 |
-
|
| 138 |
-
|
| 139 |
-
|
| 140 |
-
|
| 141 |
-
|
| 142 |
-
|
| 143 |
-
|
| 144 |
-
|
| 145 |
-
|
| 146 |
-
|
| 147 |
-
|
| 148 |
-
|
| 149 |
-
|
| 150 |
-
|
| 151 |
-
|
|
|
|
| 1 |
EPOCH TIMESTAMP BAD_EPOCHS LEARNING_RATE TRAIN_LOSS
|
| 2 |
+
1 22:35:47 0 0.1000 0.6185386979491163
|
| 3 |
+
2 22:37:13 0 0.1000 0.35425149667336975
|
| 4 |
+
3 22:38:39 0 0.1000 0.2847189320082355
|
| 5 |
+
4 22:40:05 0 0.1000 0.2511436243545832
|
| 6 |
+
5 22:41:34 0 0.1000 0.23117349088495384
|
| 7 |
+
6 22:43:00 0 0.1000 0.21602252507454017
|
| 8 |
+
7 22:44:26 0 0.1000 0.20519561000249947
|
| 9 |
+
8 22:45:52 0 0.1000 0.19606535345403814
|
| 10 |
+
9 22:47:18 0 0.1000 0.18937375626512343
|
| 11 |
+
10 22:48:44 0 0.1000 0.1840467118037753
|
| 12 |
+
11 22:50:14 0 0.1000 0.17826202811872788
|
| 13 |
+
12 22:51:40 0 0.1000 0.17257516769856251
|
| 14 |
+
13 22:53:06 0 0.1000 0.17004089867849126
|
| 15 |
+
14 22:54:32 0 0.1000 0.1674512182404545
|
| 16 |
+
15 22:55:59 0 0.1000 0.162695748672466
|
| 17 |
+
16 22:57:25 0 0.1000 0.15969865723244933
|
| 18 |
+
17 22:58:55 0 0.1000 0.15709127009749108
|
| 19 |
+
18 23:00:21 0 0.1000 0.15503562445428395
|
| 20 |
+
19 23:01:48 0 0.1000 0.15270262263512277
|
| 21 |
+
20 23:03:14 0 0.1000 0.1510941066990498
|
| 22 |
+
21 23:04:40 0 0.1000 0.14932266930859522
|
| 23 |
+
22 23:06:07 0 0.1000 0.1470182456187978
|
| 24 |
+
23 23:07:37 0 0.1000 0.1457172039258319
|
| 25 |
+
24 23:09:03 0 0.1000 0.14393406125538014
|
| 26 |
+
25 23:10:29 0 0.1000 0.14385275766856767
|
| 27 |
+
26 23:11:55 0 0.1000 0.14190089184282434
|
| 28 |
+
27 23:13:21 0 0.1000 0.14065581695284723
|
| 29 |
+
28 23:14:47 0 0.1000 0.13984803497010026
|
| 30 |
+
29 23:16:13 0 0.1000 0.13779102864588055
|
| 31 |
+
30 23:17:42 0 0.1000 0.13662742603662983
|
| 32 |
+
31 23:19:08 0 0.1000 0.13565194226737304
|
| 33 |
+
32 23:20:34 0 0.1000 0.13518672968977555
|
| 34 |
+
33 23:22:00 0 0.1000 0.13349508199443283
|
| 35 |
+
34 23:23:27 0 0.1000 0.1328433563338708
|
| 36 |
+
35 23:24:54 0 0.1000 0.13239602488796381
|
| 37 |
+
36 23:26:24 0 0.1000 0.13126545035438267
|
| 38 |
+
37 23:27:50 0 0.1000 0.13032329117285507
|
| 39 |
+
38 23:29:15 0 0.1000 0.12967605260009363
|
| 40 |
+
39 23:30:42 0 0.1000 0.12823001531030498
|
| 41 |
+
40 23:32:08 1 0.1000 0.1284607936641232
|
| 42 |
+
41 23:33:34 0 0.1000 0.12681522469629725
|
| 43 |
+
42 23:35:04 1 0.1000 0.12734182916553433
|
| 44 |
+
43 23:36:30 2 0.1000 0.1269227986521394
|
| 45 |
+
44 23:37:56 0 0.1000 0.12565881975659207
|
| 46 |
+
45 23:39:23 0 0.1000 0.12519508085494402
|
| 47 |
+
46 23:40:49 0 0.1000 0.12404177472295658
|
| 48 |
+
47 23:42:15 1 0.1000 0.12408841278395216
|
| 49 |
+
48 23:43:45 0 0.1000 0.12314501778824564
|
| 50 |
+
49 23:45:11 1 0.1000 0.1233327621823897
|
| 51 |
+
50 23:46:37 0 0.1000 0.12299835928596695
|
| 52 |
+
51 23:48:04 0 0.1000 0.12123994974894345
|
| 53 |
+
52 23:49:31 1 0.1000 0.12165050480605238
|
| 54 |
+
53 23:50:57 2 0.1000 0.12190621421044297
|
| 55 |
+
54 23:52:27 3 0.1000 0.12148307878506295
|
| 56 |
+
55 23:53:53 0 0.1000 0.12107830343735118
|
| 57 |
+
56 23:55:20 0 0.1000 0.11973224276370659
|
| 58 |
+
57 23:56:46 0 0.1000 0.1197231555685797
|
| 59 |
+
58 23:58:13 1 0.1000 0.11982733714107378
|
| 60 |
+
59 23:59:40 0 0.1000 0.1186234302452136
|
| 61 |
+
60 00:01:10 1 0.1000 0.11877469808988217
|
| 62 |
+
61 00:02:36 0 0.1000 0.11857459796107021
|
| 63 |
+
62 00:04:02 0 0.1000 0.11788056248318465
|
| 64 |
+
63 00:05:28 0 0.1000 0.11753227896787243
|
| 65 |
+
64 00:06:54 1 0.1000 0.11839604508488215
|
| 66 |
+
65 00:08:21 2 0.1000 0.11754489395727863
|
| 67 |
+
66 00:09:46 0 0.1000 0.11684117560843098
|
| 68 |
+
67 00:11:16 1 0.1000 0.11738160970829112
|
| 69 |
+
68 00:12:43 2 0.1000 0.11714554606522035
|
| 70 |
+
69 00:14:10 0 0.1000 0.11576811394084595
|
| 71 |
+
70 00:15:37 0 0.1000 0.11554254914212171
|
| 72 |
+
71 00:17:03 1 0.1000 0.11647530727936514
|
| 73 |
+
72 00:18:29 2 0.1000 0.11567563767617331
|
| 74 |
+
73 00:19:58 0 0.1000 0.11494111494974645
|
| 75 |
+
74 00:21:24 1 0.1000 0.11502925348073567
|
| 76 |
+
75 00:22:50 0 0.1000 0.11411993730412628
|
| 77 |
+
76 00:24:16 1 0.1000 0.11520848208183947
|
| 78 |
+
77 00:25:42 2 0.1000 0.1141347627556906
|
| 79 |
+
78 00:27:08 3 0.1000 0.11457895267200477
|
| 80 |
+
79 00:28:37 4 0.1000 0.11420622195693127
|
| 81 |
+
80 00:30:03 0 0.0500 0.10795398784493494
|
| 82 |
+
81 00:31:30 0 0.0500 0.10602036640232343
|
| 83 |
+
82 00:32:56 0 0.0500 0.10486684786257999
|
| 84 |
+
83 00:34:22 0 0.0500 0.10366360462302777
|
| 85 |
+
84 00:35:48 0 0.0500 0.10208262046329922
|
| 86 |
+
85 00:37:18 1 0.0500 0.10267644960671718
|
| 87 |
+
86 00:38:44 2 0.0500 0.10220844389540555
|
| 88 |
+
87 00:40:10 0 0.0500 0.10176323697548192
|
| 89 |
+
88 00:41:37 0 0.0500 0.10145811281533831
|
| 90 |
+
89 00:43:04 0 0.0500 0.10073493381539385
|
| 91 |
+
90 00:44:30 0 0.0500 0.10003284362986388
|
| 92 |
+
91 00:46:00 0 0.0500 0.09971309983285824
|
| 93 |
+
92 00:47:27 1 0.0500 0.10014370045603127
|
| 94 |
+
93 00:48:54 0 0.0500 0.09950157016239228
|
| 95 |
+
94 00:50:20 0 0.0500 0.09870167721845441
|
| 96 |
+
95 00:51:46 1 0.0500 0.09888381383314052
|
| 97 |
+
96 00:53:12 2 0.0500 0.09904931203072968
|
| 98 |
+
97 00:54:42 0 0.0500 0.0981977160994476
|
| 99 |
+
98 00:56:08 1 0.0500 0.09840684165225154
|
| 100 |
+
99 00:57:34 2 0.0500 0.09854188623190752
|
| 101 |
+
100 00:59:01 0 0.0500 0.09724489597465445
|
| 102 |
+
101 01:00:27 1 0.0500 0.09800776515795306
|
| 103 |
+
102 01:01:53 2 0.0500 0.09730516631984973
|
| 104 |
+
103 01:03:23 0 0.0500 0.09708681998832927
|
| 105 |
+
104 01:04:48 0 0.0500 0.09667254237364362
|
| 106 |
+
105 01:06:14 1 0.0500 0.09670696384355838
|
| 107 |
+
106 01:07:40 2 0.0500 0.09676833900408663
|
| 108 |
+
107 01:09:06 0 0.0500 0.09592908512829337
|
| 109 |
+
108 01:10:32 1 0.0500 0.09662516932272135
|
| 110 |
+
109 01:11:59 2 0.0500 0.09593727191313531
|
| 111 |
+
110 01:13:28 0 0.0500 0.09564112964561697
|
| 112 |
+
111 01:14:55 1 0.0500 0.09575963952404815
|
| 113 |
+
112 01:16:21 2 0.0500 0.09591712979367935
|
| 114 |
+
113 01:17:47 3 0.0500 0.09568467247528191
|
| 115 |
+
114 01:19:13 0 0.0500 0.095186163811696
|
| 116 |
+
115 01:20:39 0 0.0500 0.0949202717351177
|
| 117 |
+
116 01:22:08 1 0.0500 0.0950977818689685
|
| 118 |
+
117 01:23:34 0 0.0500 0.09404966824933877
|
| 119 |
+
118 01:24:59 1 0.0500 0.09479988241966152
|
| 120 |
+
119 01:26:25 2 0.0500 0.09489803382113102
|
| 121 |
+
120 01:27:51 3 0.0500 0.09449563222705677
|
| 122 |
+
121 01:29:17 4 0.0500 0.09468987507245533
|
| 123 |
+
122 01:30:47 0 0.0250 0.09134418527600222
|
| 124 |
+
123 01:32:13 0 0.0250 0.09082381542069164
|
| 125 |
+
124 01:33:38 0 0.0250 0.09037322334509629
|
| 126 |
+
125 01:35:04 0 0.0250 0.08931219590682289
|
| 127 |
+
126 01:36:29 0 0.0250 0.08891356897803261
|
| 128 |
+
127 01:37:55 1 0.0250 0.08925827653916675
|
| 129 |
+
128 01:39:24 2 0.0250 0.08895860887866681
|
| 130 |
+
129 01:40:49 0 0.0250 0.08861667817147073
|
| 131 |
+
130 01:42:14 0 0.0250 0.08831161051073677
|
| 132 |
+
131 01:43:39 1 0.0250 0.08884769677088612
|
| 133 |
+
132 01:45:05 2 0.0250 0.08859108850919213
|
| 134 |
+
133 01:46:30 3 0.0250 0.08842932986526847
|
| 135 |
+
134 01:47:58 4 0.0250 0.0885590172332143
|
| 136 |
+
135 01:49:23 0 0.0125 0.08705202528985626
|
| 137 |
+
136 01:50:48 0 0.0125 0.085988338016098
|
| 138 |
+
137 01:52:13 1 0.0125 0.08640655156025905
|
| 139 |
+
138 01:53:39 0 0.0125 0.08551047135828416
|
| 140 |
+
139 01:55:03 0 0.0125 0.08537939956909106
|
| 141 |
+
140 01:56:31 0 0.0125 0.08515134156268339
|
| 142 |
+
141 01:57:56 1 0.0125 0.08585624558381849
|
| 143 |
+
142 01:59:20 2 0.0125 0.0854624627008124
|
| 144 |
+
143 02:00:45 0 0.0125 0.08434762984684457
|
| 145 |
+
144 02:02:09 1 0.0125 0.08494414218647221
|
| 146 |
+
145 02:03:34 2 0.0125 0.08493393421362688
|
| 147 |
+
146 02:04:58 3 0.0125 0.08512776477542741
|
| 148 |
+
147 02:06:26 0 0.0125 0.08401921594672918
|
| 149 |
+
148 02:07:50 1 0.0125 0.08420663117349429
|
| 150 |
+
149 02:09:14 0 0.0125 0.0838463399628542
|
| 151 |
+
150 02:10:38 1 0.0125 0.08395460257606586
|
pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee6ea9ae384609494cd862c34b9c75e0989b824305cb73084cbe762e11e647b9
|
| 3 |
+
size 108301323
|
training.log
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|