Update model for torch 2.0
Browse files- loss.tsv +150 -150
- pytorch_model.bin +2 -2
- training.log +0 -0
loss.tsv
CHANGED
|
@@ -1,151 +1,151 @@
|
|
| 1 |
EPOCH TIMESTAMP BAD_EPOCHS LEARNING_RATE TRAIN_LOSS
|
| 2 |
-
|
| 3 |
-
|
| 4 |
-
|
| 5 |
-
|
| 6 |
-
|
| 7 |
-
|
| 8 |
-
|
| 9 |
-
|
| 10 |
-
|
| 11 |
-
|
| 12 |
-
|
| 13 |
-
|
| 14 |
-
|
| 15 |
-
|
| 16 |
-
|
| 17 |
-
|
| 18 |
-
|
| 19 |
-
|
| 20 |
-
|
| 21 |
-
|
| 22 |
-
|
| 23 |
-
|
| 24 |
-
|
| 25 |
-
|
| 26 |
-
|
| 27 |
-
|
| 28 |
-
|
| 29 |
-
|
| 30 |
-
|
| 31 |
-
|
| 32 |
-
|
| 33 |
-
|
| 34 |
-
|
| 35 |
-
|
| 36 |
-
|
| 37 |
-
|
| 38 |
-
|
| 39 |
-
|
| 40 |
-
|
| 41 |
-
|
| 42 |
-
|
| 43 |
-
|
| 44 |
-
|
| 45 |
-
|
| 46 |
-
|
| 47 |
-
|
| 48 |
-
|
| 49 |
-
|
| 50 |
-
|
| 51 |
-
|
| 52 |
-
|
| 53 |
-
|
| 54 |
-
|
| 55 |
-
|
| 56 |
-
|
| 57 |
-
|
| 58 |
-
|
| 59 |
-
|
| 60 |
-
|
| 61 |
-
|
| 62 |
-
|
| 63 |
-
|
| 64 |
-
|
| 65 |
-
|
| 66 |
-
|
| 67 |
-
|
| 68 |
-
|
| 69 |
-
|
| 70 |
-
|
| 71 |
-
|
| 72 |
-
|
| 73 |
-
|
| 74 |
-
|
| 75 |
-
|
| 76 |
-
|
| 77 |
-
|
| 78 |
-
|
| 79 |
-
|
| 80 |
-
|
| 81 |
-
|
| 82 |
-
|
| 83 |
-
|
| 84 |
-
|
| 85 |
-
|
| 86 |
-
|
| 87 |
-
|
| 88 |
-
|
| 89 |
-
|
| 90 |
-
|
| 91 |
-
|
| 92 |
-
|
| 93 |
-
|
| 94 |
-
|
| 95 |
-
|
| 96 |
-
|
| 97 |
-
|
| 98 |
-
|
| 99 |
-
|
| 100 |
-
|
| 101 |
-
|
| 102 |
-
|
| 103 |
-
|
| 104 |
-
|
| 105 |
-
|
| 106 |
-
|
| 107 |
-
|
| 108 |
-
|
| 109 |
-
|
| 110 |
-
|
| 111 |
-
|
| 112 |
-
|
| 113 |
-
|
| 114 |
-
|
| 115 |
-
|
| 116 |
-
|
| 117 |
-
|
| 118 |
-
|
| 119 |
-
|
| 120 |
-
|
| 121 |
-
|
| 122 |
-
|
| 123 |
-
|
| 124 |
-
|
| 125 |
-
|
| 126 |
-
|
| 127 |
-
|
| 128 |
-
|
| 129 |
-
|
| 130 |
-
|
| 131 |
-
|
| 132 |
-
|
| 133 |
-
|
| 134 |
-
|
| 135 |
-
|
| 136 |
-
|
| 137 |
-
|
| 138 |
-
|
| 139 |
-
|
| 140 |
-
|
| 141 |
-
|
| 142 |
-
|
| 143 |
-
|
| 144 |
-
|
| 145 |
-
|
| 146 |
-
|
| 147 |
-
|
| 148 |
-
|
| 149 |
-
|
| 150 |
-
|
| 151 |
-
|
|
|
|
| 1 |
EPOCH TIMESTAMP BAD_EPOCHS LEARNING_RATE TRAIN_LOSS
|
| 2 |
+
1 22:40:56 0 0.1000 0.0945024522987675
|
| 3 |
+
2 22:51:41 0 0.1000 0.055215560597502246
|
| 4 |
+
3 23:02:23 0 0.1000 0.04952181141699733
|
| 5 |
+
4 23:13:03 0 0.1000 0.046546286818927696
|
| 6 |
+
5 23:23:50 0 0.1000 0.044674422992666364
|
| 7 |
+
6 23:34:40 0 0.1000 0.043379003066180775
|
| 8 |
+
7 23:45:29 0 0.1000 0.04226557562207461
|
| 9 |
+
8 23:56:17 0 0.1000 0.0416480286894472
|
| 10 |
+
9 00:07:06 0 0.1000 0.040844577245091315
|
| 11 |
+
10 00:17:56 0 0.1000 0.04028057295105605
|
| 12 |
+
11 00:28:49 0 0.1000 0.039795858246050086
|
| 13 |
+
12 00:39:37 0 0.1000 0.039294909804427326
|
| 14 |
+
13 00:50:30 0 0.1000 0.03920813497924898
|
| 15 |
+
14 01:01:16 0 0.1000 0.03875447203624966
|
| 16 |
+
15 01:12:02 0 0.1000 0.03840149609313526
|
| 17 |
+
16 01:22:47 0 0.1000 0.03817139669596635
|
| 18 |
+
17 01:33:29 0 0.1000 0.037982044622196606
|
| 19 |
+
18 01:44:09 1 0.1000 0.03801343303779224
|
| 20 |
+
19 01:54:44 0 0.1000 0.03780869265705829
|
| 21 |
+
20 02:05:16 0 0.1000 0.03755916743374315
|
| 22 |
+
21 02:15:44 0 0.1000 0.03743201834629877
|
| 23 |
+
22 02:26:19 0 0.1000 0.03728124974840063
|
| 24 |
+
23 02:36:48 0 0.1000 0.03713726534776972
|
| 25 |
+
24 02:47:18 0 0.1000 0.03693011091447085
|
| 26 |
+
25 02:57:50 0 0.1000 0.036884413869251856
|
| 27 |
+
26 03:08:19 0 0.1000 0.03682199553617605
|
| 28 |
+
27 03:18:49 0 0.1000 0.036754411050049944
|
| 29 |
+
28 03:29:22 0 0.1000 0.03647368471633433
|
| 30 |
+
29 03:39:51 1 0.1000 0.03656561237095109
|
| 31 |
+
30 03:50:23 0 0.1000 0.03638562648649369
|
| 32 |
+
31 04:00:59 1 0.1000 0.03653519022706945
|
| 33 |
+
32 04:11:32 2 0.1000 0.03640496369512824
|
| 34 |
+
33 04:22:06 0 0.1000 0.0362223800162023
|
| 35 |
+
34 04:32:38 1 0.1000 0.036548178269857776
|
| 36 |
+
35 04:43:10 2 0.1000 0.03625923607029886
|
| 37 |
+
36 04:53:39 0 0.1000 0.03613866373458298
|
| 38 |
+
37 05:04:12 1 0.1000 0.03621617400172113
|
| 39 |
+
38 05:14:42 2 0.1000 0.0362809314033135
|
| 40 |
+
39 05:25:15 3 0.1000 0.03633763824480552
|
| 41 |
+
40 05:35:45 0 0.1000 0.03603039296579129
|
| 42 |
+
41 05:46:18 1 0.1000 0.03612727204641081
|
| 43 |
+
42 05:56:52 0 0.1000 0.03602838543831496
|
| 44 |
+
43 06:07:28 1 0.1000 0.03611080840002592
|
| 45 |
+
44 06:18:01 2 0.1000 0.03604925517216913
|
| 46 |
+
45 06:28:33 0 0.1000 0.03588281072517095
|
| 47 |
+
46 06:39:06 1 0.1000 0.03607414460874756
|
| 48 |
+
47 06:49:40 2 0.1000 0.035947956990319864
|
| 49 |
+
48 07:00:13 0 0.1000 0.03577572033543793
|
| 50 |
+
49 07:10:53 1 0.1000 0.03593850683126742
|
| 51 |
+
50 07:21:31 2 0.1000 0.03593144469725898
|
| 52 |
+
51 07:32:08 3 0.1000 0.036042781446044246
|
| 53 |
+
52 07:42:41 0 0.1000 0.03576243344093623
|
| 54 |
+
53 07:53:13 0 0.1000 0.03572553447241531
|
| 55 |
+
54 08:03:47 1 0.1000 0.03576076876407767
|
| 56 |
+
55 08:14:22 2 0.1000 0.03582616523426395
|
| 57 |
+
56 08:24:54 3 0.1000 0.035791065263200604
|
| 58 |
+
57 08:35:32 0 0.1000 0.03564062247409107
|
| 59 |
+
58 08:46:08 1 0.1000 0.0356570904583961
|
| 60 |
+
59 08:56:45 2 0.1000 0.03587479146006599
|
| 61 |
+
60 09:07:15 3 0.1000 0.035747757637357096
|
| 62 |
+
61 09:17:53 4 0.1000 0.035745815488534484
|
| 63 |
+
62 09:28:30 0 0.0500 0.03361754665252171
|
| 64 |
+
63 09:39:04 0 0.0500 0.032645879185562485
|
| 65 |
+
64 09:49:39 0 0.0500 0.0323963112027487
|
| 66 |
+
65 10:00:17 0 0.0500 0.03191217731426602
|
| 67 |
+
66 10:10:48 1 0.0500 0.03205001720592649
|
| 68 |
+
67 10:21:22 0 0.0500 0.03171927868092008
|
| 69 |
+
68 10:32:00 0 0.0500 0.031600463357791736
|
| 70 |
+
69 10:42:36 0 0.0500 0.03130843178445556
|
| 71 |
+
70 10:53:14 0 0.0500 0.031233917161034224
|
| 72 |
+
71 11:03:48 0 0.0500 0.03099105281411341
|
| 73 |
+
72 11:14:20 0 0.0500 0.030801373847075018
|
| 74 |
+
73 11:24:57 0 0.0500 0.03066287707036287
|
| 75 |
+
74 11:35:33 1 0.0500 0.030735509346289415
|
| 76 |
+
75 11:46:06 0 0.0500 0.03052326172995423
|
| 77 |
+
76 11:56:45 1 0.0500 0.030760341770202988
|
| 78 |
+
77 12:07:20 2 0.0500 0.030595462382825588
|
| 79 |
+
78 12:17:52 0 0.0500 0.030505499806037957
|
| 80 |
+
79 12:28:25 0 0.0500 0.03040131969595017
|
| 81 |
+
80 12:38:58 0 0.0500 0.030298029169345105
|
| 82 |
+
81 12:49:34 0 0.0500 0.03027550111058688
|
| 83 |
+
82 13:00:08 0 0.0500 0.030172374185541858
|
| 84 |
+
83 13:10:45 0 0.0500 0.03015809530165669
|
| 85 |
+
84 13:21:18 0 0.0500 0.0300457527750989
|
| 86 |
+
85 13:31:59 0 0.0500 0.0298607931553351
|
| 87 |
+
86 13:42:30 1 0.0500 0.02997382665060291
|
| 88 |
+
87 13:53:12 0 0.0500 0.029791685749383987
|
| 89 |
+
88 14:03:46 0 0.0500 0.029790540848315138
|
| 90 |
+
89 14:14:25 0 0.0500 0.02974745972387388
|
| 91 |
+
90 14:25:05 0 0.0500 0.02968233824684013
|
| 92 |
+
91 14:35:39 0 0.0500 0.0295506687367453
|
| 93 |
+
92 14:46:18 1 0.0500 0.029616575377326673
|
| 94 |
+
93 14:56:49 2 0.0500 0.029683465176525488
|
| 95 |
+
94 15:07:24 0 0.0500 0.029517761894170533
|
| 96 |
+
95 15:18:01 0 0.0500 0.029265579384910485
|
| 97 |
+
96 15:28:38 1 0.0500 0.029299482399863155
|
| 98 |
+
97 15:39:13 2 0.0500 0.029291816675250625
|
| 99 |
+
98 15:49:52 3 0.0500 0.029287658778784358
|
| 100 |
+
99 16:00:31 0 0.0500 0.02926184722432205
|
| 101 |
+
100 16:11:13 0 0.0500 0.029176589431791355
|
| 102 |
+
101 16:21:48 0 0.0500 0.028969541742313382
|
| 103 |
+
102 16:32:17 1 0.0500 0.02929986072847075
|
| 104 |
+
103 16:42:59 2 0.0500 0.029120039839904868
|
| 105 |
+
104 16:53:34 3 0.0500 0.028978051502247033
|
| 106 |
+
105 17:04:11 0 0.0500 0.028855782574974332
|
| 107 |
+
106 17:14:49 1 0.0500 0.02890924310293501
|
| 108 |
+
107 17:25:20 2 0.0500 0.028857010826080397
|
| 109 |
+
108 17:35:56 0 0.0500 0.028769463541263446
|
| 110 |
+
109 17:46:35 0 0.0500 0.028761565737922754
|
| 111 |
+
110 17:57:08 1 0.0500 0.028797699063536738
|
| 112 |
+
111 18:07:43 0 0.0500 0.028537822323331734
|
| 113 |
+
112 18:18:15 1 0.0500 0.028874799087369025
|
| 114 |
+
113 18:28:51 2 0.0500 0.02883941808105008
|
| 115 |
+
114 18:39:26 3 0.0500 0.028714295112168404
|
| 116 |
+
115 18:50:04 4 0.0500 0.02869025807689995
|
| 117 |
+
116 19:00:36 0 0.0250 0.027727492331945304
|
| 118 |
+
117 19:11:07 0 0.0250 0.027136240322025777
|
| 119 |
+
118 19:21:45 0 0.0250 0.027025794396128993
|
| 120 |
+
119 19:32:19 0 0.0250 0.026960871843719383
|
| 121 |
+
120 19:42:56 0 0.0250 0.026916801363631893
|
| 122 |
+
121 19:53:33 0 0.0250 0.026707063543956428
|
| 123 |
+
122 20:04:10 0 0.0250 0.02670125568857497
|
| 124 |
+
123 20:14:42 0 0.0250 0.026629168751181896
|
| 125 |
+
124 20:25:11 1 0.0250 0.02663639696556189
|
| 126 |
+
125 20:35:51 0 0.0250 0.026415031660768813
|
| 127 |
+
126 20:46:23 0 0.0250 0.026245318900787094
|
| 128 |
+
127 20:57:00 0 0.0250 0.02619731826504135
|
| 129 |
+
128 21:07:39 1 0.0250 0.026394183926366846
|
| 130 |
+
129 21:18:15 2 0.0250 0.026321724237692086
|
| 131 |
+
130 21:28:45 0 0.0250 0.026142019388490288
|
| 132 |
+
131 21:39:16 1 0.0250 0.02614339667813874
|
| 133 |
+
132 21:49:55 0 0.0250 0.026121453928749677
|
| 134 |
+
133 22:00:30 0 0.0250 0.026113992706087198
|
| 135 |
+
134 22:11:05 0 0.0250 0.02599400986273492
|
| 136 |
+
135 22:21:44 0 0.0250 0.02590731900729667
|
| 137 |
+
136 22:32:19 1 0.0250 0.025996867312709726
|
| 138 |
+
137 22:42:58 0 0.0250 0.025831662271469442
|
| 139 |
+
138 22:53:36 1 0.0250 0.025881532550800963
|
| 140 |
+
139 23:04:11 2 0.0250 0.02592914494269305
|
| 141 |
+
140 23:14:47 0 0.0250 0.025741110357243937
|
| 142 |
+
141 23:25:24 0 0.0250 0.025724724483570358
|
| 143 |
+
142 23:36:04 1 0.0250 0.025751754993595544
|
| 144 |
+
143 23:46:43 0 0.0250 0.025628510963842825
|
| 145 |
+
144 23:57:21 0 0.0250 0.025590345322637348
|
| 146 |
+
145 00:07:56 1 0.0250 0.025634433774108324
|
| 147 |
+
146 00:18:32 0 0.0250 0.025356779927266513
|
| 148 |
+
147 00:29:11 1 0.0250 0.025525167142790173
|
| 149 |
+
148 00:39:49 2 0.0250 0.025518080840369457
|
| 150 |
+
149 00:50:28 3 0.0250 0.025373666830717716
|
| 151 |
+
150 01:00:59 0 0.0250 0.025303713840188286
|
pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:79374cb9eced60d9bb0b3edcaf5a0e0c561b042526c20b911c4e9237a4d7ae4a
|
| 3 |
+
size 1296739140
|
training.log
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|