hayren commited on
Commit
d7848a2
·
verified ·
1 Parent(s): 8e6d1e7

Delete training_state

Browse files
training_state/optimizer_param_groups.json DELETED
@@ -1,191 +0,0 @@
1
- [
2
- {
3
- "lr": 1e-05,
4
- "betas": [
5
- 0.9,
6
- 0.999
7
- ],
8
- "eps": 1e-08,
9
- "weight_decay": 0.0001,
10
- "amsgrad": false,
11
- "maximize": false,
12
- "foreach": null,
13
- "capturable": false,
14
- "differentiable": false,
15
- "fused": null,
16
- "decoupled_weight_decay": true,
17
- "params": [
18
- 0,
19
- 1,
20
- 2,
21
- 3,
22
- 4,
23
- 5,
24
- 6,
25
- 7,
26
- 8,
27
- 9,
28
- 10,
29
- 11,
30
- 12,
31
- 13,
32
- 14,
33
- 15,
34
- 16,
35
- 17,
36
- 18,
37
- 19,
38
- 20,
39
- 21,
40
- 22,
41
- 23,
42
- 24,
43
- 25,
44
- 26,
45
- 27,
46
- 28,
47
- 29,
48
- 30,
49
- 31,
50
- 32,
51
- 33,
52
- 34,
53
- 35,
54
- 36,
55
- 37,
56
- 38,
57
- 39,
58
- 40,
59
- 41,
60
- 42,
61
- 43,
62
- 44,
63
- 45,
64
- 46,
65
- 47,
66
- 48,
67
- 49,
68
- 50,
69
- 51,
70
- 52,
71
- 53,
72
- 54,
73
- 55,
74
- 56,
75
- 57,
76
- 58,
77
- 59,
78
- 60,
79
- 61,
80
- 62,
81
- 63,
82
- 64,
83
- 65,
84
- 66,
85
- 67,
86
- 68,
87
- 69,
88
- 70,
89
- 71,
90
- 72,
91
- 73,
92
- 74,
93
- 75,
94
- 76,
95
- 77,
96
- 78,
97
- 79,
98
- 80,
99
- 81,
100
- 82,
101
- 83,
102
- 84,
103
- 85,
104
- 86,
105
- 87,
106
- 88,
107
- 89,
108
- 90,
109
- 91,
110
- 92,
111
- 93,
112
- 94,
113
- 95,
114
- 96,
115
- 97,
116
- 98,
117
- 99,
118
- 100,
119
- 101,
120
- 102,
121
- 103,
122
- 104,
123
- 105,
124
- 106,
125
- 107,
126
- 108,
127
- 109,
128
- 110,
129
- 111,
130
- 112,
131
- 113,
132
- 114,
133
- 115,
134
- 116,
135
- 117,
136
- 118,
137
- 119,
138
- 120,
139
- 121,
140
- 122,
141
- 123,
142
- 124,
143
- 125,
144
- 126,
145
- 127,
146
- 128,
147
- 129,
148
- 130,
149
- 131,
150
- 132
151
- ]
152
- },
153
- {
154
- "lr": 1e-05,
155
- "betas": [
156
- 0.9,
157
- 0.999
158
- ],
159
- "eps": 1e-08,
160
- "weight_decay": 0.0001,
161
- "amsgrad": false,
162
- "maximize": false,
163
- "foreach": null,
164
- "capturable": false,
165
- "differentiable": false,
166
- "fused": null,
167
- "decoupled_weight_decay": true,
168
- "params": [
169
- 133,
170
- 134,
171
- 135,
172
- 136,
173
- 137,
174
- 138,
175
- 139,
176
- 140,
177
- 141,
178
- 142,
179
- 143,
180
- 144,
181
- 145,
182
- 146,
183
- 147,
184
- 148,
185
- 149,
186
- 150,
187
- 151,
188
- 152
189
- ]
190
- }
191
- ]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
training_state/optimizer_state.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:0adb1e80fdb65377c9dd76a2a72b89702e9284a2f1b4cf25b126f0373776c0e0
3
- size 412997972
 
 
 
 
training_state/rng_state.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e748121e35c59a7e8219bec32e2b267266ef8f9180eb6e780961e572b36f273
3
- size 15708
 
 
 
 
training_state/training_step.json DELETED
@@ -1,3 +0,0 @@
1
- {
2
- "step": 100000
3
- }