Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
bitsandbytes
Commits
369a51c4
Commit 369a51c4 authored Mar 10, 2023 by Phil Wang
Browse files
switch all eps to beta2
parent 6c377b39
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing 1 changed file with 2 additions and 6 deletions
+2
-6
csrc/kernels.cu
csrc/kernels.cu
+2
-6
No files found.
csrc/kernels.cu
View file @
369a51c4
...
@@ -799,8 +799,7 @@ __global__ void kPreconditionOptimizer32bit1State(T* g, T* p,
...
@@ -799,8 +799,7 @@ __global__ void kPreconditionOptimizer32bit1State(T* g, T* p,
s1_vals
[
j
]
=
s1_vals
[
j
]
*
s1_vals
[
j
];
// update norm
s1_vals
[
j
]
=
s1_vals
[
j
]
*
s1_vals
[
j
];
// update norm
break
;
break
;
case
LION
:
case
LION
:
// using eps as beta2
s1_vals
[
j
]
=
s1_vals
[
j
]
*
beta2
+
((
1.0
f
-
beta2
)
*
(
float
)
g_vals
[
j
]);
// state update
s1_vals
[
j
]
=
s1_vals
[
j
]
*
eps
+
((
1.0
f
-
eps
)
*
(
float
)
g_vals
[
j
]);
// state update
break
;
break
;
case
RMSPROP
:
case
RMSPROP
:
s1_vals
[
j
]
=
s1_vals
[
j
]
*
beta1
+
((
1.0
f
-
beta1
)
*
((
float
)
g_vals
[
j
])
*
((
float
)
g_vals
[
j
]));
// state update
s1_vals
[
j
]
=
s1_vals
[
j
]
*
beta1
+
((
1.0
f
-
beta1
)
*
((
float
)
g_vals
[
j
])
*
((
float
)
g_vals
[
j
]));
// state update
...
@@ -903,9 +902,8 @@ __global__ void kOptimizer32bit1State(T *g, T *p,
...
@@ -903,9 +902,8 @@ __global__ void kOptimizer32bit1State(T *g, T *p,
p_vals
[
j
]
=
((
float
)
p_vals
[
j
])
+
update_scale
*
(
-
lr
*
(
s1_vals
[
j
]));
p_vals
[
j
]
=
((
float
)
p_vals
[
j
])
+
update_scale
*
(
-
lr
*
(
s1_vals
[
j
]));
break
;
break
;
case
LION
:
case
LION
:
// using eps as beta2
p_vals
[
j
]
=
((
float
)
p_vals
[
j
])
-
update_scale
*
(
lr
*
sgn
(((
float
)
s1_vals
[
j
])
*
beta1
+
((
1.0
f
-
beta1
)
*
((
float
)
g_vals
[
j
]))));
p_vals
[
j
]
=
((
float
)
p_vals
[
j
])
-
update_scale
*
(
lr
*
sgn
(((
float
)
s1_vals
[
j
])
*
beta1
+
((
1.0
f
-
beta1
)
*
((
float
)
g_vals
[
j
]))));
s1_vals
[
j
]
=
s1_vals
[
j
]
*
eps
+
((
1.0
f
-
eps
)
*
((
float
)
g_vals
[
j
]));
s1_vals
[
j
]
=
s1_vals
[
j
]
*
beta2
+
((
1.0
f
-
beta2
)
*
((
float
)
g_vals
[
j
]));
break
;
break
;
case
RMSPROP
:
case
RMSPROP
:
s1_vals
[
j
]
=
s1_vals
[
j
]
*
beta1
+
((
1.0
f
-
beta1
)
*
((
float
)
g_vals
[
j
])
*
((
float
)
g_vals
[
j
]));
s1_vals
[
j
]
=
s1_vals
[
j
]
*
beta1
+
((
1.0
f
-
beta1
)
*
((
float
)
g_vals
[
j
])
*
((
float
)
g_vals
[
j
]));
...
@@ -1237,7 +1235,6 @@ kPreconditionOptimizerStatic8bit1State(T* p, T* __restrict__ const g, unsigned c
...
@@ -1237,7 +1235,6 @@ kPreconditionOptimizerStatic8bit1State(T* p, T* __restrict__ const g, unsigned c
local_unorm
+=
s1_vals
[
j
]
*
s1_vals
[
j
];
local_unorm
+=
s1_vals
[
j
]
*
s1_vals
[
j
];
break
;
break
;
case
LION
:
case
LION
:
// using eps as beta2
s1_vals
[
j
]
=
s1_vals
[
j
]
*
beta2
+
((
1.0
f
-
beta2
)
*
g_val
);
s1_vals
[
j
]
=
s1_vals
[
j
]
*
beta2
+
((
1.0
f
-
beta2
)
*
g_val
);
break
;
break
;
case
RMSPROP
:
case
RMSPROP
:
...
@@ -1354,7 +1351,6 @@ kOptimizerStatic8bit1State(T* p, T* const g, unsigned char* state1,
...
@@ -1354,7 +1351,6 @@ kOptimizerStatic8bit1State(T* p, T* const g, unsigned char* state1,
p_vals
[
j
]
=
((
float
)
p_vals
[
j
])
+
(
-
lr
*
update_scale
*
(
s1_vals
[
j
]));
p_vals
[
j
]
=
((
float
)
p_vals
[
j
])
+
(
-
lr
*
update_scale
*
(
s1_vals
[
j
]));
break
;
break
;
case
LION
:
case
LION
:
// using eps as beta2
p_vals
[
j
]
=
((
float
)
p_vals
[
j
])
-
(
lr
*
sgn
(((
float
)
s1_vals
[
j
])
*
beta1
+
((
1.0
f
-
beta1
)
*
((
float
)
g_val
))));
p_vals
[
j
]
=
((
float
)
p_vals
[
j
])
-
(
lr
*
sgn
(((
float
)
s1_vals
[
j
])
*
beta1
+
((
1.0
f
-
beta1
)
*
((
float
)
g_val
))));
s1_vals
[
j
]
=
s1_vals
[
j
]
*
beta2
+
((
1.0
f
-
beta2
)
*
g_val
);
s1_vals
[
j
]
=
s1_vals
[
j
]
*
beta2
+
((
1.0
f
-
beta2
)
*
g_val
);
break
;
break
;
...
...
Write
Preview
Markdown is supported
0%
Try again or attach a new file.
Attach a file
Cancel
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please register or sign in to comment