Commit 8bb7aea1 authored by wenjh's avatar wenjh
Browse files

Merge branch 'develop_v2.7' into release_v2.7

parents bfcd6493 4922108e
......@@ -350,6 +350,12 @@ NVTEDType nvte_tensor_type(const NVTETensor tensor) {
return static_cast<NVTEDType>(t->dtype());
}
// Because of a HIP compiler bug, we need to disable optimizations for
// nvte_make_shape when compiling for AMD GPUs (the issue is seen while
// running test_float8blockwisetensor.py).
// TODO: remove this once the HIP compiler bug is fixed.
#ifdef __HIP_PLATFORM_AMD__
#pragma clang optimize off
#endif
NVTEShape nvte_make_shape(const size_t *data, size_t ndim) {
NVTEShape ret;
if (ndim == 0) {
......@@ -363,6 +369,12 @@ NVTEShape nvte_make_shape(const size_t *data, size_t ndim) {
ret.ndim = ndim;
return ret;
}
// Re-enable optimizations that were turned off before nvte_make_shape as a
// workaround for a HIP compiler bug on AMD GPUs (the issue is seen while
// running test_float8blockwisetensor.py).
// TODO: remove this once the HIP compiler bug is fixed.
#ifdef __HIP_PLATFORM_AMD__
#pragma clang optimize on
#endif
NVTEShape nvte_tensor_shape(const NVTETensor tensor) {
auto *t = transformer_engine::convertNVTETensor(tensor);
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment