Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
sunzhq2
bytemlperf-dcu
Commits
24b257f1
Commit
24b257f1
authored
Nov 19, 2024
by
sunzhq2
Browse files
init
parent
920b3c0f
Changes
330
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
376 additions
and
0 deletions
+376
-0
ByteMLPerf/byte_micro_perf/workloads/gelu.json
ByteMLPerf/byte_micro_perf/workloads/gelu.json
+17
-0
ByteMLPerf/byte_micro_perf/workloads/gemm.json
ByteMLPerf/byte_micro_perf/workloads/gemm.json
+27
-0
ByteMLPerf/byte_micro_perf/workloads/gemv.json
ByteMLPerf/byte_micro_perf/workloads/gemv.json
+22
-0
ByteMLPerf/byte_micro_perf/workloads/group_gemm.json
ByteMLPerf/byte_micro_perf/workloads/group_gemm.json
+15
-0
ByteMLPerf/byte_micro_perf/workloads/host2device.json
ByteMLPerf/byte_micro_perf/workloads/host2device.json
+17
-0
ByteMLPerf/byte_micro_perf/workloads/index_add.json
ByteMLPerf/byte_micro_perf/workloads/index_add.json
+21
-0
ByteMLPerf/byte_micro_perf/workloads/layernorm.json
ByteMLPerf/byte_micro_perf/workloads/layernorm.json
+17
-0
ByteMLPerf/byte_micro_perf/workloads/log.json
ByteMLPerf/byte_micro_perf/workloads/log.json
+17
-0
ByteMLPerf/byte_micro_perf/workloads/mul.json
ByteMLPerf/byte_micro_perf/workloads/mul.json
+22
-0
ByteMLPerf/byte_micro_perf/workloads/p2p.json
ByteMLPerf/byte_micro_perf/workloads/p2p.json
+26
-0
ByteMLPerf/byte_micro_perf/workloads/reduce_max.json
ByteMLPerf/byte_micro_perf/workloads/reduce_max.json
+17
-0
ByteMLPerf/byte_micro_perf/workloads/reduce_min.json
ByteMLPerf/byte_micro_perf/workloads/reduce_min.json
+17
-0
ByteMLPerf/byte_micro_perf/workloads/reduce_sum.json
ByteMLPerf/byte_micro_perf/workloads/reduce_sum.json
+17
-0
ByteMLPerf/byte_micro_perf/workloads/reducescatter.json
ByteMLPerf/byte_micro_perf/workloads/reducescatter.json
+22
-0
ByteMLPerf/byte_micro_perf/workloads/scatter.json
ByteMLPerf/byte_micro_perf/workloads/scatter.json
+17
-0
ByteMLPerf/byte_micro_perf/workloads/silu.json
ByteMLPerf/byte_micro_perf/workloads/silu.json
+17
-0
ByteMLPerf/byte_micro_perf/workloads/sin.json
ByteMLPerf/byte_micro_perf/workloads/sin.json
+17
-0
ByteMLPerf/byte_micro_perf/workloads/softmax.json
ByteMLPerf/byte_micro_perf/workloads/softmax.json
+17
-0
ByteMLPerf/byte_micro_perf/workloads/sort.json
ByteMLPerf/byte_micro_perf/workloads/sort.json
+17
-0
ByteMLPerf/byte_micro_perf/workloads/sqrt.json
ByteMLPerf/byte_micro_perf/workloads/sqrt.json
+17
-0
No files found.
ByteMLPerf/byte_micro_perf/workloads/gelu.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"gelu"
,
"iterations"
:
100
,
"input_shape_groups"
:
{
"inputs"
:
[
[
[
4
,
8
,
16
,
32
,
64
,
128
,
256
,
512
,
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
],
[
8192
]
]
]
},
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
]
}
\ No newline at end of file
ByteMLPerf/byte_micro_perf/workloads/gemm.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"gemm"
,
"iterations"
:
100
,
"input_shape_groups"
:
{
"M"
:
[
4
,
8
,
16
,
32
,
64
,
128
,
256
,
512
,
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
],
"KN"
:
[
[
1024
,
1024
],
[
4096
,
4096
],
[
8192
,
8192
],
[
12288
,
12288
],
[
16384
,
32
],
[
16384
,
128
],
[
16384
,
1024
],
[
32
,
16384
],
[
128
,
16384
],
[
1024
,
16384
]
]
},
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
,
"int8"
]
}
\ No newline at end of file
ByteMLPerf/byte_micro_perf/workloads/gemv.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"gemv"
,
"iterations"
:
100
,
"input_shape_groups"
:
[
{
"M"
:
[
1
],
"K"
:
[
16
,
32
,
64
,
128
,
256
,
512
,
1024
,
2048
,
4096
,
8192
],
"N"
:
[
4096
,
8192
]
},
{
"M"
:
[
1
],
"K"
:
[
4096
,
8192
],
"N"
:
[
16
,
32
,
64
,
128
,
256
,
512
,
1024
,
2048
,
4096
,
8192
]
}
],
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
,
"int8"
]
}
\ No newline at end of file
ByteMLPerf/byte_micro_perf/workloads/group_gemm.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"group_gemm"
,
"iterations"
:
100
,
"input_shape_groups"
:
{
"gemm_group"
:
[
1
,
2
,
3
,
4
,
5
,
6
,
7
,
8
],
"batch"
:
[
1
,
2
,
4
,
8
,
16
,
32
,
64
,
128
,
256
,
512
,
1024
,
2048
,
4096
,
8192
],
"KN"
:
[[
32
,
16384
],
[
16384
,
32
],
[
16384
,
16384
]]
},
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
,
"int8"
]
}
\ No newline at end of file
ByteMLPerf/byte_micro_perf/workloads/host2device.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"host2device"
,
"iterations"
:
100
,
"input_shape_groups"
:
{
"inputs"
:
[
[
[
4
,
8
,
16
,
32
,
64
,
128
,
256
,
512
,
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
],
[
1024
]
]
]
},
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
]
}
\ No newline at end of file
ByteMLPerf/byte_micro_perf/workloads/index_add.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"index_add"
,
"iterations"
:
100
,
"input_shape_groups"
:
{
"inputs"
:
[
[
[
1024
],
[
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
,
262144
,
524288
]
],
[
[
1024
],
[
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
,
262144
,
524288
]
]
]
},
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
]
}
\ No newline at end of file
ByteMLPerf/byte_micro_perf/workloads/layernorm.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"layernorm"
,
"iterations"
:
100
,
"input_shape_groups"
:
{
"inputs"
:
[
[
[
1024
],
[
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
,
262144
,
524288
]
]
]
},
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
]
}
\ No newline at end of file
ByteMLPerf/byte_micro_perf/workloads/log.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"log"
,
"iterations"
:
100
,
"input_shape_groups"
:
{
"inputs"
:
[
[
[
4
,
8
,
16
,
32
,
64
,
128
,
256
,
512
,
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
],
[
8192
]
]
]
},
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
]
}
\ No newline at end of file
ByteMLPerf/byte_micro_perf/workloads/mul.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"mul"
,
"iterations"
:
100
,
"input_shape_groups"
:
{
"inputs"
:
[
[
[
4
,
8
,
16
,
32
,
64
,
128
,
256
,
512
,
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
],
[
8192
]
],
[
[
4
,
8
,
16
,
32
,
64
,
128
,
256
,
512
,
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
],
[
8192
]
]
]
},
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
]
}
\ No newline at end of file
ByteMLPerf/byte_micro_perf/workloads/p2p.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"p2p"
,
"iterations"
:
100
,
"input_shape_groups"
:
{
"inputs"
:
[
[
[
8
,
16
,
32
,
64
,
128
,
256
,
512
,
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
,
262144
,
524288
,
1048576
,
2097152
],
[
1024
]
],
[
[
8
,
16
,
32
,
64
,
128
,
256
,
512
,
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
,
262144
,
524288
,
1048576
,
2097152
],
[
1024
]
]
]
},
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
],
"group"
:
[
2
,
4
,
8
]
}
\ No newline at end of file
ByteMLPerf/byte_micro_perf/workloads/reduce_max.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"reduce_max"
,
"iterations"
:
100
,
"input_shape_groups"
:
{
"inputs"
:
[
[
[
1024
],
[
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
,
262144
,
524288
]
]
]
},
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
]
}
\ No newline at end of file
ByteMLPerf/byte_micro_perf/workloads/reduce_min.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"reduce_min"
,
"iterations"
:
100
,
"input_shape_groups"
:
{
"inputs"
:
[
[
[
1024
],
[
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
,
262144
,
524288
]
]
]
},
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
]
}
\ No newline at end of file
ByteMLPerf/byte_micro_perf/workloads/reduce_sum.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"reduce_sum"
,
"iterations"
:
100
,
"input_shape_groups"
:
{
"inputs"
:
[
[
[
1024
],
[
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
,
262144
,
524288
]
]
]
},
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
]
}
\ No newline at end of file
ByteMLPerf/byte_micro_perf/workloads/reducescatter.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"reducescatter"
,
"iterations"
:
100
,
"input_shape_groups"
:
{
"inputs"
:
[
[
[
8
,
16
,
32
,
64
,
128
,
256
,
512
,
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
,
262144
,
524288
,
1048576
,
2097152
],
[
1024
]
]
]
},
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
],
"group"
:
[
2
,
4
,
8
]
}
\ No newline at end of file
ByteMLPerf/byte_micro_perf/workloads/scatter.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"scatter"
,
"iterations"
:
100
,
"input_shape_groups"
:
{
"inputs"
:
[
[
[
1024
],
[
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
,
262144
,
524288
]
]
]
},
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
]
}
\ No newline at end of file
ByteMLPerf/byte_micro_perf/workloads/silu.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"silu"
,
"iterations"
:
100
,
"input_shape_groups"
:
{
"inputs"
:
[
[
[
4
,
8
,
16
,
32
,
64
,
128
,
256
,
512
,
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
],
[
8192
]
]
]
},
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
]
}
\ No newline at end of file
ByteMLPerf/byte_micro_perf/workloads/sin.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"sin"
,
"iterations"
:
100
,
"input_shape_groups"
:
{
"inputs"
:
[
[
[
4
,
8
,
16
,
32
,
64
,
128
,
256
,
512
,
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
],
[
8192
]
]
]
},
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
]
}
\ No newline at end of file
ByteMLPerf/byte_micro_perf/workloads/softmax.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"softmax"
,
"iterations"
:
100
,
"input_shape_groups"
:
{
"inputs"
:
[
[
[
1024
],
[
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
,
262144
,
524288
]
]
]
},
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
]
}
\ No newline at end of file
ByteMLPerf/byte_micro_perf/workloads/sort.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"sort"
,
"iterations"
:
100
,
"input_shape_groups"
:
{
"inputs"
:
[
[
[
1024
],
[
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
,
262144
,
524288
]
]
]
},
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
]
}
\ No newline at end of file
ByteMLPerf/byte_micro_perf/workloads/sqrt.json
0 → 100644
View file @
24b257f1
{
"operator"
:
"sqrt"
,
"iterations"
:
100
,
"input_shape_groups"
:
{
"inputs"
:
[
[
[
4
,
8
,
16
,
32
,
64
,
128
,
256
,
512
,
1024
,
2048
,
4096
,
8192
,
16384
,
32768
,
65536
,
131072
],
[
8192
]
]
]
},
"dtype"
:
[
"float32"
,
"bfloat16"
,
"float16"
]
}
\ No newline at end of file
Prev
1
…
10
11
12
13
14
15
16
17
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment