Skip to content

Commit

Permalink
Merge pull request #862 from ROCm/mi210-configs
Browse files Browse the repository at this point in the history
configs for mi210
  • Loading branch information
manoj-freyr authored Dec 12, 2024
2 parents faaaf2e + 45ae78e commit 7b47d45
Show file tree
Hide file tree
Showing 7 changed files with 1,010 additions and 0 deletions.
51 changes: 51 additions & 0 deletions rvs/conf/MI210/babel.conf
Original file line number Diff line number Diff line change
@@ -0,0 +1,51 @@
# ################################################################################
# #
# # Copyright (c) 2024 Advanced Micro Devices, Inc. All rights reserved.
# #
# # MIT LICENSE:
# # Permission is hereby granted, free of charge, to any person obtaining a copy of
# # this software and associated documentation files (the "Software"), to deal in
# # the Software without restriction, including without limitation the rights to
# # use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
# # of the Software, and to permit persons to whom the Software is furnished to do
# # so, subject to the following conditions:
# #
# # The above copyright notice and this permission notice shall be included in all
# # copies or substantial portions of the Software.
# #
# # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# # SOFTWARE.
# #
# ###############################################################################

# BABEL test
#
# Preconditions:
# Set device to all. If you need to run rvs only on a subset of GPUs, run rvs with the -g
# option, collect the GPU IDs (e.g.: GPU[ 5 - 50599] -> 50599 is the GPU ID) and then specify
# all the GPU IDs separated by white space (e.g.: device: 50599 3245)
# Set parallel execution to true or false (the action below sets it to true)
# Set buffer size to reflect the buffer you want to test
# Set run count to 1 (test will run once)
#

actions:
# One action: runs the babel module on all devices with a 256 MiB buffer.
- name: babel-256MiB
  device: all
  module: babel  # Name of the module
  parallel: true  # Parallel true or false
  count: 1  # Number of times to repeat the test from the beginning (a clean start every time)
  num_iter: 5000  # Number of iterations; this many kernels are launched simultaneously and stress the system
  array_size: 268435456  # Buffer size the test operates on; this is 256 MiB
  test_type: 1  # Type of test, 1: Float, 2: Double, 3: Triad float, 4: Triad double
  mibibytes: true  # Mebibytes (MiB) or megabytes (MB), true for MiB
  o/p_csv: false  # Output as CSV file
  subtest: 5  # 1: copy 2: copy+mul 3: copy+mul+add 4: copy+mul+add+triad 5: copy+mul+add+triad+dot
  dwords_per_lane: 4  # Number of dwords per lane
  chunks_per_block: 4  # Number of chunks per block

174 changes: 174 additions & 0 deletions rvs/conf/MI210/gpup_single.conf
Original file line number Diff line number Diff line change
@@ -0,0 +1,174 @@
# ################################################################################
# #
# # Copyright (c) 2024 Advanced Micro Devices, Inc. All rights reserved.
# #
# # MIT LICENSE:
# # Permission is hereby granted, free of charge, to any person obtaining a copy of
# # this software and associated documentation files (the "Software"), to deal in
# # the Software without restriction, including without limitation the rights to
# # use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
# # of the Software, and to permit persons to whom the Software is furnished to do
# # so, subject to the following conditions:
# #
# # The above copyright notice and this permission notice shall be included in all
# # copies or substantial portions of the Software.
# #
# # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# # SOFTWARE.
# #
# ###############################################################################

# Run test with testscript or binary:
#
# Using Testscript -
# cd /opt/rocm/share/rocm-validation-suite/testscripts
# sudo ./gpup.new.sh
#
# Using Binary -
# cd /opt/rocm/bin  (the configuration files live in /opt/rocm/share/rocm-validation-suite/conf)
# sudo ./rvs -c /opt/rocm/share/rocm-validation-suite/conf/gpup_single.conf
#
# Note: Paths may vary with the ROCm version or ROCm installation path.

# GPUP test #1
#
# Preconditions:
# all AMD compatible GPUs
# all types of devices
# all gpu properties, all io_links properties
#
# Expected result:
# Test passes with displaying all properties values for any GPUs

actions:
# TC1: request every GPU property and every io_links property on all devices.
- name: RVS-GPUP-TC1
  device: all
  module: gpup
  # The bare `all:` key (no value) selects the whole property set.
  properties:
    all:
  io_links-properties:
    all:

# GPUP test #2
#
# Preconditions:
# all AMD compatible GPUs
# all types of devices
# no regular expressions
# only a subset of gpu properties, only a subset of io_link properties
#
# Expected result:
# Test passes with displaying subsets of properties and io_link properties values for any GPUs

# TC2: request only the listed subset of GPU properties and io_links properties.
- name: RVS-GPUP-TC2
  device: all
  module: gpup
  # Each property is named by a bare key; no value is needed.
  properties:
    simd_count:
    mem_banks_count:
    io_links_count:
    vendor_id:
    location_id:
    max_engine_clk_ccompute:
  # `version_major` is listed once only: duplicate mapping keys are invalid YAML.
  io_links-properties:
    version_major:
    type:
    version_minor:
    node_from:
    node_to:
    recommended_transfer_size:
    flags:

# GPUP test #3
#
# Preconditions:
# only a subset of AMD compatible GPUs (device filtering)
# all types of devices
# all gpu properties, all io_link properties
#
# Expected result:
# Test passes with displaying all properties and io_link properties values for subset of GPUs
#
# Note:
# Testing specific device, if device numbers are changed in system it should be changed in the test

# TC3: all GPU properties and all io_links properties, intended for a subset of GPUs.
- name: RVS-GPUP-TC3
  # `all` selects every GPU; replace it with specific GPU IDs (as reported by
  # `rvs -g`) to actually exercise device filtering on this system.
  device: all
  module: gpup
  properties:
    all:
  io_links-properties:
    all:

# GPUP test #4
#
# Preconditions:
# all AMD compatible GPUs
# a given device type (deviceid filtering), this must be filled based on deviceid in sysfs/ ./rvs -g.
# Default is 0=> no filtering
# all gpu properties, all io_link properties
#
# Expected result:
# Test passes with displaying all properties and io_link properties values for all GPUs and given deviceid

# TC4: all GPU properties and all io_links properties, filtered by device type.
- name: RVS-GPUP-TC4
  device: all
  module: gpup
  # 0 means no deviceid filtering; set it to a device ID from sysfs or `rvs -g`.
  deviceid: 0
  properties:
    all:
  io_links-properties:
    all:

# GPUP test #5
#
# Preconditions:
# only a subset of AMD compatible GPUs (device filtering)
# a given device type (deviceid filtering) this must be filled based on deviceid in sysfs/ ./rvs -g
# Default is 0=> no filtering
# all gpu properties, all io_link properties
#
# Expected result:
# Test passes with displaying all properties and io_link properties values for subset of GPUs and given deviceid
#
# Note:
# Testing specific device, if device numbers are changed in system it should be changed in the test

# TC5: all GPU properties and all io_links properties, intended for a subset of
# GPUs of a given device type.
- name: RVS-GPUP-TC5
  # `all` selects every GPU; replace it with specific GPU IDs to filter by device.
  device: all
  module: gpup
  # 0 means no deviceid filtering; set it to a device ID from sysfs or `rvs -g`.
  deviceid: 0
  properties:
    all:
  io_links-properties:
    all:

# GPUP test #6
#
# Preconditions:
# only a subset of AMD compatible GPUs (device filtering)
# a given device type (deviceid filtering) this must be filled based on deviceid in sysfs/ ./rvs -g
# Default is 0=> no filtering
# only a subset of gpu properties, only a subset of io_link properties
#
# Expected result:
# Test passes with displaying subset of properties and io_link properties values for subset of GPUs and given deviceid
#
# Note:
# Testing specific device, if device numbers are changed in system it should be changed in the test

# TC6: a single GPU property and a single io_links property, intended for a
# subset of GPUs of a given device type.
- name: RVS-GPUP-TC6
  # `all` selects every GPU; replace it with specific GPU IDs to filter by device.
  device: all
  module: gpup
  # 0 means no deviceid filtering; set it to a device ID from sysfs or `rvs -g`.
  deviceid: 0
  properties:
    mem_banks_count:
  io_links-properties:
    version_major:
130 changes: 130 additions & 0 deletions rvs/conf/MI210/gst_single.conf
Original file line number Diff line number Diff line change
@@ -0,0 +1,130 @@
# ################################################################################
# #
# # Copyright (c) 2024 Advanced Micro Devices, Inc. All rights reserved.
# #
# # MIT LICENSE:
# # Permission is hereby granted, free of charge, to any person obtaining a copy of
# # this software and associated documentation files (the "Software"), to deal in
# # the Software without restriction, including without limitation the rights to
# # use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
# # of the Software, and to permit persons to whom the Software is furnished to do
# # so, subject to the following conditions:
# #
# # The above copyright notice and this permission notice shall be included in all
# # copies or substantial portions of the Software.
# #
# # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# # SOFTWARE.
# #
# ###############################################################################



# GST test
#
# Preconditions:
# Set device to all. If you need to run rvs only on a subset of GPUs, run rvs with the -g
# option, collect the GPU IDs (e.g.: GPU[ 5 - 50599] -> 50599 is the GPU ID) and then specify
# all the GPU IDs separated by white space
# Set parallel execution to false
# Set matrix_size to 8640 (the recommended value for both Vega 10 and Vega 20 cards)
# Set run count to 1 (each test will run once)
# Set copy_matrix to false (the matrices will be copied to GPUs only once)
#
# Run test with:
# cd bin
# sudo ./rvs -c conf/gst_single.conf -d 3
#
# Expected result:
# The test on each GPU passes (TRUE) if the GPU achieves 5000 gflops
# in maximum 7 seconds and then the GPU sustains the gflops
# for the rest of the test duration (total duration is 18 seconds).
# A single Gflops violation (with a 7% tolerance) is allowed.
# FALSE otherwise

actions:
# FP32 GEMM stress on all devices through hipBLASLt, square 28000 matrices,
# target_stress 41000, run sequentially (parallel: false).
- name: gpustress-41000-fp32-false
  device: all
  module: gst
  parallel: false
  count: 1
  duration: 10000
  copy_matrix: false
  target_stress: 41000
  matrix_size_a: 28000
  matrix_size_b: 28000
  matrix_size_c: 28000
  data_type: fp32_r
  # Leading dimensions match the matrix sizes above.
  lda: 28000
  ldb: 28000
  ldc: 28000
  blas_source: hipblaslt

# DGEMM stress on all devices, square 8192 matrices with trig initialisation,
# run sequentially (parallel: false).
# NOTE(review): the action name says "3000" but target_stress below is 30000;
# confirm which is intended. The name is kept as-is because it appears in logs.
- name: gpustress-3000-dgemm-false
  device: all
  module: gst
  parallel: false
  count: 1
  # hot_calls: 1000
  duration: 15000
  copy_matrix: false
  target_stress: 30000
  matrix_size_a: 8192
  matrix_size_b: 8192
  matrix_size_c: 8192
  matrix_init: trig
  ops_type: dgemm
  # Leading dimensions match the matrix sizes above.
  lda: 8192
  ldb: 8192
  ldc: 8192

# FP16 GEMM stress on all devices through hipBLASLt, square 8096 matrices,
# target_stress 150000.
- name: gst-8096-150000-fp16
  device: all
  module: gst
  log_interval: 3000
  ramp_interval: 5000
  duration: 15000
  copy_matrix: false
  target_stress: 150000
  matrix_size_a: 8096
  matrix_size_b: 8096
  matrix_size_c: 8096
  data_type: fp16_r
  # Leading dimensions match the matrix sizes above.
  lda: 8096
  ldb: 8096
  ldc: 8096
  ldd: 8096
  # A is transposed (transa: 1), B is not (transb: 0).
  transa: 1
  transb: 0
  alpha: 1
  beta: 0
  blas_source: hipblaslt

# GEMM stress on all devices through hipBLASLt, square 8192 matrices with
# random initialisation, target_stress 160000.
# NOTE(review): the action name says "1215Tflops", "4K4K8K" and "fp8", but the
# values below are target_stress 160000, 8192-sized matrices and data_type i8_r;
# the name looks carried over from another configuration. Confirm and rename if
# nothing depends on the current name.
- name: gst-1215Tflops-4K4K8K-rand-fp8
  device: all
  module: gst
  log_interval: 3000
  ramp_interval: 5000
  duration: 15000
  hot_calls: 500
  copy_matrix: false
  target_stress: 160000
  matrix_size_a: 8192
  matrix_size_b: 8192
  matrix_size_c: 8192
  matrix_init: rand
  data_type: i8_r
  # Leading dimensions match the matrix sizes above.
  lda: 8192
  ldb: 8192
  ldc: 8192
  # A is transposed (transa: 1), B is not (transb: 0).
  transa: 1
  transb: 0
  alpha: 1
  beta: 0
  blas_source: hipblaslt

Loading

0 comments on commit 7b47d45

Please sign in to comment.