1
0
Fork 0

aomp, llvm 2nd pass disable

main
Jeff Moe 2024-02-07 13:20:46 -07:00
parent 0ec8cbad4a
commit da5f1a33bc
5 changed files with 80 additions and 78 deletions

View File

@ -1,5 +1,21 @@
# Perhaps.
# Ug, mono.
sudo apt install cli-common-dev
https://github.com/ROCm/aomp
cd aomp/
git checkout rocm-6.0.2
virtualenv venv
source venv/bin/activate
pip install -U setuptools pip wheel
pip install CppHeaderParser argparse lit lxml termcolor pandas
pip install git+https://github.com/efficios/barectf
rm -rf build
exit
# Using upstream build scripts. Fails.
export AOMP_VERSION=18.0
export AOMP_REPOS=$HOME/devel/ROCm/aomp${AOMP_VERSION}
export MAKEFLAGS="-j128"
mkdir -p $AOMP_REPOS
cd $AOMP_REPOS
git clone -b aomp-18.0-1 https://github.com/ROCm-Developer-Tools/aomp
@ -7,9 +23,3 @@ $AOMP_REPOS/aomp/bin/clone_aomp.sh
$AOMP_REPOS/aomp/bin/build_prereq.sh
nohup $AOMP_REPOS/aomp/bin/build_aomp.sh &
# virtualenv venv
# source venv/bin/activate
# pip install -U setuptools pip wheel
# pip install CppHeaderParser argparse lit lxml termcolor pandas
# pip install git+https://github.com/efficios/barectf

View File

@ -23,8 +23,7 @@ There is a ROCm optimized version of HPL.
`<https://github.com/ROCm/rocHPL>`_
* It looks like it hasn't been updated for ROCm release 6.0.2 though.
The ``gfx1100`` isn't listed.
* It looks like it hasn't been updated for ROCm release 6.0.2 though. The ``gfx1100`` isn't listed.
* Depends on ``roctracer`` and ``roctx``.
* May need MPI recompiled for GPU.
* OpenMP may be needed too (if not here, elsewhere).

View File

@ -9,7 +9,7 @@ msgid ""
msgstr ""
"Project-Id-Version: tinyrocs: Direct to Chip Liquid Cooled GPU AI Cluster 0\n"
"Report-Msgid-Bugs-To: \n"
"POT-Creation-Date: 2024-02-07 11:49-0700\n"
"POT-Creation-Date: 2024-02-07 13:19-0700\n"
"PO-Revision-Date: YEAR-MO-DA HO:MI+ZONE\n"
"Last-Translator: FULL NAME <EMAIL@ADDRESS>\n"
"Language: en\n"
@ -67,136 +67,143 @@ msgid "`<https://github.com/ROCm/rocHPL>`_"
msgstr ""
#: ../../../_source/benchmarks.rst:26
msgid "It looks like it hasn't been updated for ROCm release 6.0.2 though."
msgid ""
"It looks like it hasn't been updated for ROCm release 6.0.2 though. The "
"``gfx1100`` isn't listed."
msgstr ""
#: ../../../_source/benchmarks.rst:27
msgid ""
"The ``gfx1100`` isn't listed. * Depends on ``roctracer`` and ``roctx``. * "
"May need MPI recompiled for GPU. * OpenMP may be needed too (if not here, "
"elsewhere)."
msgid "Depends on ``roctracer`` and ``roctx``."
msgstr ""
#: ../../../_source/benchmarks.rst:33
#: ../../../_source/benchmarks.rst:28
msgid "May need MPI recompiled for GPU."
msgstr ""
#: ../../../_source/benchmarks.rst:29
msgid "OpenMP may be needed too (if not here, elsewhere)."
msgstr ""
#: ../../../_source/benchmarks.rst:32
msgid "DGEMM"
msgstr ""
#: ../../../_source/benchmarks.rst:34
#: ../../../_source/benchmarks.rst:33
msgid ""
"DGEMM \"measures the floating point rate of execution of double precision "
"real matrix-matrix multiplication.\""
msgstr ""
#: ../../../_source/benchmarks.rst:37
#: ../../../_source/benchmarks.rst:36
msgid "STREAM"
msgstr ""
#: ../../../_source/benchmarks.rst:38
#: ../../../_source/benchmarks.rst:37
msgid ""
"STREAM is \"a simple synthetic benchmark program that measures sustainable "
"memory bandwidth (in GB/s) and the corresponding computation rate for simple "
"vector kernel.\""
msgstr ""
#: ../../../_source/benchmarks.rst:41
#: ../../../_source/benchmarks.rst:40
msgid "`<https://www.cs.virginia.edu/stream>`_"
msgstr ""
#: ../../../_source/benchmarks.rst:44
#: ../../../_source/benchmarks.rst:43
msgid "PTRANS"
msgstr ""
#: ../../../_source/benchmarks.rst:45
#: ../../../_source/benchmarks.rst:44
msgid ""
"PTRANS (parallel matrix transpose) \"exercises the communications where "
"pairs of processors communicate with each other simultaneously. It is a "
"useful test of the total communications capacity of the network.\""
msgstr ""
#: ../../../_source/benchmarks.rst:49
#: ../../../_source/benchmarks.rst:48
msgid "`<https://www.netlib.org/parkbench/html/matrix-kernels.html>`_"
msgstr ""
#: ../../../_source/benchmarks.rst:52
#: ../../../_source/benchmarks.rst:51
msgid "RandomAccess"
msgstr ""
#: ../../../_source/benchmarks.rst:53
#: ../../../_source/benchmarks.rst:52
msgid ""
"\"RandomAccess measures the rate of integer random updates of memory (GUPS)."
"\""
msgstr ""
#: ../../../_source/benchmarks.rst:55
#: ../../../_source/benchmarks.rst:54
msgid "`<https://hpcchallenge.org/projectsfiles/hpcc/RandomAccess.html>`_"
msgstr ""
#: ../../../_source/benchmarks.rst:58
#: ../../../_source/benchmarks.rst:57
msgid "FFT"
msgstr ""
#: ../../../_source/benchmarks.rst:59
#: ../../../_source/benchmarks.rst:58
msgid ""
"\"FFT measures the floating point rate of execution of double precision "
"complex one-dimensional Discrete Fourier Transform (DFT).\""
msgstr ""
#: ../../../_source/benchmarks.rst:62
#: ../../../_source/benchmarks.rst:61
msgid "`<http://www.ffte.jp>`_"
msgstr ""
#: ../../../_source/benchmarks.rst:65
#: ../../../_source/benchmarks.rst:64
msgid "Communication Bandwidth and Latency"
msgstr ""
#: ../../../_source/benchmarks.rst:66
#: ../../../_source/benchmarks.rst:65
msgid ""
"Communication bandwidth and latency is \"a set of tests to measure latency "
"and bandwidth of a number of simultaneous communication patterns; based on "
"b_eff (effective bandwidth benchmark).\""
msgstr ""
#: ../../../_source/benchmarks.rst:69
#: ../../../_source/benchmarks.rst:68
msgid "`<https://fs.hlrs.de/projects/par/mpi/b_eff>`_"
msgstr ""
#: ../../../_source/benchmarks.rst:72
#: ../../../_source/benchmarks.rst:71
msgid "``hpcc``"
msgstr ""
#: ../../../_source/benchmarks.rst:73
#: ../../../_source/benchmarks.rst:72
msgid "HPC Challenge benchmarks."
msgstr ""
#: ../../../_source/benchmarks.rst:75
#: ../../../_source/benchmarks.rst:74
msgid "`<https://hpcchallenge.org/hpcc>`_"
msgstr ""
#: ../../../_source/benchmarks.rst:77
#: ../../../_source/benchmarks.rst:76
msgid "The HPC Challenge benchmarks are in the Debian ``hpcc`` package."
msgstr ""
#: ../../../_source/benchmarks.rst:84
#: ../../../_source/benchmarks.rst:83
msgid "See the Output section of this documentation for benchmark results."
msgstr ""
#: ../../../_source/benchmarks.rst:88
#: ../../../_source/benchmarks.rst:87
msgid "tinygrad"
msgstr ""
#: ../../../_source/benchmarks.rst:89
#: ../../../_source/benchmarks.rst:88
msgid "Benchmarks in tinygrad."
msgstr ""
#: ../../../_source/benchmarks.rst:92
#: ../../../_source/benchmarks.rst:91
msgid "mlnotcommons"
msgstr ""
#: ../../../_source/benchmarks.rst:93
#: ../../../_source/benchmarks.rst:92
msgid "Proprietary with a few libre datasets and benchmarks available."
msgstr ""
#: ../../../_source/benchmarks.rst:95
#: ../../../_source/benchmarks.rst:94
msgid ""
"Don't let \"Commons\" in the name lead you to think this is available to the "
"mere public. Lots of proprietary bits involved, closed lists, corporate "
@ -205,28 +212,28 @@ msgid ""
"that serve the public). This isn't like Wikipedia Commons at all."
msgstr ""
#: ../../../_source/benchmarks.rst:101
#: ../../../_source/benchmarks.rst:100
msgid ""
"The upstream tinycorp is working on implementing some of their benchmarks "
"using ``tinygrad`` and AMD GPUs."
msgstr ""
#: ../../../_source/benchmarks.rst:104
#: ../../../_source/benchmarks.rst:103
msgid "`<https://mlcommons.org/datasets>`_"
msgstr ""
#: ../../../_source/benchmarks.rst:106
#: ../../../_source/benchmarks.rst:105
msgid "`<https://mlcommons.org/benchmarks>`_"
msgstr ""
#: ../../../_source/benchmarks.rst:108
#: ../../../_source/benchmarks.rst:107
msgid "`<https://github.com/mlcommons>`_"
msgstr ""
#: ../../../_source/benchmarks.rst:112
#: ../../../_source/benchmarks.rst:111
msgid "``examples/mlperf/model_spec.py``"
msgstr ""
#: ../../../_source/benchmarks.rst:113
#: ../../../_source/benchmarks.rst:112
msgid "Test run, just hitting one GPU."
msgstr ""

View File

@ -8,7 +8,7 @@ msgid ""
msgstr ""
"Project-Id-Version: tinyrocs 0\n"
"Report-Msgid-Bugs-To: \n"
"POT-Creation-Date: 2024-02-07 12:27-0700\n"
"POT-Creation-Date: 2024-02-07 13:20-0700\n"
"PO-Revision-Date: YEAR-MO-DA HO:MI+ZONE\n"
"Last-Translator: FULL NAME <EMAIL@ADDRESS>\n"
"Language: en\n"
@ -347,20 +347,3 @@ msgstr ""
#: ../../../_source/toolchain-6.0.2.rst:270
msgid "``hipBLAS`` plz."
msgstr ""
#: ../../../_source/toolchain-6.0.2.rst:277
msgid "aomp"
msgstr ""
#: ../../../_source/toolchain-6.0.2.rst:278
msgid "``aomp``."
msgstr ""
#: ../../../_source/toolchain-6.0.2.rst:285
msgid "LLVM Pass Two"
msgstr ""
#: ../../../_source/toolchain-6.0.2.rst:286
msgid ""
"XXX Skip this for now ? XXX. Needed for flang (fortran). Needed for OpenMP."
msgstr ""

View File

@ -273,19 +273,22 @@ hipBLAS
:language: bash
aomp
----
``aomp``.
.. literalinclude:: _static/toolchain/rocm-6.0.2/build-aomp.sh
:language: bash
.. aomp
.. ----
.. ``aomp``.
.. The scripts download binary RPMs to extract and other meh build
.. workarounds.
.. Build scripts not working for now due to some missing lib in binary package.
..
.. .. literalinclude:: _static/toolchain/rocm-6.0.2/build-aomp.sh
.. :language: bash
LLVM Pass Two
-------------
XXX Skip this for now ? XXX. Needed for flang (fortran).
Needed for OpenMP.
.. literalinclude:: _static/toolchain/rocm-6.0.2/build-llvm-second.sh
:language: bash
.. LLVM Pass Two
.. -------------
.. XXX Skip this for now ? XXX. Needed for flang (fortran).
.. Needed for OpenMP.
..
.. .. literalinclude:: _static/toolchain/rocm-6.0.2/build-llvm-second.sh
.. :language: bash