mirror of
https://github.com/ROCm/ROCm.git
synced 2026-01-10 23:28:03 -05:00
Compare commits
55 Commits
rocm-2.6
...
roc-2.10.0
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
65f1d2ee30 | ||
|
|
21cc30341c | ||
|
|
107bbd8abc | ||
|
|
77e77172a4 | ||
|
|
f0d15004a0 | ||
|
|
a899984e4e | ||
|
|
29576d17a3 | ||
|
|
92a74beed5 | ||
|
|
4ac14e8095 | ||
|
|
04379e089e | ||
|
|
886af2c92f | ||
|
|
afa76ba6a4 | ||
|
|
da16cd49f3 | ||
|
|
d54224f6f5 | ||
|
|
84efdd8493 | ||
|
|
8bd9a52740 | ||
|
|
fbf04f0680 | ||
|
|
33b01a9d73 | ||
|
|
6df6f25b24 | ||
|
|
06b723a026 | ||
|
|
ac085f166f | ||
|
|
269e6dde84 | ||
|
|
664d08dd66 | ||
|
|
9c038ae6cd | ||
|
|
8b11d2d51c | ||
|
|
cd14a94f45 | ||
|
|
cd0c1a7158 | ||
|
|
c135c6ca16 | ||
|
|
29398068cb | ||
|
|
36f1dc6467 | ||
|
|
215a0ca513 | ||
|
|
3af7f0c2b6 | ||
|
|
5798b691bf | ||
|
|
81ca4c3ae8 | ||
|
|
c6c9850a46 | ||
|
|
e6adf53679 | ||
|
|
e88d9b533c | ||
|
|
0a41c5df4e | ||
|
|
e5fab6d043 | ||
|
|
efbfe487e2 | ||
|
|
48f8ce93b8 | ||
|
|
9623efac90 | ||
|
|
258740b489 | ||
|
|
b178fa0666 | ||
|
|
1f0e2c2d7a | ||
|
|
ae0503cad3 | ||
|
|
725f57b531 | ||
|
|
70f9bf263e | ||
|
|
445ac506cb | ||
|
|
360fa794e1 | ||
|
|
128e3af2bd | ||
|
|
71993cf7c6 | ||
|
|
a9bb319d96 | ||
|
|
6d5e854277 | ||
|
|
b1b081fa8f |
BIN
AMD_ROCm_v2.10_Release_Notes.pdf
Normal file
BIN
AMD_ROCm_v2.10_Release_Notes.pdf
Normal file
Binary file not shown.
57
default.xml
57
default.xml
@@ -12,7 +12,7 @@
|
||||
<remote name="gpuopen-tools"
|
||||
fetch="https://github.com/GPUOpen-Tools/" />
|
||||
|
||||
<default revision="refs/tags/roc-2.6.0"
|
||||
<default revision="refs/tags/roc-2.10.0"
|
||||
remote="roc-github"
|
||||
sync-c="true"
|
||||
sync-j="4" />
|
||||
@@ -21,10 +21,11 @@
|
||||
<project name="ROCT-Thunk-Interface" />
|
||||
<project name="ROCR-Runtime" />
|
||||
<project name="ROC-smi" />
|
||||
<project name="rocm-cmake" revision="ac45c6e269d1fd1dbd5dfc81cfe47a7452c96daf" />
|
||||
<project name="rocm-cmake" />
|
||||
<project name="rocminfo" />
|
||||
<project name="rocprofiler" remote="rocm-devtools" revision="refs/tags/roc-2.6.0"/>
|
||||
<project name="roctracer" remote="rocm-devtools" revision="refs/tags/roc-2.6.0"/>
|
||||
|
||||
<project name="rocprofiler" remote="rocm-devtools" revision="refs/tags/roc-2.10.0" />
|
||||
<project name="roctracer" remote="rocm-devtools" revision="roc-2.10.x" />
|
||||
<!-- If you want to get the full OpenCL runtime, there is a separate repo
|
||||
manifest that is more authoritative than the copy in this file. It can
|
||||
be found at the following URL:
|
||||
@@ -32,44 +33,44 @@
|
||||
<remote name="KhronosGroup" fetch="https://github.com/KhronosGroup/" />
|
||||
<project name="ROCm-OpenCL-Runtime" />
|
||||
<project path="ROCm-OpenCL-Runtime/compiler/driver" name="ROCm-OpenCL-Driver"/>
|
||||
<project path="ROCm-OpenCL-Runtime/compiler/llvm" name="llvm" revision="refs/tags/roc-ocl-2.6.0" />
|
||||
<project path="ROCm-OpenCL-Runtime/compiler/llvm" name="llvm" revision="refs/tags/roc-ocl-2.10.0" />
|
||||
<project path="ROCm-OpenCL-Runtime/compiler/llvm/tools/clang" name="clang" />
|
||||
<project path="ROCm-OpenCL-Runtime/compiler/llvm/tools/lld" name="lld" revision="refs/tags/roc-ocl-2.6.0" />
|
||||
<project path="ROCm-OpenCL-Runtime/library/amdgcn" name="ROCm-Device-Libs" revision="refs/tags/roc-ocl-2.6.0" />
|
||||
<project path="ROCm-OpenCL-Runtime/api/opencl/khronos/icd" name="OpenCL-ICD-Loader" remote="KhronosGroup" revision="261c1288aadd9dcc4637aca08332f603e6c13715" />
|
||||
<project path="ROCm-OpenCL-Runtime/compiler/llvm/tools/lld" name="lld" revision="refs/tags/roc-ocl-2.10.0" />
|
||||
<project path="ROCm-OpenCL-Runtime/library/amdgcn" name="ROCm-Device-Libs" revision="refs/tags/roc-ocl-2.10.0" />
|
||||
|
||||
<project path="ROCm-OpenCL-Runtime/api/opencl/khronos/icd" name="OpenCL-ICD-Loader" remote="KhronosGroup" revision="6c03f8b58fafd9dd693eaac826749a5cfad515f8" />
|
||||
<project name="clang-ocl" />
|
||||
<!-- HCC needs to be recursively synced to get its submodules -->
|
||||
<project name="hcc" sync-s="true" revision="refs/tags/roc-hcc-2.6.0" />
|
||||
<project name="hcc" sync-s="true" revision="refs/tags/roc-hcc-2.10.0" />
|
||||
<project name="HCC-Example-Application" remote="rocm-devtools" revision="ffd6533305e79eed667badd3c4cdb7879a1281b8" />
|
||||
<project name="HIP" remote="rocm-devtools" />
|
||||
<project name="HIP" remote="rocm-devtools" revision="refs/tags/roc-2.10.0" />
|
||||
<project name="HIP-Examples" remote="rocm-devtools" />
|
||||
<!-- The following projects are all associated with the AMDGPU LLVM compiler -->
|
||||
<project name="llvm" path="llvm_amd-common" revision="refs/tags/roc-hcc-2.6.0" />
|
||||
<project name="lld" path="llvm_amd-common/lld" revision="refs/tags/roc-ocl-2.6.0" />
|
||||
<project name="llvm" path="llvm_amd-common" revision="refs/tags/roc-ocl-2.10.0" />
|
||||
<project name="lld" path="llvm_amd-common/lld" revision="refs/tags/roc-ocl-2.10.0" />
|
||||
<project name="clang" path="llvm_amd-common/clang" />
|
||||
<project name="ROCm-Device-Libs" revision="refs/tags/roc-hcc-2.6.0" />
|
||||
<project name="atmi" revision="refs/tags/rocm_2.6.0" />
|
||||
<project name="ROCm-Device-Libs" revision="refs/tags/roc-ocl-2.10.0" />
|
||||
<project name="atmi" revision="refs/tags/rocm_2.10.0" />
|
||||
<project name="ROCm-CompilerSupport" />
|
||||
<project name="rocr_debug_agent" remote="rocm-devtools" />
|
||||
<project name="rocm_bandwidth_test" />
|
||||
<project name="RCP" remote="gpuopen-tools" revision="3a49405a1500067c49d181844ec90aea606055bb" />
|
||||
|
||||
<!-- ROCm Libraries -->
|
||||
<project name="rocBLAS" remote="rocm-swplat" revision="refs/tags/rocm-2.6" />
|
||||
<project name="hipBLAS" remote="rocm-swplat" revision="refs/tags/rocm-2.6" />
|
||||
<project name="rocFFT" remote="rocm-swplat" revision="refs/tags/v0.9.4" />
|
||||
<project name="rocRAND" remote="rocm-swplat" revision="refs/tags/2.6.0" />
|
||||
<project name="rocSPARSE" remote="rocm-swplat" revision="refs/tags/rocm-2.6" />
|
||||
<project name="hipSPARSE" remote="rocm-swplat" revision="refs/tags/rocm-2.6" />
|
||||
<project name="rocALUTION" remote="rocm-swplat" revision="refs/tags/rocm-2.6" />
|
||||
<project name="MIOpenGEMM" remote="rocm-swplat" revision="9547fb9e8499a5a9f16da83b1e6b749de82dd9fb" />
|
||||
<project name="MIOpen" remote="rocm-swplat" revision="refs/tags/roc-2.6.0" />
|
||||
<project name="Thrust" remote="rocm-swplat" revision="refs/tags/2.6.0" sync-s="true" />
|
||||
<project name="rocBLAS" remote="rocm-swplat" revision="refs/tags/rocm-2.10" />
|
||||
<project name="hipBLAS" remote="rocm-swplat" revision="refs/tags/rocm-2.10" />
|
||||
<project name="rocFFT" remote="rocm-swplat" revision="refs/tags/rocm-2.10" />
|
||||
<project name="rocRAND" remote="rocm-swplat" revision="refs/tags/2.10.0" />
|
||||
<project name="rocSPARSE" remote="rocm-swplat" revision="refs/tags/rocm-2.10" />
|
||||
<project name="hipSPARSE" remote="rocm-swplat" revision="refs/tags/rocm-2.10" />
|
||||
<project name="rocALUTION" remote="rocm-swplat" revision="refs/tags/rocm-2.10" />
|
||||
<project name="MIOpenGEMM" remote="rocm-swplat" revision="6275a879995b58a6e0b8cca7b1ad8421a5e02ade" />
|
||||
<project name="MIOpen" remote="rocm-swplat" revision="refs/tags/roc-2.10.0" />
|
||||
<project name="rocm_smi_lib" />
|
||||
<project name="rccl" remote="rocm-swplat" revision="refs/tags/2.6.0" />
|
||||
<project name="MIVisionX" remote="gpuopen-libs" revision="refs/tags/1.3.0" />
|
||||
<project name="rocThrust" remote="rocm-swplat" revision="refs/tags/2.6.0" />
|
||||
<project name="hipCUB" remote="rocm-swplat" revision="refs/tags/2.6.0" />
|
||||
<project name="rccl" remote="rocm-swplat" revision="refs/tags/2.10.0" />
|
||||
<project name="MIVisionX" remote="gpuopen-libs" revision="refs/tags/1.5" />
|
||||
<project name="rocThrust" remote="rocm-swplat" revision="refs/tags/2.10.0" />
|
||||
<project name="hipCUB" remote="rocm-swplat" revision="refs/tags/2.10.0" />
|
||||
<project name="rocPRIM" remote="rocm-swplat" revision="refs/tags/2.10.0" />
|
||||
|
||||
</manifest>
|
||||
|
||||
@@ -1,7 +1,12 @@
|
||||
## ROCm Version History
|
||||
This file contains archived version history information for the [ROCm project](https://github.com/RadeonOpenCompute/ROCm)
|
||||
|
||||
### Current ROCm Version: 2.6
|
||||
### Current ROCm Version: 2.10
|
||||
- [New features and enhancements in ROCm 2.9](#new-features-and-enhancements-in-rocm-29)
|
||||
- [New features and enhancements in ROCm 2.8](#new-features-and-enhancements-in-rocm-28)
|
||||
- [New features and enhancements in ROCm 2.7.2](#new-features-and-enhancements-in-rocm-272)
|
||||
- [New features and enhancements in ROCm 2.7](#new-features-and-enhancements-in-rocm-27)
|
||||
- [New features and enhancements in ROCm 2.6](#new-features-and-enhancements-in-rocm-26)
|
||||
- [New features and enhancements in ROCm 2.5](#new-features-and-enhancements-in-rocm-25)
|
||||
- [New features and enhancements in ROCm 2.4](#new-features-and-enhancements-in-rocm-24)
|
||||
- [New features and enhancements in ROCm 2.3](#new-features-and-enhancements-in-rocm-23)
|
||||
@@ -17,6 +22,147 @@ This file contains archived version history information for the [ROCm project](h
|
||||
- [New Features as of ROCm 1.7](#new-features-as-of-rocm-17)
|
||||
- [New Features as of ROCm 1.5](#new-features-as-of-rocm-15)
|
||||
|
||||
|
||||
|
||||
|
||||
### New features and enhancements in ROCm 2.9
|
||||
|
||||
#### Initial release for Radeon Augmentation Library(RALI)
|
||||
The AMD Radeon Augmentation Library (RALI) is designed to efficiently decode and process images from a variety of storage formats and modify them through a processing graph programmable by the user. RALI currently provides a C API.
|
||||
|
||||
#### Quantization in MIGraphX v0.4
|
||||
MIGraphX 0.4 introduces support for fp16 and int8 quantization. For additional details, as well as other new MIGraphX features, see [MIGraphX documentation](https://github.com/ROCmSoftwarePlatform/AMDMIGraphX/wiki/Getting-started:-using-the-new-features-of-MIGraphX-0.4).
|
||||
|
||||
#### rocSparse csrgemm
|
||||
csrgemm enables the user to perform matrix-matrix multiplication with two sparse matrices in CSR format.
|
||||
|
||||
#### Singularity Support
|
||||
ROCm 2.9 adds support for Singularity container version 2.5.2.
|
||||
|
||||
#### Initial release of rocTX
|
||||
ROCm 2.9 introduces rocTX, which provides a C API for code markup for performance profiling. This initial release of rocTX supports annotation of code ranges and ASCII markers. For an example, see this [code](https://github.com/ROCm-Developer-Tools/roctracer/blob/amd-master/test/MatrixTranspose_test/MatrixTranspose.cpp).
|
||||
|
||||
#### Added support for Ubuntu 18.04.3
|
||||
Ubuntu 18.04.3 is now supported in ROCm 2.9.
|
||||
|
||||
|
||||
|
||||
### New features and enhancements in ROCm 2.8
|
||||
|
||||
#### Support for NCCL2.4.8 API
|
||||
Implements ncclCommAbort() and ncclCommGetAsyncError() to match the NCCL 2.4.x API
|
||||
|
||||
### New features and enhancements in ROCm 2.7.2
|
||||
|
||||
This release is a hotfix for ROCm release 2.7.
|
||||
|
||||
#### Issues fixed in ROCm 2.7.2
|
||||
|
||||
##### A defect in upgrades from older ROCm releases has been fixed.
|
||||
|
||||
##### rocprofiler --hiptrace and --hsatrace fails to load roctracer library
|
||||
In ROCm 2.7.2, the defect that caused rocprofiler --hiptrace and --hsatrace to fail to load the roctracer library has been fixed.
|
||||
To generate traces, also provide a directory path using the parameter -d <$directoryPath>, for example:
|
||||
```shell
|
||||
/opt/rocm/bin/rocprof --hsa-trace -d $PWD/traces /opt/rocm/hip/samples/0_Intro/bit_extract/bit_extract
|
||||
```
|
||||
All traces and results will be saved under $PWD/traces path
|
||||
|
||||
#### Upgrading from ROCm 2.7 to 2.7.2
|
||||
|
||||
To upgrade, please remove 2.7 completely as specified [for Ubuntu](#how-to-uninstall-from-ubuntu-1604-or-Ubuntu-1804) or [for CentOS/RHEL](#how-to-uninstall-rocm-from-centosrhel-76), and install 2.7.2 as per the [install instructions](#installing-from-amd-rocm-repositories).
|
||||
|
||||
#### Other notes
|
||||
|
||||
To use rocprofiler features, the following steps need to be completed before using rocprofiler:
|
||||
|
||||
##### Step-1: Install roctracer
|
||||
|
||||
###### Ubuntu 16.04 or Ubuntu 18.04:
|
||||
|
||||
```shell
|
||||
sudo apt install roctracer-dev
|
||||
```
|
||||
|
||||
###### CentOS/RHEL 7.6:
|
||||
|
||||
```shell
|
||||
sudo yum install roctracer-dev
|
||||
```
|
||||
##### Step-2: Add /opt/rocm/roctracer/lib to LD_LIBRARY_PATH
|
||||
|
||||
### New features and enhancements in ROCm 2.7
|
||||
|
||||
#### [rocFFT] Real FFT Functional
|
||||
Improved real/complex 1D even-length transforms of unit stride. Performance improvements of up to 4.5x are observed. Large problem sizes should see approximately 2x.
|
||||
|
||||
#### rocRand Enhancements and Optimizations
|
||||
- Added support for new datatypes: uchar, ushort, half.
|
||||
- Improved performance on "Vega 7nm" chips, such as on the Radeon Instinct MI50
|
||||
- mtgp32 uniform double performance changes due to generation algorithm standardization. Better quality random numbers are now generated, with a 30% decrease in performance
|
||||
- Up to 5% performance improvements for other algorithms
|
||||
|
||||
#### RAS
|
||||
Added support for RAS on Radeon Instinct MI50, including:
|
||||
- Memory error detection
|
||||
- Memory error detection counter
|
||||
|
||||
#### ROCm-SMI enhancements
|
||||
Added ROCm-SMI CLI and LIB support for FW version, compute running processes, utilization rates, utilization counter, link error counter, and unique ID.
|
||||
|
||||
### New features and enhancements in ROCm 2.6
|
||||
|
||||
#### ROCmInfo enhancements
|
||||
ROCmInfo was extended to do the following:
|
||||
For ROCr API call errors including initialization determine if the error could be explained by:
|
||||
- ROCk (driver) is not loaded / available
|
||||
- User does not have membership in appropriate group - "video"
|
||||
- If not above print the error string that is mapped to the returned error code
|
||||
- If no error string is available, print the error code in hex
|
||||
|
||||
#### Thrust - Functional Support on Vega20
|
||||
ROCm2.6 contains the first official release of rocThrust and hipCUB. rocThrust is a port of thrust, a parallel algorithm library. hipCUB is a port of CUB, a reusable software component library. Thrust/CUB has been ported to the HIP/ROCm platform to use the rocPRIM library. The HIP ported library works on HIP/ROCm platforms.
|
||||
|
||||
Note: The rocThrust and hipCUB libraries replace https://github.com/ROCmSoftwarePlatform/thrust (hip-thrust), i.e. hip-thrust has been separated into two libraries, rocThrust and hipCUB. Existing hip-thrust users are encouraged to port their code to rocThrust and/or hipCUB. Hip-thrust will be removed from official distribution later this year.
|
||||
|
||||
#### MIGraphX v0.3
|
||||
MIGraphX optimizer adds support to read models frozen from Tensorflow framework. Further details and an example usage at https://github.com/ROCmSoftwarePlatform/AMDMIGraphX/wiki/Getting-started:-using-the-new-features-of-MIGraphX-0.3
|
||||
|
||||
#### MIOpen 2.0
|
||||
- This release contains several new features including an immediate mode for selecting convolutions, bfloat16 support, new layers, modes, and algorithms.
|
||||
- MIOpenDriver, a tool for benchmarking and developing kernels is now shipped with MIOpen.
|
||||
BFloat16 support, now available in HIP, requires an updated rocBLAS as a GEMM backend.
|
||||
- Immediate mode API now provides the ability to quickly obtain a convolution kernel.
|
||||
- MIOpen now contains HIP source kernels and implements the ImplicitGEMM kernels. This is a new feature and is currently disabled by default. Use the environmental variable "MIOPEN_DEBUG_CONV_IMPLICIT_GEMM=1" to activate this feature. ImplicitGEMM requires an up-to-date HIP version of at least 1.5.9211.
|
||||
- A new "loss" category of layers has been added, of which CTC loss is the first. See the API reference for more details.
|
||||
2.0 is the last release of active support for gfx803 architectures. In future releases, MIOpen will not actively debug and develop new features specifically for gfx803.
|
||||
- System Find-Db in memory cache is disabled by default. Please see build instructions to enable this feature.
|
||||
Additional documentation can be found here: https://rocmsoftwareplatform.github.io/MIOpen/doc/html/
|
||||
|
||||
#### BFloat16 software support in rocBLAS/Tensile
|
||||
Added mixed precision bfloat16/IEEE f32 to gemm_ex. The input and output matrices are bfloat16. All arithmetic is in IEEE f32.
|
||||
|
||||
#### AMD Infinity Fabric™ Link enablement
|
||||
The ability to connect four Radeon Instinct MI60 or Radeon Instinct MI50 boards in two hives or two Radeon Instinct MI60 or Radeon Instinct MI50 boards in four hives via AMD Infinity Fabric™ Link GPU interconnect technology has been added.
|
||||
|
||||
#### ROCm-smi features and bug fixes
|
||||
- mGPU & Vendor check
|
||||
- Fix clock printout if DPM is disabled
|
||||
- Fix finding marketing info on CentOS
|
||||
- Clarify some error messages
|
||||
|
||||
#### ROCm-smi-lib enhancements
|
||||
- Documentation updates
|
||||
- Improvements to *name_get functions
|
||||
|
||||
#### RCCL2 Enablement
|
||||
RCCL2 supports collectives intranode communication using PCIe, Infinity Fabric™, and pinned host memory, as well as internode communication using Ethernet (TCP/IP sockets) and Infiniband/RoCE (Infiniband Verbs). Note: For Infiniband/RoCE, RDMA is not currently supported.
|
||||
|
||||
#### rocFFT enhancements
|
||||
- Added: Debian package with FFT test, benchmark, and sample programs
|
||||
- Improved: hipFFT interfaces
|
||||
- Improved: rocFFT CPU reference code, plan generation code and logging code
|
||||
|
||||
### New features and enhancements in ROCm 2.5
|
||||
|
||||
#### UCX 1.6 support
|
||||
|
||||
Reference in New Issue
Block a user