CLRX  1
Unofficial OpenCL extensions designed for Radeon GPUs
GPUId.h
Go to the documentation of this file.
1 /*
2  * CLRadeonExtender - Unofficial OpenCL Radeon Extensions Library
3  * Copyright (C) 2014-2017 Mateusz Szpakowski
4  *
5  * This library is free software; you can redistribute it and/or
6  * modify it under the terms of the GNU Lesser General Public
7  * License as published by the Free Software Foundation; either
8  * version 2.1 of the License, or (at your option) any later version.
9  *
10  * This library is distributed in the hope that it will be useful,
11  * but WITHOUT ANY WARRANTY; without even the implied warranty of
12  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13  * Lesser General Public License for more details.
14  *
15  * You should have received a copy of the GNU Lesser General Public
16  * License along with this library; if not, write to the Free Software
17  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
18  */
23 #ifndef __CLRX_GPUID_H__
24 #define __CLRX_GPUID_H__
25 
26 #include <CLRX/Config.h>
27 #include <CLRX/utils/Utilities.h>
28 #include <string>
29 
31 namespace CLRX
32 {
33 /*
34  * GPU identification utilities
35  */
36 
/// type of GPU device
// Enumerators are numbered sequentially starting from CAPE_VERDE = 0.
38 enum class GPUDeviceType: cxbyte
39 {
40  CAPE_VERDE = 0,
41  PITCAIRN,
42  TAHITI,
43  OLAND,
44  BONAIRE,
45  SPECTRE,
46  SPOOKY,
47  KALINDI,
48  HAINAN,
49  HAWAII,
50  ICELAND,
51  TONGA,
52  MULLINS,
53  FIJI,
54  CARRIZO,
55  DUMMY,
56  GOOSE,
57  HORSE,
58  STONEY,
59  ELLESMERE,
60  BAFFIN,
61  GFX804,
62  GFX900,
63  GFX901,
64  GPUDEVICE_MAX = GFX901, ///< equals GFX901, the last sequentially numbered enumerator
65 
// NOTE(review): listing lines 66-70 are not present in this extract; whether they
// held further enumerators or only comments cannot be told from here -- confirm.
71  RADEON_R9_290 = HAWAII ///< alias: same value as HAWAII
72 };
73 
/// GPU architecture
// NOTE(review): the declaration header (listing line 75) was missing from this
// listing and has been restored; the underlying type is assumed to match
// GPUDeviceType (cxbyte) -- confirm against the original header.
75 enum class GPUArchitecture: cxbyte
76 {
77  GCN1_0 = 0, ///< first iteration (Radeon HD7000 series)
78  GCN1_1, ///< second iteration (Radeon Rx 200 series)
79  GCN1_2, ///< third iteration (Radeon Rx 300 series and Tonga)
80  GCN1_4, ///< GFX9 architecture (AMD RX VEGA)
81  GPUARCH_MAX = GCN1_4 ///< equals GCN1_4, the last enumerator
82 };
83 
/// get GPU device type from name
85 extern GPUDeviceType getGPUDeviceTypeFromName(const char* name);
86 
/// get GPU device type name
88 extern const char* getGPUDeviceTypeName(GPUDeviceType deviceType);
89 
/// get GPU architecture from name
91 extern GPUArchitecture getGPUArchitectureFromName(const char* name);
92 
/// get GPUArchitecture from GPU device type
// Restored: this declaration (listing line 94) was dropped from the listing.
94 extern GPUArchitecture getGPUArchitectureFromDeviceType(GPUDeviceType deviceType);
95 
/// get lowest GPU device for architecture
// Restored: this declaration (listing line 97) was dropped from the listing.
97 extern GPUDeviceType getLowestGPUDeviceTypeFromArchitecture(GPUArchitecture arch);
98 
/// get GPU architecture name
100 extern const char* getGPUArchitectureName(GPUArchitecture architecture);
101 
// Register-count option bits of type Flags. The first three are single bits
// (1, 2, 4); REGCOUNT_NO_EXTRA (0xffff) has all low 16 bits set and therefore
// includes each of them.
// NOTE(review): presumably passed as the `flags` argument of
// getGPUMaxRegistersNum to exclude VCC / FLAT / XNACK registers -- confirm.
102 enum: Flags {
103  REGCOUNT_NO_VCC = 1,
104  REGCOUNT_NO_FLAT = 2,
105  REGCOUNT_NO_XNACK = 4,
106  REGCOUNT_NO_EXTRA = 0xffff
107 };
108 
// Register type selector values (cxuint): 0 - scalar, 1 - vector.
109 enum: cxuint {
110  REGTYPE_SGPR = 0, // scalar registers
111  REGTYPE_VGPR // vector registers (value 1)
112 };
113 
// Single-bit values of type Flags (1, 2, 4) that can be OR-ed together.
// NOTE(review): presumably mark which extra registers (VCC, FLAT, XNACK) are in
// use, e.g. as the `flags` argument of getGPUExtraRegsNum -- confirm.
114 enum : Flags
115 {
116  GCN_VCC = 1,
117  GCN_FLAT = 2,
118  GCN_XNACK = 4
119 };
120 
// Single-bit values of type Flags (1, 2) that can be OR-ed together.
// NOTE(review): presumably the `flags` argument of getGPUSetupMinRegistersNum
// (TGSIZE enabled / scratch enabled) -- confirm.
121 enum: Flags {
122  GPUSETUP_TGSIZE_EN = 1,
123  GPUSETUP_SCRATCH_EN = 2
124 };
125 
// Named cxuint constant with value 4.
// NOTE(review): presumably an upper bound on the number of register types, used
// to size per-register-type arrays -- confirm against callers.
126 enum: cxuint {
127  MAX_REGTYPES_NUM = 4
128 };
129 
/// get maximum available registers for GPU (type: 0 - scalar, 1 - vector)
// `flags` defaults to 0.
131 extern cxuint getGPUMaxRegistersNum(GPUArchitecture architecture, cxuint regType,
132  Flags flags = 0);
133 
/// get maximum available registers for GPU (type: 0 - scalar, 1 - vector)
// Takes a 16-bit architecture mask instead of a single GPUArchitecture.
// NOTE(review): the bit layout of archMask is not visible in this header -- confirm.
135 extern cxuint getGPUMaxRegsNumByArchMask(uint16_t archMask, cxuint regType);
136 
/// get minimal number of required registers
// The result is written through gprsOut.
// NOTE(review): presumably gprsOut is an array indexed by register type -- confirm
// the required length against the implementation.
138 extern void getGPUSetupMinRegistersNum(GPUArchitecture architecture, cxuint dimMask,
139  cxuint userDataNum, Flags flags, cxuint* gprsOut);
140 
/// get maximum local size for GPU architecture
142 extern size_t getGPUMaxLocalSize(GPUArchitecture architecture);
143 
/// get maximum GDS size for GPU architecture
145 extern size_t getGPUMaxGDSSize(GPUArchitecture architecture);
146 
/// get extra registers (like VCC,FLAT_SCRATCH)
148 extern cxuint getGPUExtraRegsNum(GPUArchitecture architecture, cxuint regType,
149  Flags flags);
150 
/// structure helper for AMDGPU architecture version
// NOTE(review): the `struct <name>` header (listing line 152) is missing from this
// listing, so the braces below are not a complete declaration on their own;
// restore the header from the original GPUId.h.
153 {
154  uint32_t major; ///< arch major number
155  uint32_t minor; ///< arch minor number
156  uint32_t stepping; ///< arch stepping number
157 };
158 
/// calculate PGMRSRC1 register value
// Returns the 32-bit register value built from the architecture, the VGPR and
// SGPR counts, priority, float mode and the four boolean mode switches.
// NOTE(review): unlike the declarations above, this one has no `extern` keyword.
160 uint32_t calculatePgmRSrc1(GPUArchitecture arch, cxuint vgprsNum, cxuint sgprsNum,
161  cxuint priority, cxuint floatMode, bool privMode, bool dx10clamp,
162  bool debugMode, bool ieeeMode);
163 
/// calculate PGMRSRC2 register value
// Returns the 32-bit register value built from the arguments.
// NOTE(review): units of ldsSize and the encoding of dimMask / defDimValues /
// exceptions are not visible in this header -- confirm against the implementation.
165 uint32_t calculatePgmRSrc2(GPUArchitecture arch, bool scratchEn, cxuint userDataNum,
166  bool trapPresent, cxuint dimMask, cxuint defDimValues, bool tgSizeEn,
167  cxuint ldsSize, cxuint exceptions);
168 
169 };
170 
171 #endif
uint32_t Flags
type for declaring various flags
Definition: Utilities.h:97
first iteration (Radeon HD7000 series)
GPUArchitecture getGPUArchitectureFromDeviceType(GPUDeviceType deviceType)
get GPUArchitecture from GPU device type
GPUArchitecture getGPUArchitectureFromName(const char *name)
get GPU architecture from name
GPUArchitecture
GPU architecture.
Definition: GPUId.h:75
GPUDeviceType getLowestGPUDeviceTypeFromArchitecture(GPUArchitecture arch)
get lowest GPU device for architecture
uint32_t major
arch major number
Definition: GPUId.h:154
Configuration header.
void getGPUSetupMinRegistersNum(GPUArchitecture architecture, cxuint dimMask, cxuint userDataNum, Flags flags, cxuint *gprsOut)
get minimal number of required registers
uint32_t calculatePgmRSrc2(GPUArchitecture arch, bool scratchEn, cxuint userDataNum, bool trapPresent, cxuint dimMask, cxuint defDimValues, bool tgSizeEn, cxuint ldsSize, cxuint exceptions)
calculate PGMRSRC2 register value
uint32_t stepping
arch stepping number
Definition: GPUId.h:156
const char * getGPUDeviceTypeName(GPUDeviceType deviceType)
get GPU device type name
size_t getGPUMaxLocalSize(GPUArchitecture architecture)
get maximum local size for GPU architecture
cxuint getGPUMaxRegistersNum(GPUArchitecture architecture, cxuint regType, Flags flags=0)
get maximum available registers for GPU (type: 0 - scalar, 1 - vector)
unsigned char cxbyte
unsigned byte
Definition: Config.h:213
uint32_t calculatePgmRSrc1(GPUArchitecture arch, cxuint vgprsNum, cxuint sgprsNum, cxuint priority, cxuint floatMode, bool privMode, bool dx10clamp, bool debugMode, bool ieeeMode)
calculate PGMRSRC1 register value
main namespace
Definition: AsmDefs.h:38
GFX9 architecture (AMD RX VEGA)
unsigned int cxuint
unsigned int
Definition: Config.h:221
structure helper for AMDGPU architecture version
Definition: GPUId.h:152
size_t getGPUMaxGDSSize(GPUArchitecture architecture)
get maximum GDS size for GPU architecture
cxuint getGPUMaxRegsNumByArchMask(uint16_t archMask, cxuint regType)
get maximum available registers for GPUs selected by architecture mask (type: 0 - scalar, 1 - vector)
GPUDeviceType
type of GPU device
Definition: GPUId.h:38
third iteration (Radeon Rx 300 series and Tonga)
utilities for other libraries and programs
const char * getGPUArchitectureName(GPUArchitecture architecture)
get GPU architecture name
GPUDeviceType getGPUDeviceTypeFromName(const char *name)
get GPU device type from name
uint32_t minor
arch minor number
Definition: GPUId.h:155
cxuint getGPUExtraRegsNum(GPUArchitecture architecture, cxuint regType, Flags flags)
get number of extra registers (like VCC, FLAT_SCRATCH)
second iteration (Radeon Rx 200 series)