1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
1001
1002
1003
1004
1005
1006
1007
1008
1009
1010
1011
1012
1013
1014
1015
1016
1017
1018
1019
1020
1021
1022
1023
1024
1025
1026
1027
1028
1029
1030
1031
1032
1033
1034
1035
1036
1037
1038
1039
1040
1041
1042
1043
1044
1045
1046
1047
1048
1049
1050
1051
1052
1053
1054
1055
1056
1057
1058
1059
1060
1061
1062
1063
1064
1065
1066
1067
1068
1069
1070
1071
1072
1073
1074
1075
1076
1077
1078
1079
1080
1081
1082
1083
1084
1085
1086
1087
1088
1089
1090
1091
1092
1093
1094
1095
1096
1097
1098
1099
1100
1101
1102
1103
1104
1105
1106
1107
1108
1109
1110
1111
1112
1113
1114
1115
1116
1117
1118
1119
1120
1121
1122
1123
1124
1125
1126
1127
1128
1129
1130
1131
1132
1133
1134
1135
1136
1137
1138
1139
1140
1141
1142
1143
1144
1145
1146
1147
1148
1149
1150
1151
1152
1153
1154
1155
1156
1157
1158
1159
1160
1161
1162
1163
1164
1165
1166
1167
1168
1169
1170
1171
1172
1173
1174
1175
1176
1177
1178
1179
1180
1181
1182
1183
1184
1185
1186
1187
1188
1189
1190
1191
1192
1193
1194
1195
1196
1197
1198
1199
1200
1201
1202
1203
1204
1205
1206
1207
1208
1209
1210
1211
1212
1213
1214
1215
1216
1217
1218
1219
1220
1221
1222
1223
1224
1225
1226
1227
1228
1229
1230
1231
1232
1233
1234
1235
1236
1237
1238
1239
1240
1241
1242
1243
1244
1245
1246
1247
1248
1249
1250
1251
1252
1253
1254
1255
1256
1257
1258
1259
1260
1261
1262
1263
1264
1265
1266
1267
1268
1269
1270
1271
1272
1273
1274
1275
1276
1277
1278
1279
1280
1281
1282
1283
1284
1285
1286
1287
1288
1289
1290
1291
1292
1293
1294
1295
1296
1297
1298
1299
1300
1301
1302
1303
1304
1305
1306
1307
1308
1309
1310
1311
1312
1313
1314
1315
1316
1317
1318
1319
1320
1321
1322
1323
1324
1325
1326
1327
1328
1329
1330
1331
1332
1333
1334
1335
1336
1337
1338
1339
1340
1341
1342
1343
1344
1345
1346
1347
1348
1349
1350
1351
1352
1353
1354
1355
1356
1357
1358
1359
1360
1361
1362
1363
1364
1365
1366
1367
1368
1369
1370
1371
1372
1373
1374
1375
1376
1377
1378
1379
1380
1381
1382
1383
1384
1385
1386
1387
1388
1389
1390
1391
1392
1393
1394
1395
1396
1397
1398
1399
1400
1401
1402
1403
1404
1405
1406
1407
1408
1409
1410
1411
1412
1413
1414
1415
1416
1417
1418
1419
1420
1421
1422
1423
1424
1425
1426
1427
1428
1429
1430
1431
1432
1433
1434
1435
1436
1437
1438
1439
1440
1441
1442
1443
1444
1445
1446
1447
1448
1449
1450
1451
1452
1453
1454
1455
1456
1457
1458
1459
1460
1461
1462
1463
1464
1465
1466
1467
1468
1469
1470
1471
1472
1473
1474
1475
1476
1477
1478
1479
1480
1481
1482
1483
1484
1485
1486
1487
1488
1489
1490
1491
1492
1493
1494
1495
1496
1497
1498
1499
1500
1501
1502
1503
1504
1505
1506
1507
1508
1509
1510
1511
1512
1513
1514
1515
1516
1517
1518
1519
1520
1521
1522
1523
1524
1525
1526
1527
1528
1529
1530
1531
1532
1533
1534
1535
1536
1537
1538
1539
1540
1541
1542
1543
1544
1545
1546
1547
1548
1549
1550
1551
1552
1553
1554
1555
1556
1557
1558
1559
1560
1561
1562
1563
1564
1565
1566
1567
1568
1569
1570
1571
1572
1573
1574
1575
1576
1577
1578
1579
1580
1581
1582
1583
1584
1585
1586
1587
1588
1589
1590
1591
1592
1593
1594
1595
1596
1597
1598
1599
1600
1601
1602
1603
1604
1605
1606
1607
1608
1609
1610
1611
1612
1613
1614
1615
1616
1617
1618
1619
1620
1621
1622
1623
1624
1625
1626
1627
1628
1629
1630
1631
1632
1633
1634
1635
1636
1637
1638
1639
1640
1641
1642
1643
1644
1645
1646
1647
1648
1649
1650
1651
1652
1653
1654
1655
1656
1657
1658
1659
1660
1661
1662
1663
1664
1665
1666
1667
1668
1669
1670
1671
1672
1673
1674
1675
1676
1677
1678
1679
1680
1681
1682
1683
1684
1685
1686
1687
1688
1689
1690
1691
1692
1693
1694
1695
1696
1697
1698
1699
1700
1701
1702
1703
1704
1705
1706
1707
1708
1709
1710
1711
1712
1713
1714
1715
1716
1717
1718
1719
1720
1721
1722
1723
1724
1725
1726
1727
1728
1729
1730
1731
1732
1733
1734
1735
1736
1737
1738
1739
1740
1741
1742
1743
1744
1745
1746
1747
1748
1749
1750
1751
1752
1753
1754
1755
1756
1757
1758
1759
1760
1761
1762
1763
1764
1765
1766
1767
1768
1769
1770
1771
1772
1773
1774
1775
1776
1777
1778
1779
1780
1781
1782
1783
1784
1785
1786
1787
1788
1789
1790
1791
1792
1793
1794
1795
1796
1797
1798
1799
1800
1801
1802
1803
1804
1805
1806
1807
1808
1809
1810
1811
1812
1813
1814
1815
1816
1817
1818
1819
1820
1821
1822
1823
1824
1825
1826
1827
1828
1829
1830
1831
1832
1833
1834
1835
1836
1837
1838
1839
1840
1841
1842
1843
1844
1845
1846
1847
1848
1849
1850
1851
1852
1853
1854
1855
1856
1857
1858
1859
1860
1861
1862
1863
1864
1865
1866
1867
1868
1869
1870
1871
1872
1873
1874
1875
1876
1877
1878
1879
1880
1881
1882
1883
1884
1885
1886
1887
1888
1889
1890
1891
1892
1893
1894
1895
1896
1897
1898
1899
1900
1901
1902
1903
1904
1905
1906
1907
1908
1909
1910
1911
1912
1913
1914
1915
1916
1917
1918
1919
1920
1921
1922
1923
1924
1925
1926
1927
1928
1929
1930
1931
1932
1933
1934
1935
1936
1937
1938
1939
1940
1941
1942
1943
1944
1945
1946
1947
1948
1949
1950
1951
1952
1953
1954
1955
1956
1957
1958
1959
1960
1961
1962
1963
1964
1965
1966
1967
1968
1969
|
////////////////////////////////////////////////////////////////////////////////
//
// Copyright (C) 2014-2020 Advanced Micro Devices Inc. All rights reserved.
//
// Permission is hereby granted, free of charge, to any person or organization
// obtaining a copy of the software and accompanying documentation covered by
// this license (the "Software") to use, reproduce, display, distribute,
// execute, and transmit the Software, and to prepare derivative works of the
// Software, and to permit third-parties to whom the Software is furnished to
// do so, all subject to the following:
//
// The copyright notices in the Software and this entire statement, including
// the above license grant, this restriction and the following disclaimer,
// must be included in all copies of the Software, in whole or in part, and
// all derivative works of the Software, unless such copies or derivative
// works are solely in the form of machine-executable object code generated by
// a source language processor.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE, TITLE AND NON-INFRINGEMENT. IN NO EVENT
// SHALL THE COPYRIGHT HOLDERS OR ANYONE DISTRIBUTING THE SOFTWARE BE LIABLE
// FOR ANY DAMAGES OR OTHER LIABILITY, WHETHER IN CONTRACT, TORT OR OTHERWISE,
// ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
// DEALINGS IN THE SOFTWARE.
//
////////////////////////////////////////////////////////////////////////////////
// HSA AMD extension.
#ifndef HSA_RUNTIME_EXT_AMD_H_
#define HSA_RUNTIME_EXT_AMD_H_
#include "hsa.h"
#include "hsa_ext_image.h"
#define HSA_AMD_INTERFACE_VERSION_MAJOR 1
#define HSA_AMD_INTERFACE_VERSION_MINOR 0
#ifdef __cplusplus
extern "C" {
#endif
/**
* @brief Enumeration constants added to ::hsa_status_t.
*
* @remark Additions to hsa_status_t
*/
enum {
/**
* The memory pool is invalid.
*/
HSA_STATUS_ERROR_INVALID_MEMORY_POOL = 40,
/**
* Agent accessed memory beyond the maximum legal address.
*/
HSA_STATUS_ERROR_MEMORY_APERTURE_VIOLATION = 41,
/**
* Agent executed an invalid shader instruction.
*/
HSA_STATUS_ERROR_ILLEGAL_INSTRUCTION = 42,
};
/**
* @brief Agent attributes.
*/
typedef enum hsa_amd_agent_info_s {
/**
* Chip identifier. The type of this attribute is uint32_t.
*/
HSA_AMD_AGENT_INFO_CHIP_ID = 0xA000,
/**
* Size of a cacheline in bytes. The type of this attribute is uint32_t.
*/
HSA_AMD_AGENT_INFO_CACHELINE_SIZE = 0xA001,
/**
* The number of compute unit available in the agent. The type of this
* attribute is uint32_t.
*/
HSA_AMD_AGENT_INFO_COMPUTE_UNIT_COUNT = 0xA002,
/**
* The maximum clock frequency of the agent in MHz. The type of this
* attribute is uint32_t.
*/
HSA_AMD_AGENT_INFO_MAX_CLOCK_FREQUENCY = 0xA003,
/**
* Internal driver node identifier. The type of this attribute is uint32_t.
*/
HSA_AMD_AGENT_INFO_DRIVER_NODE_ID = 0xA004,
/**
* Max number of watch points on memory address ranges to generate exception
* events when the watched addresses are accessed. The type of this
* attribute is uint32_t.
*/
HSA_AMD_AGENT_INFO_MAX_ADDRESS_WATCH_POINTS = 0xA005,
/**
* Agent BDF_ID, named LocationID in thunk. The type of this attribute is
* uint32_t.
*/
HSA_AMD_AGENT_INFO_BDFID = 0xA006,
/**
* Memory Interface width, the return value type is uint32_t.
* This attribute is deprecated.
*/
HSA_AMD_AGENT_INFO_MEMORY_WIDTH = 0xA007,
/**
* Max Memory Clock, the return value type is uint32_t.
*/
HSA_AMD_AGENT_INFO_MEMORY_MAX_FREQUENCY = 0xA008,
/**
* Board name of Agent - populated from MarketingName of Kfd Node
* The value is an Ascii string of 64 chars.
*/
HSA_AMD_AGENT_INFO_PRODUCT_NAME = 0xA009,
/**
* Maximum number of waves possible in a Compute Unit.
* The type of this attribute is uint32_t.
*/
HSA_AMD_AGENT_INFO_MAX_WAVES_PER_CU = 0xA00A,
/**
* Number of SIMD's per compute unit CU
* The type of this attribute is uint32_t.
*/
HSA_AMD_AGENT_INFO_NUM_SIMDS_PER_CU = 0xA00B,
/**
* Number of Shader Engines (SE) in Gpu
* The type of this attribute is uint32_t.
*/
HSA_AMD_AGENT_INFO_NUM_SHADER_ENGINES = 0xA00C,
/**
* Number of Shader Arrays Per Shader Engines in Gpu
* The type of this attribute is uint32_t.
*/
HSA_AMD_AGENT_INFO_NUM_SHADER_ARRAYS_PER_SE = 0xA00D,
/**
* Address of the HDP flush registers. Use of these registers does not conform to the HSA memory
* model and should be treated with caution.
* The type of this attribute is hsa_amd_hdp_flush_t.
*/
HSA_AMD_AGENT_INFO_HDP_FLUSH = 0xA00E,
/**
* PCIe domain for the agent. Pairs with HSA_AMD_AGENT_INFO_BDFID
* to give the full physical location of the Agent.
* The type of this attribute is uint32_t.
*/
HSA_AMD_AGENT_INFO_DOMAIN = 0xA00F,
/**
* Queries for support of cooperative queues. See ::HSA_QUEUE_TYPE_COOPERATIVE.
* The type of this attribute is bool.
*/
HSA_AMD_AGENT_INFO_COOPERATIVE_QUEUES = 0xA010,
/**
* Queries UUID of an agent. The value is an Ascii string with a maximum
* of 21 chars including NUL. The string value consists of two parts: header
* and body. The header identifies device type (GPU, CPU, DSP) while body
* encodes UUID as a 16 digit hex string
*
* Agents that do not support UUID will return the string "GPU-XX" or
* "CPU-XX" or "DSP-XX" depending upon their device type ::hsa_device_type_t
*/
HSA_AMD_AGENT_INFO_UUID = 0xA011,
/**
* Queries for the ASIC revision of an agent. The value is an integer that
* increments for each revision. This can be used by user-level software to
* change how it operates, depending on the hardware version. This allows
* selective workarounds for hardware errata.
* The type of this attribute is uint32_t.
*/
HSA_AMD_AGENT_INFO_ASIC_REVISION = 0xA012
} hsa_amd_agent_info_t;
typedef struct hsa_amd_hdp_flush_s {
uint32_t* HDP_MEM_FLUSH_CNTL;
uint32_t* HDP_REG_FLUSH_CNTL;
} hsa_amd_hdp_flush_t;
/**
* @brief Region attributes.
*/
typedef enum hsa_amd_region_info_s {
/**
* Determine if host can access the region. The type of this attribute
* is bool.
*/
HSA_AMD_REGION_INFO_HOST_ACCESSIBLE = 0xA000,
/**
* Base address of the region in flat address space.
*/
HSA_AMD_REGION_INFO_BASE = 0xA001,
/**
* Memory Interface width, the return value type is uint32_t.
* This attribute is deprecated. Use HSA_AMD_AGENT_INFO_MEMORY_WIDTH.
*/
HSA_AMD_REGION_INFO_BUS_WIDTH = 0xA002,
/**
* Max Memory Clock, the return value type is uint32_t.
* This attribute is deprecated. Use HSA_AMD_AGENT_INFO_MEMORY_MAX_FREQUENCY.
*/
HSA_AMD_REGION_INFO_MAX_CLOCK_FREQUENCY = 0xA003
} hsa_amd_region_info_t;
/**
* @brief Coherency attributes of fine grain region.
*/
typedef enum hsa_amd_coherency_type_s {
/**
* Coherent region.
*/
HSA_AMD_COHERENCY_TYPE_COHERENT = 0,
/**
* Non coherent region.
*/
HSA_AMD_COHERENCY_TYPE_NONCOHERENT = 1
} hsa_amd_coherency_type_t;
/**
* @brief Get the coherency type of the fine grain region of an agent.
*
* @param[in] agent A valid agent.
*
* @param[out] type Pointer to a memory location where the HSA runtime will
* store the coherency type of the fine grain region.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p type is NULL.
*/
hsa_status_t HSA_API hsa_amd_coherency_get_type(hsa_agent_t agent,
hsa_amd_coherency_type_t* type);
/**
* @brief Set the coherency type of the fine grain region of an agent.
* Deprecated. This is supported on KV platforms. For backward compatibility
* other platforms will spuriously succeed.
*
* @param[in] agent A valid agent.
*
* @param[in] type The coherency type to be set.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p type is invalid.
*/
hsa_status_t HSA_API hsa_amd_coherency_set_type(hsa_agent_t agent,
hsa_amd_coherency_type_t type);
/**
* @brief Structure containing profiling dispatch time information.
*
* Times are reported as ticks in the domain of the HSA system clock.
* The HSA system clock tick and frequency is obtained via hsa_system_get_info.
*/
typedef struct hsa_amd_profiling_dispatch_time_s {
/**
* Dispatch packet processing start time.
*/
uint64_t start;
/**
* Dispatch packet completion time.
*/
uint64_t end;
} hsa_amd_profiling_dispatch_time_t;
/**
* @brief Structure containing profiling async copy time information.
*
* Times are reported as ticks in the domain of the HSA system clock.
* The HSA system clock tick and frequency is obtained via hsa_system_get_info.
*/
typedef struct hsa_amd_profiling_async_copy_time_s {
/**
* Async copy processing start time.
*/
uint64_t start;
/**
* Async copy completion time.
*/
uint64_t end;
} hsa_amd_profiling_async_copy_time_t;
/**
* @brief Enable or disable profiling capability of a queue.
*
* @param[in] queue A valid queue.
*
* @param[in] enable 1 to enable profiling. 0 to disable profiling.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_INVALID_QUEUE The queue is invalid.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p queue is NULL.
*/
hsa_status_t HSA_API
hsa_amd_profiling_set_profiler_enabled(hsa_queue_t* queue, int enable);
/**
* @brief Enable or disable asynchronous memory copy profiling.
*
* @details The runtime will provide the copy processing start timestamp and
* completion timestamp of each call to hsa_amd_memory_async_copy if the
* async copy profiling is enabled prior to the call to
* hsa_amd_memory_async_copy. The completion signal object is used to
* hold the last async copy start and end timestamp. The client can retrieve
* these timestamps via call to hsa_amd_profiling_get_async_copy_time.
*
* @param[in] enable True to enable profiling. False to disable profiling.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES Failed on allocating resources
* needed to profile the asynchronous copy.
*/
hsa_status_t HSA_API
hsa_amd_profiling_async_copy_enable(bool enable);
/**
* @brief Retrieve packet processing time stamps.
*
* @param[in] agent The agent with which the signal was last used. For
* instance, if the profiled dispatch packet is dispatched onto queue Q,
* which was created on agent A, then this parameter must be A.
*
* @param[in] signal A signal used as the completion signal of the dispatch
* packet to retrieve time stamps from. This dispatch packet must have been
* issued to a queue with profiling enabled and have already completed. Also
* the signal must not have yet been used in any other packet following the
* completion of the profiled dispatch packet.
*
* @param[out] time Packet processing timestamps in the HSA system clock
* domain.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid.
*
* @retval ::HSA_STATUS_ERROR_INVALID_SIGNAL The signal is invalid.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p time is NULL.
*/
hsa_status_t HSA_API hsa_amd_profiling_get_dispatch_time(
hsa_agent_t agent, hsa_signal_t signal,
hsa_amd_profiling_dispatch_time_t* time);
/**
* @brief Retrieve asynchronous copy timestamps.
*
* @details Async copy profiling is enabled via call to
* hsa_amd_profiling_async_copy_enable.
*
* @param[in] signal A signal used as the completion signal of the call to
* hsa_amd_memory_async_copy.
*
* @param[out] time Async copy processing timestamps in the HSA system clock
* domain.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_INVALID_SIGNAL The signal is invalid.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p time is NULL.
*/
hsa_status_t HSA_API hsa_amd_profiling_get_async_copy_time(
hsa_signal_t signal, hsa_amd_profiling_async_copy_time_t* time);
/**
* @brief Computes the frequency ratio and offset between the agent clock and
* HSA system clock and converts the agent's tick to HSA system domain tick.
*
* @param[in] agent The agent used to retrieve the agent_tick. It is user's
* responsibility to make sure the tick number is from this agent, otherwise,
* the behavior is undefined.
*
* @param[in] agent_tick The tick count retrieved from the specified @p agent.
*
* @param[out] system_tick The translated HSA system domain clock counter tick.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p system_tick is NULL;
*/
hsa_status_t HSA_API
hsa_amd_profiling_convert_tick_to_system_domain(hsa_agent_t agent,
uint64_t agent_tick,
uint64_t* system_tick);
/**
* @brief Signal attribute flags.
*/
typedef enum {
/**
* Signal will only be consumed by AMD GPUs. Limits signal consumption to
* AMD GPU agents only. Ignored if @p num_consumers is not zero (all agents).
*/
HSA_AMD_SIGNAL_AMD_GPU_ONLY = 1,
/**
* Signal may be used for interprocess communication.
* IPC signals can be read, written, and waited on from any process.
* Profiling using an IPC enabled signal is only supported in a single process
* at a time. Producing profiling data in one process and consuming it in
* another process is undefined.
*/
HSA_AMD_SIGNAL_IPC = 2,
} hsa_amd_signal_attribute_t;
/**
* @brief Create a signal with specific attributes.
*
* @param[in] initial_value Initial value of the signal.
*
* @param[in] num_consumers Size of @p consumers. A value of 0 indicates that
* any agent might wait on the signal.
*
* @param[in] consumers List of agents that might consume (wait on) the
* signal. If @p num_consumers is 0, this argument is ignored; otherwise, the
* HSA runtime might use the list to optimize the handling of the signal
* object. If an agent not listed in @p consumers waits on the returned
* signal, the behavior is undefined. The memory associated with @p consumers
* can be reused or freed after the function returns.
*
* @param[in] attributes Requested signal attributes. Multiple signal attributes
* may be requested by combining them with bitwise OR. Requesting no attributes
* (@p attributes == 0) results in the same signal as would have been obtained
* via hsa_signal_create.
*
* @param[out] signal Pointer to a memory location where the HSA runtime will
* store the newly created signal handle. Must not be NULL.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to allocate
* the required resources.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p signal is NULL, @p
* num_consumers is greater than 0 but @p consumers is NULL, or @p consumers
* contains duplicates.
*/
hsa_status_t HSA_API hsa_amd_signal_create(hsa_signal_value_t initial_value, uint32_t num_consumers,
const hsa_agent_t* consumers, uint64_t attributes,
hsa_signal_t* signal);
/**
* @brief Asyncronous signal handler function type.
*
* @details Type definition of callback function to be used with
* hsa_amd_signal_async_handler. This callback is invoked if the associated
* signal and condition are met. The callback receives the value of the signal
* which satisfied the associated wait condition and a user provided value. If
* the callback returns true then the callback will be called again if the
* associated signal and condition are satisfied again. If the callback returns
* false then it will not be called again.
*
* @param[in] value Contains the value of the signal observed by
* hsa_amd_signal_async_handler which caused the signal handler to be invoked.
*
* @param[in] arg Contains the user provided value given when the signal handler
* was registered with hsa_amd_signal_async_handler
*
* @retval true resumes monitoring the signal with this handler (as if calling
* hsa_amd_signal_async_handler again with identical parameters)
*
* @retval false stops monitoring the signal with this handler (handler will
* not be called again for this signal)
*
*/
typedef bool (*hsa_amd_signal_handler)(hsa_signal_value_t value, void* arg);
/**
* @brief Register asynchronous signal handler function.
*
* @details Allows registering a callback function and user provided value with
* a signal and wait condition. The callback will be invoked if the associated
* signal and wait condition are satisfied. Callbacks will be invoked serially
* but in an arbitrary order so callbacks should be independent of each other.
* After being invoked a callback may continue to wait for its associated signal
* and condition and, possibly, be invoked again. Or the callback may stop
* waiting. If the callback returns true then it will continue waiting and may
* be called again. If false then the callback will not wait again and will not
* be called again for the associated signal and condition. It is possible to
* register the same callback multiple times with the same or different signals
* and/or conditions. Each registration of the callback will be treated entirely
* independently.
*
* @param[in] signal hsa signal to be asynchronously monitored
*
* @param[in] cond condition value to monitor for
*
* @param[in] value signal value used in condition expression
*
* @param[in] handler asynchronous signal handler invoked when signal's
* condition is met
*
* @param[in] arg user provided value which is provided to handler when handler
* is invoked
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_INVALID_SIGNAL signal is not a valid hsa_signal_t
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT handler is invalid (NULL)
*
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime is out of
* resources or blocking signals are not supported by the HSA driver component.
*
*/
hsa_status_t HSA_API
hsa_amd_signal_async_handler(hsa_signal_t signal,
hsa_signal_condition_t cond,
hsa_signal_value_t value,
hsa_amd_signal_handler handler, void* arg);
/**
* @brief Call a function asynchronously
*
* @details Provides access to the runtime's asynchronous event handling thread
* for general asynchronous functions. Functions queued this way are executed
* in the same manner as if they were a signal handler who's signal is
* satisfied.
*
* @param[in] callback asynchronous function to be invoked
*
* @param[in] arg user provided value which is provided to handler when handler
* is invoked
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT handler is invalid (NULL)
*
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime is out of
* resources or blocking signals are not supported by the HSA driver component.
*
*/
hsa_status_t HSA_API
hsa_amd_async_function(void (*callback)(void* arg), void* arg);
/**
* @brief Wait for any signal-condition pair to be satisfied.
*
* @details Allows waiting for any of several signal and conditions pairs to be
* satisfied. The function returns the index into the list of signals of the
* first satisfying signal-condition pair. The value of the satisfying signal's
* value is returned in satisfying_value unless satisfying_value is NULL. This
* function provides only relaxed memory semantics.
*/
uint32_t HSA_API
hsa_amd_signal_wait_any(uint32_t signal_count, hsa_signal_t* signals,
hsa_signal_condition_t* conds,
hsa_signal_value_t* values, uint64_t timeout_hint,
hsa_wait_state_t wait_hint,
hsa_signal_value_t* satisfying_value);
/**
* @brief Query image limits.
*
* @param[in] agent A valid agent.
*
* @param[in] attribute HSA image info attribute to query.
*
* @param[out] value Pointer to an application-allocated buffer where to store
* the value of the attribute. If the buffer passed by the application is not
* large enough to hold the value of @p attribute, the behavior is undefined.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_INVALID_QUEUE @p value is NULL or @p attribute <
* HSA_EXT_AGENT_INFO_IMAGE_1D_MAX_ELEMENTS or @p attribute >
* HSA_EXT_AGENT_INFO_IMAGE_ARRAY_MAX_LAYERS.
*
*/
hsa_status_t HSA_API hsa_amd_image_get_info_max_dim(hsa_agent_t agent,
hsa_agent_info_t attribute,
void* value);
/**
* @brief Set a CU affinity to specific queues within the process, this function
* call is "atomic".
*
* @param[in] queue A pointer to HSA queue.
*
* @param[in] num_cu_mask_count Size of CUMask bit array passed in.
*
* @param[in] cu_mask Bit-vector representing the CU mask.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_INVALID_QUEUE @p queue is NULL or invalid.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p num_cu_mask_count is not
* multiple of 32 or @p cu_mask is NULL.
*
* @retval ::HSA_STATUS_ERROR failed to call thunk api
*
*/
hsa_status_t HSA_API hsa_amd_queue_cu_set_mask(const hsa_queue_t* queue,
uint32_t num_cu_mask_count,
const uint32_t* cu_mask);
/**
* @brief Memory segments associated with a memory pool.
*/
typedef enum {
/**
* Global segment. Used to hold data that is shared by all agents.
*/
HSA_AMD_SEGMENT_GLOBAL = 0,
/**
* Read-only segment. Used to hold data that remains constant during the
* execution of a kernel.
*/
HSA_AMD_SEGMENT_READONLY = 1,
/**
* Private segment. Used to hold data that is local to a single work-item.
*/
HSA_AMD_SEGMENT_PRIVATE = 2,
/**
* Group segment. Used to hold data that is shared by the work-items of a
* work-group.
*/
HSA_AMD_SEGMENT_GROUP = 3,
} hsa_amd_segment_t;
/**
* @brief A memory pool encapsulates physical storage on an agent
* along with a memory access model.
*
* @details A memory pool encapsulates a physical partition of an agent's
* memory system along with a memory access model. Division of a single
* memory system into separate pools allows querying each partition's access
* path properties (see ::hsa_amd_agent_memory_pool_get_info). Allocations
* from a pool are preferentially bound to that pool's physical partition.
* Binding to the pool's preferential physical partition may not be
* possible or persistent depending on the system's memory policy
* and/or state which is beyond the scope of HSA APIs.
*
* For example, a multi-node NUMA memory system may be represented by multiple
* pool's with each pool providing size and access path information for the
* partition it represents. Allocations from a pool are preferentially bound
* to the pool's partition (which in this example is a NUMA node) while
* following its memory access model. The actual placement may vary or migrate
* due to the system's NUMA policy and state, which is beyond the scope of
* HSA APIs.
*/
typedef struct hsa_amd_memory_pool_s {
/**
* Opaque handle.
*/
uint64_t handle;
} hsa_amd_memory_pool_t;
typedef enum hsa_amd_memory_pool_global_flag_s {
/**
* The application can use allocations in the memory pool to store kernel
* arguments, and provide the values for the kernarg segment of
* a kernel dispatch.
*/
HSA_AMD_MEMORY_POOL_GLOBAL_FLAG_KERNARG_INIT = 1,
/**
* Updates to memory in this pool conform to HSA memory consistency model.
* If this flag is set, then ::HSA_AMD_MEMORY_POOL_GLOBAL_FLAG_COARSE_GRAINED
* must not be set.
*/
HSA_AMD_MEMORY_POOL_GLOBAL_FLAG_FINE_GRAINED = 2,
/**
* Writes to memory in this pool can be performed by a single agent at a time.
*/
HSA_AMD_MEMORY_POOL_GLOBAL_FLAG_COARSE_GRAINED = 4
} hsa_amd_memory_pool_global_flag_t;
/**
* @brief Memory pool features.
*/
typedef enum {
/**
* Segment where the memory pool resides. The type of this attribute is
* ::hsa_amd_segment_t.
*/
HSA_AMD_MEMORY_POOL_INFO_SEGMENT = 0,
/**
* Flag mask. The value of this attribute is undefined if the value of
* ::HSA_AMD_MEMORY_POOL_INFO_SEGMENT is not ::HSA_AMD_SEGMENT_GLOBAL. The type
* of
* this attribute is uint32_t, a bit-field of
* ::hsa_amd_memory_pool_global_flag_t
* values.
*/
HSA_AMD_MEMORY_POOL_INFO_GLOBAL_FLAGS = 1,
/**
* Size of this pool, in bytes. The type of this attribute is size_t.
*/
HSA_AMD_MEMORY_POOL_INFO_SIZE = 2,
/**
* Indicates whether memory in this pool can be allocated using
* ::hsa_amd_memory_pool_allocate. The type of this attribute is bool.
*
* The value of this flag is always false for memory pools in the group and
* private segments.
*/
HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_ALLOWED = 5,
/**
* Allocation granularity of buffers allocated by
* ::hsa_amd_memory_pool_allocate
* in this memory pool. The size of a buffer allocated in this pool is a
* multiple of the value of this attribute. The value of this attribute is
* only defined if ::HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_ALLOWED is true for
* this pool. The type of this attribute is size_t.
*/
HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_GRANULE = 6,
/**
* Alignment of buffers allocated by ::hsa_amd_memory_pool_allocate in this
* pool. The value of this attribute is only defined if
* ::HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_ALLOWED is true for this pool, and
* must be a power of 2. The type of this attribute is size_t.
*/
HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_ALIGNMENT = 7,
/**
* This memory_pool can be made directly accessible by all the agents in the
* system (::hsa_amd_agent_memory_pool_get_info does not return
* ::HSA_AMD_MEMORY_POOL_ACCESS_NEVER_ALLOWED for any agent). The type of this
* attribute is bool.
*/
HSA_AMD_MEMORY_POOL_INFO_ACCESSIBLE_BY_ALL = 15,
/**
* Maximum aggregate allocation size in bytes. The type of this attribute
* is size_t.
*/
HSA_AMD_MEMORY_POOL_INFO_ALLOC_MAX_SIZE = 16,
} hsa_amd_memory_pool_info_t;
/**
* @brief Get the current value of an attribute of a memory pool.
*
* @param[in] memory_pool A valid memory pool.
*
* @param[in] attribute Attribute to query.
*
* @param[out] value Pointer to a application-allocated buffer where to store
* the value of the attribute. If the buffer passed by the application is not
* large enough to hold the value of @p attribute, the behavior is undefined.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
*/
hsa_status_t HSA_API
hsa_amd_memory_pool_get_info(hsa_amd_memory_pool_t memory_pool,
hsa_amd_memory_pool_info_t attribute,
void* value);
/**
* @brief Iterate over the memory pools associated with a given agent, and
* invoke an application-defined callback on every iteration.
*
* @details An agent can directly access buffers located in some memory pool, or
* be enabled to access them by the application (see ::hsa_amd_agents_allow_access),
* yet that memory pool may not be returned by this function for that given
* agent.
*
* A memory pool of fine-grained type must be associated only with the host.
*
* @param[in] agent A valid agent.
*
* @param[in] callback Callback to be invoked on the same thread that called
* ::hsa_amd_agent_iterate_memory_pools, serially, once per memory pool that is
* associated with the agent. The HSA runtime passes two arguments to the
* callback: the memory pool, and the application data. If @p callback
* returns a status other than ::HSA_STATUS_SUCCESS for a particular iteration,
* the traversal stops and ::hsa_amd_agent_iterate_memory_pools returns that status
* value.
*
* @param[in] data Application data that is passed to @p callback on every
* iteration. May be NULL.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p callback is NULL.
*/
hsa_status_t HSA_API hsa_amd_agent_iterate_memory_pools(
hsa_agent_t agent,
hsa_status_t (*callback)(hsa_amd_memory_pool_t memory_pool, void* data),
void* data);
/**
* @brief Allocate a block of memory (or buffer) in the specified pool.
*
* @param[in] memory_pool Memory pool where to allocate memory from. The memory
* pool must have the ::HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_ALLOWED flag set.
*
* @param[in] size Allocation size, in bytes. Must not be zero. This value is
* rounded up to the nearest multiple of
* ::HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_GRANULE in @p memory_pool.
*
* @param[in] flags A bit-field that is used to specify allocation
* directives. Reserved parameter, must be 0.
*
* @param[out] ptr Pointer to the location where to store the base virtual
* address of
* the allocated block. The returned base address is aligned to the value of
* ::HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_ALIGNMENT in @p memory_pool. If the
* allocation fails, the returned value is undefined.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES No memory is available.
*
* @retval ::HSA_STATUS_ERROR_INVALID_MEMORY_POOL The memory pool is invalid.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ALLOCATION The host is not allowed to
* allocate memory in @p memory_pool, or @p size is greater than
* the value of HSA_AMD_MEMORY_POOL_INFO_ALLOC_MAX_SIZE in @p memory_pool.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p ptr is NULL, or @p size is 0,
* or flags is not 0.
*
*/
hsa_status_t HSA_API
hsa_amd_memory_pool_allocate(hsa_amd_memory_pool_t memory_pool, size_t size,
uint32_t flags, void** ptr);
/**
* @brief Deallocate a block of memory previously allocated using
* ::hsa_amd_memory_pool_allocate.
*
* @param[in] ptr Pointer to a memory block. If @p ptr does not match a value
* previously returned by ::hsa_amd_memory_pool_allocate, the behavior is undefined.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
*/
hsa_status_t HSA_API hsa_amd_memory_pool_free(void* ptr);
/**
* @brief Asynchronously copy a block of memory from the location pointed to by
* @p src on the @p src_agent to the memory block pointed to by @p dst on the @p
* dst_agent.
* Because the DMA engines used may not be in the same coherency domain, the caller must ensure
* that buffers are system-level coherent. In general this requires the sending device to have
* released the buffer to system scope prior to executing the copy API and the receiving device
* must execute a system scope acquire fence prior to use of the destination buffer.
*
* @param[out] dst Buffer where the content is to be copied.
*
* @param[in] dst_agent Agent associated with the @p dst. The agent must be able to directly
* access both the source and destination buffers in their current locations.
*
* @param[in] src A valid pointer to the source of data to be copied. The source
* buffer must not overlap with the destination buffer, otherwise the copy will succeed
* but contents of @p dst is undefined.
*
* @param[in] src_agent Agent associated with the @p src. The agent must be able to directly
* access both the source and destination buffers in their current locations.
*
* @param[in] size Number of bytes to copy. If @p size is 0, no copy is
* performed and the function returns success. Copying a number of bytes larger
* than the size of the buffers pointed by @p dst or @p src results in undefined
* behavior.
*
* @param[in] num_dep_signals Number of dependent signals. Can be 0.
*
* @param[in] dep_signals List of signals that must be waited on before the copy
* operation starts. The copy will start after every signal has been observed with
* the value 0. The dependent signal should not include completion signal from hsa_amd_memory_async_copy
* operation to be issued in future as that can result in a deadlock. If @p num_dep_signals is 0, this
* argument is ignored.
*
* @param[in] completion_signal Signal used to indicate completion of the copy
* operation. When the copy operation is finished, the value of the signal is
* decremented. The runtime indicates that an error has occurred during the copy
* operation by setting the value of the completion signal to a negative
* number. The signal handle must not be 0.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. The
* application is responsible for checking for asynchronous error conditions
* (see the description of @p completion_signal).
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid.
*
* @retval ::HSA_STATUS_ERROR_INVALID_SIGNAL @p completion_signal is invalid.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT The source or destination
* pointers are NULL, or the completion signal is 0.
*/
hsa_status_t HSA_API
hsa_amd_memory_async_copy(void* dst, hsa_agent_t dst_agent, const void* src,
hsa_agent_t src_agent, size_t size,
uint32_t num_dep_signals,
const hsa_signal_t* dep_signals,
hsa_signal_t completion_signal);
/*
[Provisional API]
Pitched memory descriptor.
All elements must be 4 byte aligned. Pitch and slice are in bytes.
*/
typedef struct hsa_pitched_ptr_s {
void* base;
size_t pitch;
size_t slice;
} hsa_pitched_ptr_t;
/*
[Provisional API]
Copy direction flag.
*/
typedef enum {
hsaHostToHost = 0,
hsaHostToDevice = 1,
hsaDeviceToHost = 2,
hsaDeviceToDevice = 3
} hsa_amd_copy_direction_t;
/*
[Provisional API]
SDMA 3D memory copy API. The same requirements must be met by src and dst as in
hsa_amd_memory_async_copy.
Both src and dst must be directly accessible to the copy_agent during the copy, src and dst rects
must not overlap.
CPU agents are not supported. API requires SDMA and will return an error if SDMA is not available.
Offsets and range carry x in bytes, y and z in rows and layers.
*/
hsa_status_t HSA_API hsa_amd_memory_async_copy_rect(
const hsa_pitched_ptr_t* dst, const hsa_dim3_t* dst_offset, const hsa_pitched_ptr_t* src,
const hsa_dim3_t* src_offset, const hsa_dim3_t* range, hsa_agent_t copy_agent,
hsa_amd_copy_direction_t dir, uint32_t num_dep_signals, const hsa_signal_t* dep_signals,
hsa_signal_t completion_signal);
/**
* @brief Type of accesses to a memory pool from a given agent.
*/
typedef enum {
/**
* The agent cannot directly access any buffer in the memory pool.
*/
HSA_AMD_MEMORY_POOL_ACCESS_NEVER_ALLOWED = 0,
/**
* The agent can directly access a buffer located in the pool; the application
* does not need to invoke ::hsa_amd_agents_allow_access.
*/
HSA_AMD_MEMORY_POOL_ACCESS_ALLOWED_BY_DEFAULT = 1,
/**
* The agent can directly access a buffer located in the pool, but only if the
* application has previously requested access to that buffer using
* ::hsa_amd_agents_allow_access.
*/
HSA_AMD_MEMORY_POOL_ACCESS_DISALLOWED_BY_DEFAULT = 2
} hsa_amd_memory_pool_access_t;
/**
* @brief Properties of the relationship between an agent a memory pool.
*/
typedef enum {
/**
* Hyper-transport bus type.
*/
HSA_AMD_LINK_INFO_TYPE_HYPERTRANSPORT = 0,
/**
* QPI bus type.
*/
HSA_AMD_LINK_INFO_TYPE_QPI = 1,
/**
* PCIe bus type.
*/
HSA_AMD_LINK_INFO_TYPE_PCIE = 2,
/**
* Infiniband bus type.
*/
HSA_AMD_LINK_INFO_TYPE_INFINBAND = 3,
/**
* xGMI link type.
*/
HSA_AMD_LINK_INFO_TYPE_XGMI = 4
} hsa_amd_link_info_type_t;
/**
* @brief Link properties when accessing the memory pool from the specified
* agent.
*/
typedef struct hsa_amd_memory_pool_link_info_s {
/**
* Minimum transfer latency (rounded to ns).
*/
uint32_t min_latency;
/**
* Maximum transfer latency (rounded to ns).
*/
uint32_t max_latency;
/**
* Minimum link interface bandwidth in MB/s.
*/
uint32_t min_bandwidth;
/**
* Maximum link interface bandwidth in MB/s.
*/
uint32_t max_bandwidth;
/**
* Support for 32-bit atomic transactions.
*/
bool atomic_support_32bit;
/**
* Support for 64-bit atomic transactions.
*/
bool atomic_support_64bit;
/**
* Support for cache coherent transactions.
*/
bool coherent_support;
/**
* The type of bus/link.
*/
hsa_amd_link_info_type_t link_type;
/**
* NUMA distance of memory pool relative to querying agent
*/
uint32_t numa_distance;
} hsa_amd_memory_pool_link_info_t;
/**
* @brief Properties of the relationship between an agent a memory pool.
*/
typedef enum {
/**
* Access to buffers located in the memory pool. The type of this attribute
* is ::hsa_amd_memory_pool_access_t.
*
* An agent can always directly access buffers currently located in a memory
* pool that is associated (the memory_pool is one of the values returned by
* ::hsa_amd_agent_iterate_memory_pools on the agent) with that agent. If the
* buffer is currently located in a memory pool that is not associated with
* the agent, and the value returned by this function for the given
* combination of agent and memory pool is not
* HSA_AMD_MEMORY_POOL_ACCESS_NEVER_ALLOWED, the application still needs to invoke
* ::hsa_amd_agents_allow_access in order to gain direct access to the buffer.
*
* If the given agent can directly access buffers the pool, the result is not
* HSA_AMD_MEMORY_POOL_ACCESS_NEVER_ALLOWED. If the memory pool is associated with
* the agent, or it is of fined-grained type, the result must not be
* HSA_AMD_MEMORY_POOL_ACCESS_NEVER_ALLOWED. If the memory pool is not associated
* with the agent, and does not reside in the global segment, the result must
* be HSA_AMD_MEMORY_POOL_ACCESS_NEVER_ALLOWED.
*/
HSA_AMD_AGENT_MEMORY_POOL_INFO_ACCESS = 0,
/**
* Number of links to hop when accessing the memory pool from the specified
* agent. The value of this attribute is zero if the memory pool is associated
* with the agent, or if the access type is
* HSA_AMD_MEMORY_POOL_ACCESS_NEVER_ALLOWED. The type of this attribute is
* uint32_t.
*/
HSA_AMD_AGENT_MEMORY_POOL_INFO_NUM_LINK_HOPS = 1,
/**
* Details of each link hop when accessing the memory pool starting from the
* specified agent. The type of this attribute is an array size of
* HSA_AMD_AGENT_MEMORY_POOL_INFO_NUM_LINK_HOPS with each element containing
* ::hsa_amd_memory_pool_link_info_t.
*/
HSA_AMD_AGENT_MEMORY_POOL_INFO_LINK_INFO = 2
} hsa_amd_agent_memory_pool_info_t;
/**
* @brief Get the current value of an attribute of the relationship between an
* agent and a memory pool.
*
* @param[in] agent Agent.
*
* @param[in] memory_pool Memory pool.
*
* @param[in] attribute Attribute to query.
*
* @param[out] value Pointer to a application-allocated buffer where to store
* the value of the attribute. If the buffer passed by the application is not
* large enough to hold the value of @p attribute, the behavior is undefined.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
*/
hsa_status_t HSA_API hsa_amd_agent_memory_pool_get_info(
hsa_agent_t agent, hsa_amd_memory_pool_t memory_pool,
hsa_amd_agent_memory_pool_info_t attribute, void* value);
/**
* @brief Enable direct access to a buffer from a given set of agents.
*
* @details
*
* Upon return, only the listed agents and the agent associated with the
* buffer's memory pool have direct access to the @p ptr.
*
* Any agent that has access to the buffer before and after the call to
* ::hsa_amd_agents_allow_access will also have access while
* ::hsa_amd_agents_allow_access is in progress.
*
* The caller is responsible for ensuring that each agent in the list
* must be able to access the memory pool containing @p ptr
* (using ::hsa_amd_agent_memory_pool_get_info with ::HSA_AMD_AGENT_MEMORY_POOL_INFO_ACCESS attribute),
* otherwise error code is returned.
*
* @param[in] num_agents Size of @p agents.
*
* @param[in] agents List of agents. If @p num_agents is 0, this argument is
* ignored.
*
* @param[in] flags A list of bit-field that is used to specify access
* information in a per-agent basis. This is currently reserved and must be NULL.
*
* @param[in] ptr A buffer previously allocated using ::hsa_amd_memory_pool_allocate.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p num_agents is 0, or @p agents
* is NULL, @p flags is not NULL, or attempting to enable access to agent(s)
* because @p ptr is allocated from an inaccessible pool.
*
*/
hsa_status_t HSA_API
hsa_amd_agents_allow_access(uint32_t num_agents, const hsa_agent_t* agents,
const uint32_t* flags, const void* ptr);
/**
* @brief Query if buffers currently located in some memory pool can be
* relocated to a destination memory pool.
*
* @details If the returned value is non-zero, a migration of a buffer to @p
* dst_memory_pool using ::hsa_amd_memory_migrate may nevertheless fail due to
* resource limitations.
*
* @param[in] src_memory_pool Source memory pool.
*
* @param[in] dst_memory_pool Destination memory pool.
*
* @param[out] result Pointer to a memory location where the result of the query
* is stored. Must not be NULL. If buffers currently located in @p
* src_memory_pool can be relocated to @p dst_memory_pool, the result is
* true.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_INVALID_MEMORY_POOL One of the memory pools is
* invalid.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p result is NULL.
*/
hsa_status_t HSA_API
hsa_amd_memory_pool_can_migrate(hsa_amd_memory_pool_t src_memory_pool,
hsa_amd_memory_pool_t dst_memory_pool,
bool* result);
/**
* @brief Relocate a buffer to a new memory pool.
*
* @details When a buffer is migrated, its virtual address remains the same but
* its physical contents are moved to the indicated memory pool.
*
* After migration, only the agent associated with the destination pool will have access.
*
* The caller is also responsible for ensuring that the allocation in the
* source memory pool where the buffer is currently located can be migrated to the
* specified destination memory pool (using ::hsa_amd_memory_pool_can_migrate returns a value of true
* for the source and destination memory pools), otherwise behavior is undefined.
*
* The caller must ensure that the buffer is not accessed while it is migrated.
*
* @param[in] ptr Buffer to be relocated. The buffer must have been released to system
* prior to call this API. The buffer will be released to system upon completion.
*
* @param[in] memory_pool Memory pool where to place the buffer.
*
* @param[in] flags A bit-field that is used to specify migration
* information. Must be zero.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_INVALID_MEMORY_POOL The destination memory pool is
* invalid.
*
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES There is a failure in
* allocating the necessary resources.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p flags is not 0.
*/
hsa_status_t HSA_API hsa_amd_memory_migrate(const void* ptr,
hsa_amd_memory_pool_t memory_pool,
uint32_t flags);
/**
*
* @brief Pin a host pointer allocated by C/C++ or OS allocator (i.e. ordinary system DRAM) and
* return a new pointer accessible by the @p agents. If the @p host_ptr overlaps with previously
* locked memory, then the overlap area is kept locked (i.e multiple mappings are permitted). In
* this case, the same input @p host_ptr may give different locked @p agent_ptr and when it does,
* they are not necessarily coherent (i.e. accessing either @p agent_ptr is not equivalent).
* Accesses to @p agent_ptr are coarse grained.
*
* @param[in] host_ptr A buffer allocated by C/C++ or OS allocator.
*
* @param[in] size The size to be locked.
*
* @param[in] agents Array of agent handle to gain access to the @p host_ptr.
* If this parameter is NULL and the @p num_agent is 0, all agents
* in the platform will gain access to the @p host_ptr.
*
* @param[out] agent_ptr Pointer to the location where to store the new address.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES There is a failure in
* allocating the necessary resources.
*
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT One or more agent in @p agents is
* invalid.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p size is 0 or @p host_ptr or
* @p agent_ptr is NULL or @p agents not NULL but @p num_agent is 0 or @p agents
* is NULL but @p num_agent is not 0.
*/
hsa_status_t HSA_API hsa_amd_memory_lock(void* host_ptr, size_t size,
hsa_agent_t* agents, int num_agent,
void** agent_ptr);
/**
*
* @brief Pin a host pointer allocated by C/C++ or OS allocator (i.e. ordinary system DRAM) and
* return a new pointer accessible by the @p agents. If the @p host_ptr overlaps with previously
* locked memory, then the overlap area is kept locked (i.e. multiple mappings are permitted).
* In this case, the same input @p host_ptr may give different locked @p agent_ptr and when it
* does, they are not necessarily coherent (i.e. accessing either @p agent_ptr is not equivalent).
* Acesses to the memory via @p agent_ptr have the same access properties as memory allocated from
* @p pool as determined by ::hsa_amd_memory_pool_get_info and ::hsa_amd_agent_memory_pool_get_info
* (ex. coarse/fine grain, platform atomic support, link info). Physical composition and placement
* of the memory (ex. page size, NUMA binding) is not changed.
*
* @param[in] host_ptr A buffer allocated by C/C++ or OS allocator.
*
* @param[in] size The size to be locked.
*
* @param[in] agents Array of agent handle to gain access to the @p host_ptr.
* If this parameter is NULL and the @p num_agent is 0, all agents
* in the platform will gain access to the @p host_ptr.
*
* @param[in] pool Global memory pool owned by a CPU agent.
*
* @param[in] flags A bit-field that is used to specify allocation
* directives. Reserved parameter, must be 0.
*
* @param[out] agent_ptr Pointer to the location where to store the new address.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES There is a failure in
* allocating the necessary resources.
*
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT One or more agent in @p agents is
* invalid or can not access @p pool.
*
* @retval ::HSA_STATUS_ERROR_INVALID_MEMORY_POOL @p pool is invalid or not owned
* by a CPU agent.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p size is 0 or @p host_ptr or
* @p agent_ptr is NULL or @p agents not NULL but @p num_agent is 0 or @p agents
* is NULL but @p num_agent is not 0 or flags is not 0.
*/
hsa_status_t HSA_API hsa_amd_memory_lock_to_pool(void* host_ptr, size_t size, hsa_agent_t* agents,
int num_agent, hsa_amd_memory_pool_t pool,
uint32_t flags, void** agent_ptr);
/**
*
* @brief Unpin the host pointer previously pinned via ::hsa_amd_memory_lock or
* ::hsa_amd_memory_lock_to_pool.
*
* @details The behavior is undefined if the host pointer being unpinned does not
* match previous pinned address or if the host pointer was already deallocated.
*
* @param[in] host_ptr A buffer allocated by C/C++ or OS allocator that was
* pinned previously via ::hsa_amd_memory_lock or ::hsa_amd_memory_lock_to_pool.
*
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*/
hsa_status_t HSA_API hsa_amd_memory_unlock(void* host_ptr);
/**
* @brief Sets the first @p count of uint32_t of the block of memory pointed by
* @p ptr to the specified @p value.
*
* @param[in] ptr Pointer to the block of memory to fill.
*
* @param[in] value Value to be set.
*
* @param[in] count Number of uint32_t element to be set to the value.
*
* @retval HSA_STATUS_SUCCESS The function has been executed successfully.
*
* @retval HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval HSA_STATUS_ERROR_INVALID_ARGUMENT @p ptr is NULL or
* not 4 bytes aligned
*
* @retval HSA_STATUS_ERROR_INVALID_ALLOCATION if the given memory
* region was not allocated with HSA runtime APIs.
*
*/
hsa_status_t HSA_API
hsa_amd_memory_fill(void* ptr, uint32_t value, size_t count);
/**
* @brief Maps an interop object into the HSA flat address space and establishes
* memory residency. The metadata pointer is valid during the lifetime of the
* map (until hsa_amd_interop_unmap_buffer is called).
* Multiple calls to hsa_amd_interop_map_buffer with the same interop_handle
* result in multiple mappings with potentially different addresses and
* different metadata pointers. Concurrent operations on these addresses are
* not coherent. Memory must be fenced to system scope to ensure consistency,
* between mappings and with any views of this buffer in the originating
* software stack.
*
* @param[in] num_agents Number of agents which require access to the memory
*
* @param[in] agents List of accessing agents.
*
* @param[in] interop_handle Handle of interop buffer (dmabuf handle in Linux)
*
* @param [in] flags Reserved, must be 0
*
* @param[out] size Size in bytes of the mapped object
*
* @param[out] ptr Base address of the mapped object
*
* @param[out] metadata_size Size of metadata in bytes, may be NULL
*
* @param[out] metadata Pointer to metadata, may be NULL
*
* @retval HSA_STATUS_SUCCESS if successfully mapped
*
* @retval HSA_STATUS_ERROR_NOT_INITIALIZED if HSA is not initialized
*
* @retval HSA_STATUS_ERROR_OUT_OF_RESOURCES if there is a failure in allocating
* necessary resources
*
* @retval HSA_STATUS_ERROR_INVALID_ARGUMENT all other errors
*/
hsa_status_t HSA_API hsa_amd_interop_map_buffer(uint32_t num_agents,
hsa_agent_t* agents,
int interop_handle,
uint32_t flags,
size_t* size,
void** ptr,
size_t* metadata_size,
const void** metadata);
/**
* @brief Removes a previously mapped interop object from HSA's flat address space.
* Ends lifetime for the mapping's associated metadata pointer.
*/
hsa_status_t HSA_API hsa_amd_interop_unmap_buffer(void* ptr);
/**
* @brief Encodes an opaque vendor specific image format. The length of data
* depends on the underlying format. This structure must not be copied as its
* true length can not be determined.
*/
typedef struct hsa_amd_image_descriptor_s {
/*
Version number of the descriptor
*/
uint32_t version;
/*
Vendor and device PCI IDs for the format as VENDOR_ID<<16|DEVICE_ID.
*/
uint32_t deviceID;
/*
Start of vendor specific data.
*/
uint32_t data[1];
} hsa_amd_image_descriptor_t;
/**
* @brief Creates an image from an opaque vendor specific image format.
* Does not modify data at image_data. Intended initially for
* accessing interop images.
*
* @param agent[in] Agent on which to create the image
*
* @param[in] image_descriptor[in] Vendor specific image format
*
* @param[in] image_data Pointer to image backing store
*
* @param[in] access_permission Access permissions for the image object
*
* @param[out] image Created image object.
*
* @retval HSA_STATUS_SUCCESS Image created successfully
*
* @retval HSA_STATUS_ERROR_NOT_INITIALIZED if HSA is not initialized
*
* @retval HSA_STATUS_ERROR_OUT_OF_RESOURCES if there is a failure in allocating
* necessary resources
*
* @retval HSA_STATUS_ERROR_INVALID_ARGUMENT Bad or mismatched descriptor,
* null image_data, or mismatched access_permission.
*/
hsa_status_t HSA_API hsa_amd_image_create(
hsa_agent_t agent,
const hsa_ext_image_descriptor_t *image_descriptor,
const hsa_amd_image_descriptor_t *image_layout,
const void *image_data,
hsa_access_permission_t access_permission,
hsa_ext_image_t *image
);
/**
* @brief Denotes the type of memory in a pointer info query.
*/
typedef enum {
/*
Memory is not known to the HSA driver. Unallocated or unlocked system memory.
*/
HSA_EXT_POINTER_TYPE_UNKNOWN = 0,
/*
Memory was allocated with an HSA memory allocator.
*/
HSA_EXT_POINTER_TYPE_HSA = 1,
/*
System memory which has been locked for use with an HSA agent.
Memory of this type is normal malloc'd memory and is always accessible to
the CPU. Pointer info queries may not include CPU agents in the accessible
agents list as the CPU has implicit access.
*/
HSA_EXT_POINTER_TYPE_LOCKED = 2,
/*
Memory originated in a graphics component and is shared with ROCr.
*/
HSA_EXT_POINTER_TYPE_GRAPHICS = 3,
/*
Memory has been shared with the local process via ROCr IPC APIs.
*/
HSA_EXT_POINTER_TYPE_IPC = 4
} hsa_amd_pointer_type_t;
/**
* @brief Describes a memory allocation known to ROCr.
* Within a ROCr major version this structure can only grow.
*/
typedef struct hsa_amd_pointer_info_s {
/*
Size in bytes of this structure. Used for version control within a major ROCr
revision. Set to sizeof(hsa_amd_pointer_t) prior to calling
hsa_amd_pointer_info. If the runtime supports an older version of pointer
info then size will be smaller on return. Members starting after the return
value of size will not be updated by hsa_amd_pointer_info.
*/
uint32_t size;
/*
The type of allocation referenced.
*/
hsa_amd_pointer_type_t type;
/*
Base address at which non-host agents may access the allocation.
*/
void* agentBaseAddress;
/*
Base address at which the host agent may access the allocation.
*/
void* hostBaseAddress;
/*
Size of the allocation
*/
size_t sizeInBytes;
/*
Application provided value.
*/
void* userData;
/*
Reports an agent which "owns" (ie has preferred access to) the pool in which the allocation was
made. When multiple agents share equal access to a pool (ex: multiple CPU agents, or multi-die
GPU boards) any such agent may be returned.
*/
hsa_agent_t agentOwner;
} hsa_amd_pointer_info_t;
/**
* @brief Retrieves information about the allocation referenced by the given
* pointer. Optionally returns the number and list of agents which can
* directly access the allocation.
*
* @param[in] ptr Pointer which references the allocation to retrieve info for.
*
* @param[in, out] info Pointer to structure to be filled with allocation info.
* Data member size must be set to the size of the structure prior to calling
* hsa_amd_pointer_info. On return size will be set to the size of the
* pointer info structure supported by the runtime, if smaller. Members
* beyond the returned value of size will not be updated by the API.
* Must not be NULL.
*
* @param[in] alloc Function pointer to an allocator used to allocate the
* @p accessible array. If NULL @p accessible will not be returned.
*
* @param[out] num_agents_accessible Recieves the count of agents in
* @p accessible. If NULL @p accessible will not be returned.
*
* @param[out] accessible Recieves a pointer to the array, allocated by @p alloc,
* holding the list of agents which may directly access the allocation.
* May be NULL.
*
* @retval HSA_STATUS_SUCCESS Info retrieved successfully
*
* @retval HSA_STATUS_ERROR_NOT_INITIALIZED if HSA is not initialized
*
* @retval HSA_STATUS_ERROR_OUT_OF_RESOURCES if there is a failure in allocating
* necessary resources
*
* @retval HSA_STATUS_ERROR_INVALID_ARGUMENT NULL in @p ptr or @p info.
*/
hsa_status_t HSA_API hsa_amd_pointer_info(void* ptr,
hsa_amd_pointer_info_t* info,
void* (*alloc)(size_t),
uint32_t* num_agents_accessible,
hsa_agent_t** accessible);
/**
* @brief Associates an arbitrary pointer with an allocation known to ROCr.
* The pointer can be fetched by hsa_amd_pointer_info in the userData field.
*
* @param[in] ptr Pointer to the first byte of an allocation known to ROCr
* with which to associate @p userdata.
*
* @param[in] userdata Abitrary pointer to associate with the allocation.
*
* @retval HSA_STATUS_SUCCESS @p userdata successfully stored.
*
* @retval HSA_STATUS_ERROR_NOT_INITIALIZED if HSA is not initialized
*
* @retval HSA_STATUS_ERROR_OUT_OF_RESOURCES if there is a failure in allocating
* necessary resources
*
* @retval HSA_STATUS_ERROR_INVALID_ARGUMENT @p ptr is not known to ROCr.
*/
hsa_status_t HSA_API hsa_amd_pointer_info_set_userdata(void* ptr,
void* userdata);
/**
* @brief 256-bit process independent identifier for a ROCr shared memory
* allocation.
*/
typedef struct hsa_amd_ipc_memory_s {
uint32_t handle[8];
} hsa_amd_ipc_memory_t;
/**
* @brief Prepares an allocation for interprocess sharing and creates a
* handle of type hsa_amd_ipc_memory_t uniquely identifying the allocation. A
* handle is valid while the allocation it references remains accessible in
* any process. In general applications should confirm that a shared memory
* region has been attached (via hsa_amd_ipc_memory_attach) in the remote
* process prior to releasing that memory in the local process.
* Repeated calls for the same allocation may, but are not required to, return
* unique handles.
*
* @param[in] ptr Pointer to memory allocated via ROCr APIs to prepare for
* sharing.
*
* @param[in] len Length in bytes of the allocation to share.
*
* @param[out] handle Process independent identifier referencing the shared
* allocation.
*
* @retval HSA_STATUS_SUCCESS allocation is prepared for interprocess sharing.
*
* @retval HSA_STATUS_ERROR_NOT_INITIALIZED if HSA is not initialized
*
* @retval HSA_STATUS_ERROR_OUT_OF_RESOURCES if there is a failure in allocating
* necessary resources
*
* @retval HSA_STATUS_ERROR_INVALID_ARGUMENT @p ptr does not point to the
* first byte of an allocation made through ROCr, or len is not the full length
* of the allocation or handle is NULL.
*/
hsa_status_t HSA_API hsa_amd_ipc_memory_create(void* ptr, size_t len,
hsa_amd_ipc_memory_t* handle);
/**
* @brief Imports shared memory into the local process and makes it accessible
* by the given agents. If a shared memory handle is attached multiple times
* in a process each attach may return a different address. Each returned
* address is refcounted and requires a matching number of calls to
* hsa_amd_ipc_memory_detach to release the shared memory mapping.
*
* @param[in] handle Pointer to the identifier for the shared memory.
*
* @param[in] len Length of the shared memory to import.
* Reserved. Must be the full length of the shared allocation in this version.
*
* @param[in] num_agents Count of agents in @p mapping_agents.
* May be zero if all agents are to be allowed access.
*
* @param[in] mapping_agents List of agents to access the shared memory.
* Ignored if @p num_agents is zero.
*
* @param[out] mapped_ptr Recieves a process local pointer to the shared memory.
*
* @retval HSA_STATUS_SUCCESS if memory is successfully imported.
*
* @retval HSA_STATUS_ERROR_NOT_INITIALIZED if HSA is not initialized
*
* @retval HSA_STATUS_ERROR_OUT_OF_RESOURCES if there is a failure in allocating
* necessary resources
*
* @retval HSA_STATUS_ERROR_INVALID_ARGUMENT @p handle is not valid, @p len is
* incorrect, @p mapped_ptr is NULL, or some agent for which access was
* requested can not access the shared memory.
*/
hsa_status_t HSA_API hsa_amd_ipc_memory_attach(
const hsa_amd_ipc_memory_t* handle, size_t len,
uint32_t num_agents,
const hsa_agent_t* mapping_agents,
void** mapped_ptr);
/**
* @brief Decrements the reference count for the shared memory mapping and
* releases access to shared memory imported with hsa_amd_ipc_memory_attach.
*
* @param[in] mapped_ptr Pointer to the first byte of a shared allocation
* imported with hsa_amd_ipc_memory_attach.
*
* @retval HSA_STATUS_SUCCESS if @p mapped_ptr was imported with
* hsa_amd_ipc_memory_attach.
*
* @retval HSA_STATUS_ERROR_NOT_INITIALIZED if HSA is not initialized
*
* @retval HSA_STATUS_ERROR_INVALID_ARGUMENT @p mapped_ptr was not imported
* with hsa_amd_ipc_memory_attach.
*/
hsa_status_t HSA_API hsa_amd_ipc_memory_detach(void* mapped_ptr);
/**
* @brief 256-bit process independent identifier for a ROCr IPC signal.
*/
typedef hsa_amd_ipc_memory_t hsa_amd_ipc_signal_t;
/**
* @brief Obtains an interprocess sharing handle for a signal. The handle is
* valid while the signal it references remains valid in any process. In
* general applications should confirm that the signal has been attached (via
* hsa_amd_ipc_signal_attach) in the remote process prior to destroying that
* signal in the local process.
* Repeated calls for the same signal may, but are not required to, return
* unique handles.
*
* @param[in] signal Signal created with attribute HSA_AMD_SIGNAL_IPC.
*
* @param[out] handle Process independent identifier referencing the shared
* signal.
*
* @retval HSA_STATUS_SUCCESS @p handle is ready to use for interprocess sharing.
*
* @retval HSA_STATUS_ERROR_NOT_INITIALIZED if HSA is not initialized
*
* @retval HSA_STATUS_ERROR_OUT_OF_RESOURCES if there is a failure in allocating
* necessary resources
*
* @retval HSA_STATUS_ERROR_INVALID_ARGUMENT @p signal is not a valid signal
* created with attribute HSA_AMD_SIGNAL_IPC or handle is NULL.
*/
hsa_status_t HSA_API hsa_amd_ipc_signal_create(hsa_signal_t signal, hsa_amd_ipc_signal_t* handle);
/**
* @brief Imports an IPC capable signal into the local process. If an IPC
* signal handle is attached multiple times in a process each attach may return
* a different signal handle. Each returned signal handle is refcounted and
* requires a matching number of calls to hsa_signal_destroy to release the
* shared signal.
*
* @param[in] handle Pointer to the identifier for the shared signal.
*
* @param[out] signal Recieves a process local signal handle to the shared signal.
*
* @retval HSA_STATUS_SUCCESS if the signal is successfully imported.
*
* @retval HSA_STATUS_ERROR_NOT_INITIALIZED if HSA is not initialized
*
* @retval HSA_STATUS_ERROR_OUT_OF_RESOURCES if there is a failure in allocating
* necessary resources
*
* @retval HSA_STATUS_ERROR_INVALID_ARGUMENT @p handle is not valid.
*/
hsa_status_t HSA_API hsa_amd_ipc_signal_attach(const hsa_amd_ipc_signal_t* handle,
hsa_signal_t* signal);
/**
* @brief GPU system event type.
*/
typedef enum hsa_amd_event_type_s {
/*
AMD GPU memory fault.
*/
HSA_AMD_GPU_MEMORY_FAULT_EVENT = 0,
} hsa_amd_event_type_t;
/**
* @brief Flags denoting the cause of a memory fault.
*/
typedef enum {
// Page not present or supervisor privilege.
HSA_AMD_MEMORY_FAULT_PAGE_NOT_PRESENT = 1 << 0,
// Write access to a read-only page.
HSA_AMD_MEMORY_FAULT_READ_ONLY = 1 << 1,
// Execute access to a page marked NX.
HSA_AMD_MEMORY_FAULT_NX = 1 << 2,
// GPU attempted access to a host only page.
HSA_AMD_MEMORY_FAULT_HOST_ONLY = 1 << 3,
// DRAM ECC failure.
HSA_AMD_MEMORY_FAULT_DRAM_ECC = 1 << 4,
// Can't determine the exact fault address.
HSA_AMD_MEMORY_FAULT_IMPRECISE = 1 << 5,
// SRAM ECC failure (ie registers, no fault address).
HSA_AMD_MEMORY_FAULT_SRAM_ECC = 1 << 6,
// GPU reset following unspecified hang.
HSA_AMD_MEMORY_FAULT_HANG = 1 << 31
} hsa_amd_memory_fault_reason_t;
/**
* @brief AMD GPU memory fault event data.
*/
typedef struct hsa_amd_gpu_memory_fault_info_s {
/*
The agent where the memory fault occurred.
*/
hsa_agent_t agent;
/*
Virtual address accessed.
*/
uint64_t virtual_address;
/*
Bit field encoding the memory access failure reasons. There could be multiple bits set
for one fault. Bits are defined in hsa_amd_memory_fault_reason_t.
*/
uint32_t fault_reason_mask;
} hsa_amd_gpu_memory_fault_info_t;
/**
* @brief AMD GPU event data passed to event handler.
*/
typedef struct hsa_amd_event_s {
/*
The event type.
*/
hsa_amd_event_type_t event_type;
union {
/*
The memory fault info, only valid when @p event_type is HSA_AMD_GPU_MEMORY_FAULT_EVENT.
*/
hsa_amd_gpu_memory_fault_info_t memory_fault;
};
} hsa_amd_event_t;
typedef hsa_status_t (*hsa_amd_system_event_callback_t)(const hsa_amd_event_t* event, void* data);
/**
* @brief Register AMD GPU event handler.
*
* @param[in] callback Callback to be invoked when an event is triggered.
* The HSA runtime passes two arguments to the callback: @p event
* is defined per event by the HSA runtime, and @p data is the user data.
*
* @param[in] data User data that is passed to @p callback. May be NULL.
*
* @retval HSA_STATUS_SUCCESS The handler has been registered successfully.
*
* @retval HSA_STATUS_ERROR An event handler has already been registered.
*
* @retval HSA_STATUS_ERROR_INVALID_ARGUMENT @p event is invalid.
*/
hsa_status_t HSA_API hsa_amd_register_system_event_handler(hsa_amd_system_event_callback_t callback,
void* data);
/**
* @brief Per-queue dispatch and wavefront scheduling priority.
*/
typedef enum hsa_amd_queue_priority_s {
/*
Below normal/high priority compute and all graphics
*/
HSA_AMD_QUEUE_PRIORITY_LOW = 0,
/*
Above low priority compute, below high priority compute and all graphics
*/
HSA_AMD_QUEUE_PRIORITY_NORMAL = 1,
/*
Above low/normal priority compute and all graphics
*/
HSA_AMD_QUEUE_PRIORITY_HIGH = 2,
} hsa_amd_queue_priority_t;
/**
* @brief Modifies the dispatch and wavefront scheduling prioirty for a
* given compute queue. The default is HSA_AMD_QUEUE_PRIORITY_NORMAL.
*
* @param[in] queue Compute queue to apply new priority to.
*
* @param[in] priority Priority to associate with queue.
*
* @retval HSA_STATUS_SUCCESS if priority was changed successfully.
*
* @retval HSA_STATUS_ERROR_INVALID_QUEUE if queue is not a valid
* compute queue handle.
*
* @retval HSA_STATUS_ERROR_INVALID_ARGUMENT if priority is not a valid
* value from hsa_amd_queue_priority_t.
*/
hsa_status_t HSA_API hsa_amd_queue_set_priority(hsa_queue_t* queue,
hsa_amd_queue_priority_t priority);
/**
* @brief Deallocation notifier function type.
*/
typedef void (*hsa_amd_deallocation_callback_t)(void* ptr, void* user_data);
/**
* @brief Registers a deallocation notifier monitoring for release of agent
* accessible address @p ptr. If successful, @p callback will be invoked when
* @p ptr is removed from accessibility from all agents.
*
* Notification callbacks are automatically deregistered when they are invoked.
*
* Note: The current version supports notifications of address release
* originating from ::hsa_amd_memory_pool_free. Support for other address
* release APIs will follow.
*
* @param[in] ptr Agent accessible address to monitor for deallocation. Passed
* to @p callback.
*
* @param[in] callback Notifier to be invoked when @p ptr is released from
* agent accessibility.
*
* @param[in] user_data User provided value passed to @p callback. May be NULL.
*
* @retval ::HSA_STATUS_SUCCESS The notifier registered successfully
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ALLOCATION @p ptr does not refer to a valid agent accessible
* address.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p callback is NULL or @p ptr is NULL.
*
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES if there is a failure in allocating
* necessary resources
*/
hsa_status_t HSA_API hsa_amd_register_deallocation_callback(void* ptr,
hsa_amd_deallocation_callback_t callback,
void* user_data);
/**
* @brief Removes a deallocation notifier previously registered with
* ::hsa_amd_register_deallocation_callback. Arguments must be identical to
* those given in ::hsa_amd_register_deallocation_callback.
*
* @param[in] ptr Agent accessible address which was monitored for deallocation.
*
* @param[in] callback Notifier to be removed.
*
* @retval ::HSA_STATUS_SUCCESS The notifier has been removed successfully.
*
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
* initialized.
*
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT The given notifier was not registered.
*/
hsa_status_t HSA_API hsa_amd_deregister_deallocation_callback(void* ptr,
hsa_amd_deallocation_callback_t callback);
#ifdef __cplusplus
} // end extern "C" block
#endif
#endif // header guard
|