UTMAREDG
Tensor Store from Shared to Global Memory with Reduction
2 variants on SM90 (H100)
UTMAREDG
[UR],[UR]
distilled:
@UP0 UTMAREDG.1D.ADD [UR0], [UR0] ;
key:
UTMAREDG_UR_UR
| 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 |
| 0 | 1 | 1 | 0 | 1 | 1 | 0 | 1 | 1 | 1 | 0 | 0 | pred | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | operand 1 | 0 | operand 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | |||||||||||||||
| 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 |
| 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | modi 1 | IM2COL | 0 | 0 | 0 | 0 | modi 2 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | stall | y | r-bar | w-bar | b-mask | reuse | 0 | 0 | |||||||||||||||||||
Modifier Group 1 (the `modi 1` field)
| Binary | Value |
|---|---|
| 000 | 1D |
| 001 | 2D |
| 010 | 3D |
| 011 | 4D |
| 100 | 5D |
| 101 | INVALID5 |
| 110 | INVALID6 |
| 111 | INVALID7 |
Modifier Group 2 (the `modi 2` field)
| Binary | Value |
|---|---|
| 000 | ADD |
| 001 | MIN |
| 010 | MAX |
| 011 | INC |
| 100 | DEC |
| 101 | AND |
| 110 | OR |
| 111 | XOR |
UTMAREDG
[UR],[UR],desc[UR]
distilled:
@UP0 UTMAREDG.1D.ADD [UR0], [UR0], desc[UR0] ;
key:
UTMAREDG_UR_UR_UR
| 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 |
| 0 | 1 | 1 | 0 | 1 | 1 | 0 | 1 | 1 | 1 | 0 | 0 | pred | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | operand 1 | 0 | operand 0 | 0 | operand 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | |||||||||||||||||||||
| 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 |
| 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | modi 1 | IM2COL | 0 | 0 | 0 | 0 | modi 2 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | stall | y | r-bar | w-bar | b-mask | reuse | 0 | 0 | |||||||||||||||||||
Modifier Group 1 (the `modi 1` field)
| Binary | Value |
|---|---|
| 000 | 1D |
| 001 | 2D |
| 010 | 3D |
| 011 | 4D |
| 100 | 5D |
| 101 | INVALID5 |
| 110 | INVALID6 |
| 111 | INVALID7 |
Modifier Group 2 (the `modi 2` field)
| Binary | Value |
|---|---|
| 000 | ADD |
| 001 | MIN |
| 010 | MAX |
| 011 | INC |
| 100 | DEC |
| 101 | AND |
| 110 | OR |
| 111 | XOR |