R600RegisterInfo.td revision 263508
1 2class R600Reg <string name, bits<16> encoding> : Register<name> { 3 let Namespace = "AMDGPU"; 4 let HWEncoding = encoding; 5} 6 7class R600RegWithChan <string name, bits<9> sel, string chan> : 8 Register <name> { 9 10 field bits<2> chan_encoding = !if(!eq(chan, "X"), 0, 11 !if(!eq(chan, "Y"), 1, 12 !if(!eq(chan, "Z"), 2, 13 !if(!eq(chan, "W"), 3, 0)))); 14 let HWEncoding{8-0} = sel; 15 let HWEncoding{10-9} = chan_encoding; 16 let Namespace = "AMDGPU"; 17} 18 19class R600Reg_128<string n, list<Register> subregs, bits<16> encoding> : 20 RegisterWithSubRegs<n, subregs> { 21 let Namespace = "AMDGPU"; 22 let SubRegIndices = [sub0, sub1, sub2, sub3]; 23 let HWEncoding = encoding; 24} 25 26class R600Reg_64<string n, list<Register> subregs, bits<16> encoding> : 27 RegisterWithSubRegs<n, subregs> { 28 let Namespace = "AMDGPU"; 29 let SubRegIndices = [sub0, sub1]; 30 let HWEncoding = encoding; 31} 32 33 34foreach Index = 0-127 in { 35 foreach Chan = [ "X", "Y", "Z", "W" ] in { 36 // 32-bit Temporary Registers 37 def T#Index#_#Chan : R600RegWithChan <"T"#Index#"."#Chan, Index, Chan>; 38 39 // Indirect addressing offset registers 40 def Addr#Index#_#Chan : R600RegWithChan <"T("#Index#" + AR.x)."#Chan, 41 Index, Chan>; 42 } 43 // 128-bit Temporary Registers 44 def T#Index#_XYZW : R600Reg_128 <"T"#Index#"", 45 [!cast<Register>("T"#Index#"_X"), 46 !cast<Register>("T"#Index#"_Y"), 47 !cast<Register>("T"#Index#"_Z"), 48 !cast<Register>("T"#Index#"_W")], 49 Index>; 50 51 def T#Index#_XY : R600Reg_64 <"T"#Index#"", 52 [!cast<Register>("T"#Index#"_X"), 53 !cast<Register>("T"#Index#"_Y")], 54 Index>; 55} 56 57// KCACHE_BANK0 58foreach Index = 159-128 in { 59 foreach Chan = [ "X", "Y", "Z", "W" ] in { 60 // 32-bit Temporary Registers 61 def KC0_#Index#_#Chan : R600RegWithChan <"KC0["#!add(Index,-128)#"]."#Chan, Index, Chan>; 62 } 63 // 128-bit Temporary Registers 64 def KC0_#Index#_XYZW : R600Reg_128 <"KC0["#!add(Index, -128)#"].XYZW", 65 [!cast<Register>("KC0_"#Index#"_X"), 66 !cast<Register>("KC0_"#Index#"_Y"), 67 !cast<Register>("KC0_"#Index#"_Z"), 68 !cast<Register>("KC0_"#Index#"_W")], 69 Index>; 70} 71 72// KCACHE_BANK1 73foreach Index = 191-160 in { 74 foreach Chan = [ "X", "Y", "Z", "W" ] in { 75 // 32-bit Temporary Registers 76 def KC1_#Index#_#Chan : R600RegWithChan <"KC1["#!add(Index,-160)#"]."#Chan, Index, Chan>; 77 } 78 // 128-bit Temporary Registers 79 def KC1_#Index#_XYZW : R600Reg_128 <"KC1["#!add(Index, -160)#"].XYZW", 80 [!cast<Register>("KC1_"#Index#"_X"), 81 !cast<Register>("KC1_"#Index#"_Y"), 82 !cast<Register>("KC1_"#Index#"_Z"), 83 !cast<Register>("KC1_"#Index#"_W")], 84 Index>; 85} 86 87 88// Array Base Register holding input in FS 89foreach Index = 448-480 in { 90 def ArrayBase#Index : R600Reg<"ARRAY_BASE", Index>; 91} 92 93 94// Special Registers 95 96def OQA : R600Reg<"OQA", 219>; 97def OQB : R600Reg<"OQB", 220>; 98def OQAP : R600Reg<"OQAP", 221>; 99def OQBP : R600Reg<"OQAP", 222>; 100def LDS_DIRECT_A : R600Reg<"LDS_DIRECT_A", 223>; 101def LDS_DIRECT_B : R600Reg<"LDS_DIRECT_B", 224>; 102def ZERO : R600Reg<"0.0", 248>; 103def ONE : R600Reg<"1.0", 249>; 104def NEG_ONE : R600Reg<"-1.0", 249>; 105def ONE_INT : R600Reg<"1", 250>; 106def HALF : R600Reg<"0.5", 252>; 107def NEG_HALF : R600Reg<"-0.5", 252>; 108def ALU_LITERAL_X : R600RegWithChan<"literal.x", 253, "X">; 109def ALU_LITERAL_Y : R600RegWithChan<"literal.y", 253, "Y">; 110def ALU_LITERAL_Z : R600RegWithChan<"literal.z", 253, "Z">; 111def ALU_LITERAL_W : R600RegWithChan<"literal.w", 253, "W">; 112def PV_X : R600RegWithChan<"PV.X", 254, "X">; 113def PV_Y : R600RegWithChan<"PV.Y", 254, "Y">; 114def PV_Z : R600RegWithChan<"PV.Z", 254, "Z">; 115def PV_W : R600RegWithChan<"PV.W", 254, "W">; 116def PS: R600Reg<"PS", 255>; 117def PREDICATE_BIT : R600Reg<"PredicateBit", 0>; 118def PRED_SEL_OFF: R600Reg<"Pred_sel_off", 0>; 119def PRED_SEL_ZERO : R600Reg<"Pred_sel_zero", 2>; 120def PRED_SEL_ONE : R600Reg<"Pred_sel_one", 3>; 121def AR_X : R600Reg<"AR.x", 0>; 122 123def R600_ArrayBase : RegisterClass <"AMDGPU", [f32, i32], 32, 124 (add (sequence "ArrayBase%u", 448, 480))>; 125// special registers for ALU src operands 126// const buffer reference, SRCx_SEL contains index 127def ALU_CONST : R600Reg<"CBuf", 0>; 128// interpolation param reference, SRCx_SEL contains index 129def ALU_PARAM : R600Reg<"Param", 0>; 130 131let isAllocatable = 0 in { 132 133// XXX: Only use the X channel, until we support wider stack widths 134def R600_Addr : RegisterClass <"AMDGPU", [i32], 127, (add (sequence "Addr%u_X", 0, 127))>; 135 136def R600_LDS_SRC_REG : RegisterClass<"AMDGPU", [i32], 32, 137 (add OQA, OQB, OQAP, OQBP, LDS_DIRECT_A, LDS_DIRECT_B)>; 138 139def R600_KC0_X : RegisterClass <"AMDGPU", [f32, i32], 32, 140 (add (sequence "KC0_%u_X", 128, 159))>; 141 142def R600_KC0_Y : RegisterClass <"AMDGPU", [f32, i32], 32, 143 (add (sequence "KC0_%u_Y", 128, 159))>; 144 145def R600_KC0_Z : RegisterClass <"AMDGPU", [f32, i32], 32, 146 (add (sequence "KC0_%u_Z", 128, 159))>; 147 148def R600_KC0_W : RegisterClass <"AMDGPU", [f32, i32], 32, 149 (add (sequence "KC0_%u_W", 128, 159))>; 150 151def R600_KC0 : RegisterClass <"AMDGPU", [f32, i32], 32, 152 (interleave R600_KC0_X, R600_KC0_Y, 153 R600_KC0_Z, R600_KC0_W)>; 154 155def R600_KC1_X : RegisterClass <"AMDGPU", [f32, i32], 32, 156 (add (sequence "KC1_%u_X", 160, 191))>; 157 158def R600_KC1_Y : RegisterClass <"AMDGPU", [f32, i32], 32, 159 (add (sequence "KC1_%u_Y", 160, 191))>; 160 161def R600_KC1_Z : RegisterClass <"AMDGPU", [f32, i32], 32, 162 (add (sequence "KC1_%u_Z", 160, 191))>; 163 164def R600_KC1_W : RegisterClass <"AMDGPU", [f32, i32], 32, 165 (add (sequence "KC1_%u_W", 160, 191))>; 166 167def R600_KC1 : RegisterClass <"AMDGPU", [f32, i32], 32, 168 (interleave R600_KC1_X, R600_KC1_Y, 169 R600_KC1_Z, R600_KC1_W)>; 170 171} // End isAllocatable = 0 172 173def R600_TReg32_X : RegisterClass <"AMDGPU", [f32, i32], 32, 174 (add (sequence "T%u_X", 0, 127), AR_X)>; 175 176def R600_TReg32_Y : RegisterClass <"AMDGPU", [f32, i32], 32, 177 (add (sequence "T%u_Y", 0, 127))>; 178 179def R600_TReg32_Z : RegisterClass <"AMDGPU", [f32, i32], 32, 180 (add (sequence "T%u_Z", 0, 127))>; 181 182def R600_TReg32_W : RegisterClass <"AMDGPU", [f32, i32], 32, 183 (add (sequence "T%u_W", 0, 127))>; 184 185def R600_TReg32 : RegisterClass <"AMDGPU", [f32, i32], 32, 186 (interleave R600_TReg32_X, R600_TReg32_Y, 187 R600_TReg32_Z, R600_TReg32_W)>; 188 189def R600_Reg32 : RegisterClass <"AMDGPU", [f32, i32], 32, (add 190 R600_TReg32, 191 R600_ArrayBase, 192 R600_Addr, 193 R600_KC0, R600_KC1, 194 ZERO, HALF, ONE, ONE_INT, PV_X, ALU_LITERAL_X, NEG_ONE, NEG_HALF, 195 ALU_CONST, ALU_PARAM, OQAP 196 )>; 197 198def R600_Predicate : RegisterClass <"AMDGPU", [i32], 32, (add 199 PRED_SEL_OFF, PRED_SEL_ZERO, PRED_SEL_ONE)>; 200 201def R600_Predicate_Bit: RegisterClass <"AMDGPU", [i32], 32, (add 202 PREDICATE_BIT)>; 203 204def R600_Reg128 : RegisterClass<"AMDGPU", [v4f32, v4i32], 128, 205 (add (sequence "T%u_XYZW", 0, 127))> { 206 let CopyCost = -1; 207} 208 209def R600_Reg64 : RegisterClass<"AMDGPU", [v2f32, v2i32], 64, 210 (add (sequence "T%u_XY", 0, 63))>; 211