2016-06-24 14:37:17 -05:00
// Copyright 2016 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.
// +build ignore
package main
import "strings"
2016-08-04 11:34:43 -07:00
// Notes:
// - Less-than-64-bit integer types live in the low portion of registers.
// For now, the upper portion is junk; sign/zero-extension might be optimized in the future, but not yet.
// - Boolean types are zero or 1; stored in a byte, but loaded with AMOVBZ so the upper bytes of a register are zero.
2017-01-07 08:23:11 -08:00
// - *const instructions may use a constant larger than the instruction can encode.
2016-08-04 11:34:43 -07:00
// In this case the assembler expands to multiple instructions and uses tmp
// register (R31).
2016-06-24 14:37:17 -05:00
var regNamesPPC64 = [ ] string {
2016-09-16 15:02:47 -07:00
"R0" , // REGZERO, not used, but simplifies counting in regalloc
2016-06-24 14:37:17 -05:00
"SP" , // REGSP
"SB" , // REGSB
"R3" ,
"R4" ,
"R5" ,
"R6" ,
"R7" ,
"R8" ,
"R9" ,
"R10" ,
"R11" , // REGCTXT for closures
"R12" ,
"R13" , // REGTLS
"R14" ,
"R15" ,
"R16" ,
"R17" ,
"R18" ,
"R19" ,
"R20" ,
"R21" ,
"R22" ,
"R23" ,
"R24" ,
"R25" ,
"R26" ,
"R27" ,
"R28" ,
"R29" ,
2016-07-26 09:24:18 -07:00
"g" , // REGG. Using name "g" and setting Config.hasGReg makes it "just happen".
2016-06-24 14:37:17 -05:00
"R31" , // REGTMP
2016-07-26 09:24:18 -07:00
2016-06-24 14:37:17 -05:00
"F0" ,
"F1" ,
"F2" ,
"F3" ,
"F4" ,
"F5" ,
"F6" ,
"F7" ,
"F8" ,
"F9" ,
"F10" ,
"F11" ,
"F12" ,
"F13" ,
"F14" ,
"F15" ,
"F16" ,
"F17" ,
"F18" ,
"F19" ,
"F20" ,
"F21" ,
"F22" ,
"F23" ,
"F24" ,
"F25" ,
"F26" ,
cmd/compile, runtime, etc: get rid of constant FP registers
On ARM64, MIPS64, and PPC64, some floating point registers were
reserved for constants 0, 1, 2, 0.5, etc. This CL removes them.
On ARM64, they are never used. On MIPS64 and PPC64, the only use
case is a multiplication-by-2 in the old backend of the compiler,
which is replaced with an addition.
Change-Id: I737cbf43283756e3408964fc88c567a938c57036
Reviewed-on: https://go-review.googlesource.com/28095
Run-TryBot: Cherry Zhang <cherryyz@google.com>
Reviewed-by: David Chase <drchase@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
2016-08-30 14:46:25 -04:00
"F27" ,
"F28" ,
"F29" ,
"F30" ,
"F31" ,
2016-07-26 09:24:18 -07:00
2019-10-28 00:53:14 -04:00
// If you add registers, update asyncPreempt in runtime.
2016-07-26 09:24:18 -07:00
// "CR0",
// "CR1",
// "CR2",
// "CR3",
// "CR4",
// "CR5",
// "CR6",
// "CR7",
2016-08-04 06:57:34 -04:00
// "CR",
2016-07-26 09:24:18 -07:00
// "XER",
// "LR",
// "CTR",
2016-06-24 14:37:17 -05:00
}
func init ( ) {
// Make map from reg names to reg integers.
if len ( regNamesPPC64 ) > 64 {
panic ( "too many registers" )
}
num := map [ string ] int { }
for i , name := range regNamesPPC64 {
num [ name ] = i
}
buildReg := func ( s string ) regMask {
m := regMask ( 0 )
for _ , r := range strings . Split ( s , " " ) {
if n , ok := num [ r ] ; ok {
m |= regMask ( 1 ) << uint ( n )
continue
}
panic ( "register " + r + " not found" )
}
return m
}
var (
2016-07-26 09:24:18 -07:00
gp = buildReg ( "R3 R4 R5 R6 R7 R8 R9 R10 R11 R12 R14 R15 R16 R17 R18 R19 R20 R21 R22 R23 R24 R25 R26 R27 R28 R29" )
2016-08-10 11:44:57 -07:00
fp = buildReg ( "F1 F2 F3 F4 F5 F6 F7 F8 F9 F10 F11 F12 F13 F14 F15 F16 F17 F18 F19 F20 F21 F22 F23 F24 F25 F26" )
2016-06-24 14:37:17 -05:00
sp = buildReg ( "SP" )
2016-07-06 13:32:52 -07:00
sb = buildReg ( "SB" )
2016-08-15 13:51:00 -07:00
gr = buildReg ( "g" )
2016-08-10 11:44:57 -07:00
// cr = buildReg("CR")
// ctr = buildReg("CTR")
// lr = buildReg("LR")
2017-09-11 10:39:24 -04:00
tmp = buildReg ( "R31" )
ctxt = buildReg ( "R11" )
callptr = buildReg ( "R12" )
2016-08-10 11:44:57 -07:00
// tls = buildReg("R13")
2016-08-04 06:57:34 -04:00
gp01 = regInfo { inputs : nil , outputs : [ ] regMask { gp } }
[dev.ssa] cmd/compile: replace storeconst w/ storezero, fold addressing
Because PPC lacks store-immediate, remove the instruction
that implies that it exists. Replace it with storezero for
the special case of storing zero, because R0 is reserved zero
for Go (though the assembler knows this, do it in SSA).
Also added address folding for storezero.
(Now corrected to use right-sized stores in bulk-zero code.)
Hello.go now compiles to
genssa main
00000 (...hello.go:7) TEXT "".main(SB), $0
00001 (...hello.go:7) FUNCDATA $0, "".gcargs·0(SB)
00002 (...hello.go:7) FUNCDATA $1, "".gclocals·1(SB)
v23 00003 (...hello.go:8) MOVD $go.string."Hello, World!\n"(SB), R3
v11 00004 (...hello.go:8) MOVD R3, 32(R1)
v22 00005 (...hello.go:8) MOVD $14, R3
v6 00006 (...hello.go:8) MOVD R3, 40(R1)
v20 00007 (...hello.go:8) MOVD R0, 48(R1)
v18 00008 (...hello.go:8) MOVD R0, 56(R1)
v9 00009 (...hello.go:8) MOVD R0, 64(R1)
v10 00010 (...hello.go:8) CALL fmt.Printf(SB)
b2 00011 (...hello.go:9) RET
00012 (<unknown line number>) END
Updates #16010
Change-Id: I33cfd98c21a1617502260ac753fa8cad68c8d85a
Reviewed-on: https://go-review.googlesource.com/25151
Reviewed-by: Cherry Zhang <cherryyz@google.com>
Run-TryBot: David Chase <drchase@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
2016-07-22 10:47:16 -07:00
gp11 = regInfo { inputs : [ ] regMask { gp | sp | sb } , outputs : [ ] regMask { gp } }
gp21 = regInfo { inputs : [ ] regMask { gp | sp | sb , gp | sp | sb } , outputs : [ ] regMask { gp } }
2020-08-17 16:14:48 -05:00
gp31 = regInfo { inputs : [ ] regMask { gp | sp | sb , gp | sp | sb , gp | sp | sb } , outputs : [ ] regMask { gp } }
2018-10-01 18:24:43 -03:00
gp22 = regInfo { inputs : [ ] regMask { gp | sp | sb , gp | sp | sb } , outputs : [ ] regMask { gp , gp } }
2019-04-24 14:33:50 -03:00
gp32 = regInfo { inputs : [ ] regMask { gp | sp | sb , gp | sp | sb , gp | sp | sb } , outputs : [ ] regMask { gp , gp } }
2016-08-04 06:57:34 -04:00
gp1cr = regInfo { inputs : [ ] regMask { gp | sp | sb } }
gp2cr = regInfo { inputs : [ ] regMask { gp | sp | sb , gp | sp | sb } }
crgp = regInfo { inputs : nil , outputs : [ ] regMask { gp } }
2019-09-12 09:22:07 -04:00
crgp11 = regInfo { inputs : [ ] regMask { gp } , outputs : [ ] regMask { gp } }
crgp21 = regInfo { inputs : [ ] regMask { gp , gp } , outputs : [ ] regMask { gp } }
[dev.ssa] cmd/compile: replace storeconst w/ storezero, fold addressing
Because PPC lacks store-immediate, remove the instruction
that implies that it exists. Replace it with storezero for
the special case of storing zero, because R0 is reserved zero
for Go (though the assembler knows this, do it in SSA).
Also added address folding for storezero.
(Now corrected to use right-sized stores in bulk-zero code.)
Hello.go now compiles to
genssa main
00000 (...hello.go:7) TEXT "".main(SB), $0
00001 (...hello.go:7) FUNCDATA $0, "".gcargs·0(SB)
00002 (...hello.go:7) FUNCDATA $1, "".gclocals·1(SB)
v23 00003 (...hello.go:8) MOVD $go.string."Hello, World!\n"(SB), R3
v11 00004 (...hello.go:8) MOVD R3, 32(R1)
v22 00005 (...hello.go:8) MOVD $14, R3
v6 00006 (...hello.go:8) MOVD R3, 40(R1)
v20 00007 (...hello.go:8) MOVD R0, 48(R1)
v18 00008 (...hello.go:8) MOVD R0, 56(R1)
v9 00009 (...hello.go:8) MOVD R0, 64(R1)
v10 00010 (...hello.go:8) CALL fmt.Printf(SB)
b2 00011 (...hello.go:9) RET
00012 (<unknown line number>) END
Updates #16010
Change-Id: I33cfd98c21a1617502260ac753fa8cad68c8d85a
Reviewed-on: https://go-review.googlesource.com/25151
Reviewed-by: Cherry Zhang <cherryyz@google.com>
Run-TryBot: David Chase <drchase@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
2016-07-22 10:47:16 -07:00
gpload = regInfo { inputs : [ ] regMask { gp | sp | sb } , outputs : [ ] regMask { gp } }
2018-09-14 16:30:54 -04:00
gploadidx = regInfo { inputs : [ ] regMask { gp | sp | sb , gp } , outputs : [ ] regMask { gp } }
2016-08-04 06:57:34 -04:00
gpstore = regInfo { inputs : [ ] regMask { gp | sp | sb , gp | sp | sb } }
2018-09-14 16:30:54 -04:00
gpstoreidx = regInfo { inputs : [ ] regMask { gp | sp | sb , gp | sp | sb , gp | sp | sb } }
2016-08-04 06:57:34 -04:00
gpstorezero = regInfo { inputs : [ ] regMask { gp | sp | sb } } // ppc64.REGZERO is reserved zero value
2017-02-10 17:45:12 -05:00
gpxchg = regInfo { inputs : [ ] regMask { gp | sp | sb , gp } , outputs : [ ] regMask { gp } }
gpcas = regInfo { inputs : [ ] regMask { gp | sp | sb , gp , gp } , outputs : [ ] regMask { gp } }
2016-08-04 06:57:34 -04:00
fp01 = regInfo { inputs : nil , outputs : [ ] regMask { fp } }
2016-08-08 14:19:56 -07:00
fp11 = regInfo { inputs : [ ] regMask { fp } , outputs : [ ] regMask { fp } }
2016-08-10 11:44:57 -07:00
fpgp = regInfo { inputs : [ ] regMask { fp } , outputs : [ ] regMask { gp } }
gpfp = regInfo { inputs : [ ] regMask { gp } , outputs : [ ] regMask { fp } }
2016-08-08 14:19:56 -07:00
fp21 = regInfo { inputs : [ ] regMask { fp , fp } , outputs : [ ] regMask { fp } }
2017-03-13 14:39:17 -04:00
fp31 = regInfo { inputs : [ ] regMask { fp , fp , fp } , outputs : [ ] regMask { fp } }
2016-08-08 14:19:56 -07:00
fp2cr = regInfo { inputs : [ ] regMask { fp , fp } }
fpload = regInfo { inputs : [ ] regMask { gp | sp | sb } , outputs : [ ] regMask { fp } }
2018-09-14 16:30:54 -04:00
fploadidx = regInfo { inputs : [ ] regMask { gp | sp | sb , gp | sp | sb } , outputs : [ ] regMask { fp } }
2016-08-08 14:19:56 -07:00
fpstore = regInfo { inputs : [ ] regMask { gp | sp | sb , fp } }
2018-09-14 16:30:54 -04:00
fpstoreidx = regInfo { inputs : [ ] regMask { gp | sp | sb , gp | sp | sb , fp } }
2016-08-15 13:51:00 -07:00
callerSave = regMask ( gp | fp | gr )
2019-02-06 14:12:36 -08:00
r3 = buildReg ( "R3" )
r4 = buildReg ( "R4" )
r5 = buildReg ( "R5" )
r6 = buildReg ( "R6" )
2016-06-24 14:37:17 -05:00
)
ops := [ ] opData {
2017-10-10 10:26:35 -04:00
{ name : "ADD" , argLength : 2 , reg : gp21 , asm : "ADD" , commutative : true } , // arg0 + arg1
{ name : "ADDconst" , argLength : 1 , reg : gp11 , asm : "ADD" , aux : "Int64" } , // arg0 + auxInt
{ name : "FADD" , argLength : 2 , reg : fp21 , asm : "FADD" , commutative : true } , // arg0+arg1
{ name : "FADDS" , argLength : 2 , reg : fp21 , asm : "FADDS" , commutative : true } , // arg0+arg1
{ name : "SUB" , argLength : 2 , reg : gp21 , asm : "SUB" } , // arg0-arg1
2020-08-20 15:06:23 -05:00
{ name : "SUBFCconst" , argLength : 1 , reg : gp11 , asm : "SUBC" , aux : "Int64" } , // auxInt - arg0 (with carry)
2017-10-10 10:26:35 -04:00
{ name : "FSUB" , argLength : 2 , reg : fp21 , asm : "FSUB" } , // arg0-arg1
{ name : "FSUBS" , argLength : 2 , reg : fp21 , asm : "FSUBS" } , // arg0-arg1
2016-08-02 13:17:09 -07:00
2016-08-08 14:19:56 -07:00
{ name : "MULLD" , argLength : 2 , reg : gp21 , asm : "MULLD" , typ : "Int64" , commutative : true } , // arg0*arg1 (signed 64-bit)
{ name : "MULLW" , argLength : 2 , reg : gp21 , asm : "MULLW" , typ : "Int32" , commutative : true } , // arg0*arg1 (signed 32-bit)
2020-08-17 16:14:48 -05:00
{ name : "MADDLD" , argLength : 3 , reg : gp31 , asm : "MADDLD" , typ : "Int64" } , // (arg0*arg1)+arg2 (signed 64-bit)
2016-08-02 13:17:09 -07:00
{ name : "MULHD" , argLength : 2 , reg : gp21 , asm : "MULHD" , commutative : true } , // (arg0 * arg1) >> 64, signed
{ name : "MULHW" , argLength : 2 , reg : gp21 , asm : "MULHW" , commutative : true } , // (arg0 * arg1) >> 32, signed
{ name : "MULHDU" , argLength : 2 , reg : gp21 , asm : "MULHDU" , commutative : true } , // (arg0 * arg1) >> 64, unsigned
{ name : "MULHWU" , argLength : 2 , reg : gp21 , asm : "MULHWU" , commutative : true } , // (arg0 * arg1) >> 32, unsigned
2018-10-01 18:24:43 -03:00
{ name : "LoweredMuluhilo" , argLength : 2 , reg : gp22 , resultNotInArgs : true } , // arg0 * arg1, returns (hi, lo)
2016-08-02 13:17:09 -07:00
2016-07-26 09:24:18 -07:00
{ name : "FMUL" , argLength : 2 , reg : fp21 , asm : "FMUL" , commutative : true } , // arg0*arg1
{ name : "FMULS" , argLength : 2 , reg : fp21 , asm : "FMULS" , commutative : true } , // arg0*arg1
2016-08-02 13:17:09 -07:00
2017-03-13 14:39:17 -04:00
{ name : "FMADD" , argLength : 3 , reg : fp31 , asm : "FMADD" } , // arg0*arg1 + arg2
{ name : "FMADDS" , argLength : 3 , reg : fp31 , asm : "FMADDS" } , // arg0*arg1 + arg2
{ name : "FMSUB" , argLength : 3 , reg : fp31 , asm : "FMSUB" } , // arg0*arg1 - arg2
{ name : "FMSUBS" , argLength : 3 , reg : fp31 , asm : "FMSUBS" } , // arg0*arg1 - arg2
2020-05-07 15:16:25 -07:00
{ name : "SRAD" , argLength : 2 , reg : gp21 , asm : "SRAD" } , // signed arg0 >> (arg1&127), 64 bit width (note: 127, not 63!)
{ name : "SRAW" , argLength : 2 , reg : gp21 , asm : "SRAW" } , // signed arg0 >> (arg1&63), 32 bit width
{ name : "SRD" , argLength : 2 , reg : gp21 , asm : "SRD" } , // unsigned arg0 >> (arg1&127), 64 bit width
{ name : "SRW" , argLength : 2 , reg : gp21 , asm : "SRW" } , // unsigned arg0 >> (arg1&63), 32 bit width
{ name : "SLD" , argLength : 2 , reg : gp21 , asm : "SLD" } , // arg0 << (arg1&127), 64 bit width
{ name : "SLW" , argLength : 2 , reg : gp21 , asm : "SLW" } , // arg0 << (arg1&63), 32 bit width
2016-08-02 13:17:09 -07:00
2017-08-29 11:49:08 -04:00
{ name : "ROTL" , argLength : 2 , reg : gp21 , asm : "ROTL" } , // arg0 rotate left by arg1 mod 64
{ name : "ROTLW" , argLength : 2 , reg : gp21 , asm : "ROTLW" } , // uint32(arg0) rotate left by arg1 mod 32
2020-08-20 15:06:06 -05:00
{ name : "LoweredAdd64Carry" , argLength : 3 , reg : gp32 , resultNotInArgs : true } , // arg0 + arg1 + carry, returns (sum, carry)
2016-08-02 13:17:09 -07:00
2020-05-07 15:16:25 -07:00
{ name : "SRADconst" , argLength : 1 , reg : gp11 , asm : "SRAD" , aux : "Int64" } , // signed arg0 >> auxInt, 0 <= auxInt < 64, 64 bit width
{ name : "SRAWconst" , argLength : 1 , reg : gp11 , asm : "SRAW" , aux : "Int64" } , // signed arg0 >> auxInt, 0 <= auxInt < 32, 32 bit width
{ name : "SRDconst" , argLength : 1 , reg : gp11 , asm : "SRD" , aux : "Int64" } , // unsigned arg0 >> auxInt, 0 <= auxInt < 64, 64 bit width
{ name : "SRWconst" , argLength : 1 , reg : gp11 , asm : "SRW" , aux : "Int64" } , // unsigned arg0 >> auxInt, 0 <= auxInt < 32, 32 bit width
{ name : "SLDconst" , argLength : 1 , reg : gp11 , asm : "SLD" , aux : "Int64" } , // arg0 << auxInt, 0 <= auxInt < 64, 64 bit width
{ name : "SLWconst" , argLength : 1 , reg : gp11 , asm : "SLW" , aux : "Int64" } , // arg0 << auxInt, 0 <= auxInt < 32, 32 bit width
2016-08-02 13:17:09 -07:00
2017-04-18 17:05:31 -04:00
{ name : "ROTLconst" , argLength : 1 , reg : gp11 , asm : "ROTL" , aux : "Int64" } , // arg0 rotate left by auxInt bits
{ name : "ROTLWconst" , argLength : 1 , reg : gp11 , asm : "ROTLW" , aux : "Int64" } , // uint32(arg0) rotate left by auxInt bits
2017-04-24 15:11:39 -04:00
{ name : "CNTLZD" , argLength : 1 , reg : gp11 , asm : "CNTLZD" , clobberFlags : true } , // count leading zeros
{ name : "CNTLZW" , argLength : 1 , reg : gp11 , asm : "CNTLZW" , clobberFlags : true } , // count leading zeros (32 bit)
2019-02-08 16:18:12 -02:00
{ name : "CNTTZD" , argLength : 1 , reg : gp11 , asm : "CNTTZD" } , // count trailing zeros
{ name : "CNTTZW" , argLength : 1 , reg : gp11 , asm : "CNTTZW" } , // count trailing zeros (32 bit)
2017-04-24 15:11:39 -04:00
{ name : "POPCNTD" , argLength : 1 , reg : gp11 , asm : "POPCNTD" } , // number of set bits in arg0
{ name : "POPCNTW" , argLength : 1 , reg : gp11 , asm : "POPCNTW" } , // number of set bits in each word of arg0 placed in corresponding word
2019-09-08 19:36:13 +03:00
{ name : "POPCNTB" , argLength : 1 , reg : gp11 , asm : "POPCNTB" } , // number of set bits in each byte of arg0 placed in corresponding byte
2017-04-24 15:11:39 -04:00
2016-08-02 13:17:09 -07:00
{ name : "FDIV" , argLength : 2 , reg : fp21 , asm : "FDIV" } , // arg0/arg1
{ name : "FDIVS" , argLength : 2 , reg : fp21 , asm : "FDIVS" } , // arg0/arg1
2016-08-08 14:19:56 -07:00
{ name : "DIVD" , argLength : 2 , reg : gp21 , asm : "DIVD" , typ : "Int64" } , // arg0/arg1 (signed 64-bit)
{ name : "DIVW" , argLength : 2 , reg : gp21 , asm : "DIVW" , typ : "Int32" } , // arg0/arg1 (signed 32-bit)
{ name : "DIVDU" , argLength : 2 , reg : gp21 , asm : "DIVDU" , typ : "Int64" } , // arg0/arg1 (unsigned 64-bit)
{ name : "DIVWU" , argLength : 2 , reg : gp21 , asm : "DIVWU" , typ : "Int32" } , // arg0/arg1 (unsigned 32-bit)
2020-04-23 15:36:28 -04:00
{ name : "MODUD" , argLength : 2 , reg : gp21 , asm : "MODUD" , typ : "UInt64" } , // arg0 % arg1 (unsigned 64-bit)
{ name : "MODSD" , argLength : 2 , reg : gp21 , asm : "MODSD" , typ : "Int64" } , // arg0 % arg1 (signed 64-bit)
{ name : "MODUW" , argLength : 2 , reg : gp21 , asm : "MODUW" , typ : "UInt32" } , // arg0 % arg1 (unsigned 32-bit)
{ name : "MODSW" , argLength : 2 , reg : gp21 , asm : "MODSW" , typ : "Int32" } , // arg0 % arg1 (signed 32-bit)
2016-08-08 14:19:56 -07:00
// MOD is implemented as rem := arg0 - (arg0/arg1) * arg1
2016-08-04 11:34:43 -07:00
2016-08-10 11:44:57 -07:00
// Conversions are all float-to-float register operations. "Integer" refers to encoding in the FP register.
{ name : "FCTIDZ" , argLength : 1 , reg : fp11 , asm : "FCTIDZ" , typ : "Float64" } , // convert float to 64-bit int round towards zero
{ name : "FCTIWZ" , argLength : 1 , reg : fp11 , asm : "FCTIWZ" , typ : "Float64" } , // convert float to 32-bit int round towards zero
{ name : "FCFID" , argLength : 1 , reg : fp11 , asm : "FCFID" , typ : "Float64" } , // convert 64-bit integer to float
2017-09-12 12:33:21 -04:00
{ name : "FCFIDS" , argLength : 1 , reg : fp11 , asm : "FCFIDS" , typ : "Float32" } , // convert 32-bit integer to float
2016-08-10 11:44:57 -07:00
{ name : "FRSP" , argLength : 1 , reg : fp11 , asm : "FRSP" , typ : "Float64" } , // round float to 32-bit value
// Movement between float and integer registers with no change in bits; accomplished with stores+loads on PPC.
// Because the 32-bit load-literal-bits instructions have impoverished addressability, always widen the
// data instead and use FMOVDload and FMOVDstore instead (this will also dodge endianess issues).
// There are optimizations that should apply -- (Xi2f64 (MOVWload (not-ADD-ptr+offset) ) ) could use
// the word-load instructions. (Xi2f64 (MOVDload ptr )) can be (FMOVDload ptr)
2017-09-12 12:33:21 -04:00
{ name : "MFVSRD" , argLength : 1 , reg : fpgp , asm : "MFVSRD" , typ : "Int64" } , // move 64 bits of F register into G register
{ name : "MTVSRD" , argLength : 1 , reg : gpfp , asm : "MTVSRD" , typ : "Float64" } , // move 64 bits of G register into F register
2016-08-10 11:44:57 -07:00
2019-09-23 16:16:04 -04:00
{ name : "AND" , argLength : 2 , reg : gp21 , asm : "AND" , commutative : true } , // arg0&arg1
{ name : "ANDN" , argLength : 2 , reg : gp21 , asm : "ANDN" } , // arg0&^arg1
{ name : "ANDCC" , argLength : 2 , reg : gp2cr , asm : "ANDCC" , commutative : true , typ : "Flags" } , // arg0&arg1 sets CC
{ name : "OR" , argLength : 2 , reg : gp21 , asm : "OR" , commutative : true } , // arg0|arg1
{ name : "ORN" , argLength : 2 , reg : gp21 , asm : "ORN" } , // arg0|^arg1
{ name : "ORCC" , argLength : 2 , reg : gp2cr , asm : "ORCC" , commutative : true , typ : "Flags" } , // arg0|arg1 sets CC
{ name : "NOR" , argLength : 2 , reg : gp21 , asm : "NOR" , commutative : true } , // ^(arg0|arg1)
{ name : "XOR" , argLength : 2 , reg : gp21 , asm : "XOR" , typ : "Int64" , commutative : true } , // arg0^arg1
{ name : "XORCC" , argLength : 2 , reg : gp2cr , asm : "XORCC" , commutative : true , typ : "Flags" } , // arg0^arg1 sets CC
{ name : "EQV" , argLength : 2 , reg : gp21 , asm : "EQV" , typ : "Int64" , commutative : true } , // arg0^^arg1
{ name : "NEG" , argLength : 1 , reg : gp11 , asm : "NEG" } , // -arg0 (integer)
{ name : "FNEG" , argLength : 1 , reg : fp11 , asm : "FNEG" } , // -arg0 (floating point)
{ name : "FSQRT" , argLength : 1 , reg : fp11 , asm : "FSQRT" } , // sqrt(arg0) (floating point)
{ name : "FSQRTS" , argLength : 1 , reg : fp11 , asm : "FSQRTS" } , // sqrt(arg0) (floating point, single precision)
{ name : "FFLOOR" , argLength : 1 , reg : fp11 , asm : "FRIM" } , // floor(arg0), float64
{ name : "FCEIL" , argLength : 1 , reg : fp11 , asm : "FRIP" } , // ceil(arg0), float64
{ name : "FTRUNC" , argLength : 1 , reg : fp11 , asm : "FRIZ" } , // trunc(arg0), float64
{ name : "FROUND" , argLength : 1 , reg : fp11 , asm : "FRIN" } , // round(arg0), float64
{ name : "FABS" , argLength : 1 , reg : fp11 , asm : "FABS" } , // abs(arg0), float64
{ name : "FNABS" , argLength : 1 , reg : fp11 , asm : "FNABS" } , // -abs(arg0), float64
{ name : "FCPSGN" , argLength : 2 , reg : fp21 , asm : "FCPSGN" } , // copysign arg0 -> arg1, float64
2016-08-04 11:34:43 -07:00
2016-08-04 06:57:34 -04:00
{ name : "ORconst" , argLength : 1 , reg : gp11 , asm : "OR" , aux : "Int64" } , // arg0|aux
{ name : "XORconst" , argLength : 1 , reg : gp11 , asm : "XOR" , aux : "Int64" } , // arg0^aux
{ name : "ANDconst" , argLength : 1 , reg : regInfo { inputs : [ ] regMask { gp | sp | sb } , outputs : [ ] regMask { gp } } , asm : "ANDCC" , aux : "Int64" , clobberFlags : true } , // arg0&aux // and-immediate sets CC on PPC, always.
2016-10-05 13:21:09 -07:00
{ name : "ANDCCconst" , argLength : 1 , reg : regInfo { inputs : [ ] regMask { gp | sp | sb } } , asm : "ANDCC" , aux : "Int64" , typ : "Flags" } , // arg0&aux == 0 // and-immediate sets CC on PPC, always.
2016-08-04 11:34:43 -07:00
2018-03-01 11:40:36 -05:00
{ name : "MOVBreg" , argLength : 1 , reg : gp11 , asm : "MOVB" , typ : "Int64" } , // sign extend int8 to int64
{ name : "MOVBZreg" , argLength : 1 , reg : gp11 , asm : "MOVBZ" , typ : "Int64" } , // zero extend uint8 to uint64
{ name : "MOVHreg" , argLength : 1 , reg : gp11 , asm : "MOVH" , typ : "Int64" } , // sign extend int16 to int64
{ name : "MOVHZreg" , argLength : 1 , reg : gp11 , asm : "MOVHZ" , typ : "Int64" } , // zero extend uint16 to uint64
{ name : "MOVWreg" , argLength : 1 , reg : gp11 , asm : "MOVW" , typ : "Int64" } , // sign extend int32 to int64
{ name : "MOVWZreg" , argLength : 1 , reg : gp11 , asm : "MOVWZ" , typ : "Int64" } , // zero extend uint32 to uint64
// Load bytes in the endian order of the arch from arg0+aux+auxint into a 64 bit register.
{ name : "MOVBZload" , argLength : 2 , reg : gpload , asm : "MOVBZ" , aux : "SymOff" , typ : "UInt8" , faultOnNilArg0 : true , symEffect : "Read" } , // load byte zero extend
{ name : "MOVHload" , argLength : 2 , reg : gpload , asm : "MOVH" , aux : "SymOff" , typ : "Int16" , faultOnNilArg0 : true , symEffect : "Read" } , // load 2 bytes sign extend
{ name : "MOVHZload" , argLength : 2 , reg : gpload , asm : "MOVHZ" , aux : "SymOff" , typ : "UInt16" , faultOnNilArg0 : true , symEffect : "Read" } , // load 2 bytes zero extend
{ name : "MOVWload" , argLength : 2 , reg : gpload , asm : "MOVW" , aux : "SymOff" , typ : "Int32" , faultOnNilArg0 : true , symEffect : "Read" } , // load 4 bytes sign extend
{ name : "MOVWZload" , argLength : 2 , reg : gpload , asm : "MOVWZ" , aux : "SymOff" , typ : "UInt32" , faultOnNilArg0 : true , symEffect : "Read" } , // load 4 bytes zero extend
{ name : "MOVDload" , argLength : 2 , reg : gpload , asm : "MOVD" , aux : "SymOff" , typ : "Int64" , faultOnNilArg0 : true , symEffect : "Read" } , // load 8 bytes
// Load bytes in reverse endian order of the arch from arg0 into a 64 bit register, all zero extend.
// The generated instructions are indexed loads with no offset field in the instruction so the aux fields are not used.
// In these cases the index register field is set to 0 and the full address is in the base register.
{ name : "MOVDBRload" , argLength : 2 , reg : gpload , asm : "MOVDBR" , aux : "SymOff" , typ : "Int64" , faultOnNilArg0 : true , symEffect : "Read" } , // load 8 bytes reverse order
{ name : "MOVWBRload" , argLength : 2 , reg : gpload , asm : "MOVWBR" , aux : "SymOff" , typ : "Int32" , faultOnNilArg0 : true , symEffect : "Read" } , // load 4 bytes zero extend reverse order
{ name : "MOVHBRload" , argLength : 2 , reg : gpload , asm : "MOVHBR" , aux : "SymOff" , typ : "Int16" , faultOnNilArg0 : true , symEffect : "Read" } , // load 2 bytes zero extend reverse order
2018-09-14 16:30:54 -04:00
// In these cases an index register is used in addition to a base register
2020-03-20 09:59:53 -07:00
// Loads from memory location arg[0] + arg[1].
{ name : "MOVBZloadidx" , argLength : 3 , reg : gploadidx , asm : "MOVBZ" , typ : "UInt8" } , // zero extend uint8 to uint64
{ name : "MOVHloadidx" , argLength : 3 , reg : gploadidx , asm : "MOVH" , typ : "Int16" } , // sign extend int16 to int64
{ name : "MOVHZloadidx" , argLength : 3 , reg : gploadidx , asm : "MOVHZ" , typ : "UInt16" } , // zero extend uint16 to uint64
{ name : "MOVWloadidx" , argLength : 3 , reg : gploadidx , asm : "MOVW" , typ : "Int32" } , // sign extend int32 to int64
{ name : "MOVWZloadidx" , argLength : 3 , reg : gploadidx , asm : "MOVWZ" , typ : "UInt32" } , // zero extend uint32 to uint64
{ name : "MOVDloadidx" , argLength : 3 , reg : gploadidx , asm : "MOVD" , typ : "Int64" } ,
{ name : "MOVHBRloadidx" , argLength : 3 , reg : gploadidx , asm : "MOVHBR" , typ : "Int16" } , // sign extend int16 to int64
{ name : "MOVWBRloadidx" , argLength : 3 , reg : gploadidx , asm : "MOVWBR" , typ : "Int32" } , // sign extend int32 to int64
{ name : "MOVDBRloadidx" , argLength : 3 , reg : gploadidx , asm : "MOVDBR" , typ : "Int64" } ,
{ name : "FMOVDloadidx" , argLength : 3 , reg : fploadidx , asm : "FMOVD" , typ : "Float64" } ,
{ name : "FMOVSloadidx" , argLength : 3 , reg : fploadidx , asm : "FMOVS" , typ : "Float32" } ,
2018-09-14 16:30:54 -04:00
2018-03-01 11:40:36 -05:00
// Store bytes in the reverse endian order of the arch into arg0.
2020-01-23 22:19:39 -08:00
// These are indexed stores with no offset field in the instruction so the auxint fields are not used.
{ name : "MOVDBRstore" , argLength : 3 , reg : gpstore , asm : "MOVDBR" , aux : "Sym" , typ : "Mem" , faultOnNilArg0 : true , symEffect : "Write" } , // store 8 bytes reverse order
{ name : "MOVWBRstore" , argLength : 3 , reg : gpstore , asm : "MOVWBR" , aux : "Sym" , typ : "Mem" , faultOnNilArg0 : true , symEffect : "Write" } , // store 4 bytes reverse order
{ name : "MOVHBRstore" , argLength : 3 , reg : gpstore , asm : "MOVHBR" , aux : "Sym" , typ : "Mem" , faultOnNilArg0 : true , symEffect : "Write" } , // store 2 bytes reverse order
2018-03-01 11:40:36 -05:00
// Floating point loads from arg0+aux+auxint
{ name : "FMOVDload" , argLength : 2 , reg : fpload , asm : "FMOVD" , aux : "SymOff" , typ : "Float64" , faultOnNilArg0 : true , symEffect : "Read" } , // load double float
{ name : "FMOVSload" , argLength : 2 , reg : fpload , asm : "FMOVS" , aux : "SymOff" , typ : "Float32" , faultOnNilArg0 : true , symEffect : "Read" } , // load single float
// Store bytes in the endian order of the arch into arg0+aux+auxint
{ name : "MOVBstore" , argLength : 3 , reg : gpstore , asm : "MOVB" , aux : "SymOff" , typ : "Mem" , faultOnNilArg0 : true , symEffect : "Write" } , // store byte
{ name : "MOVHstore" , argLength : 3 , reg : gpstore , asm : "MOVH" , aux : "SymOff" , typ : "Mem" , faultOnNilArg0 : true , symEffect : "Write" } , // store 2 bytes
{ name : "MOVWstore" , argLength : 3 , reg : gpstore , asm : "MOVW" , aux : "SymOff" , typ : "Mem" , faultOnNilArg0 : true , symEffect : "Write" } , // store 4 bytes
{ name : "MOVDstore" , argLength : 3 , reg : gpstore , asm : "MOVD" , aux : "SymOff" , typ : "Mem" , faultOnNilArg0 : true , symEffect : "Write" } , // store 8 bytes
// Store floating point value into arg0+aux+auxint
{ name : "FMOVDstore" , argLength : 3 , reg : fpstore , asm : "FMOVD" , aux : "SymOff" , typ : "Mem" , faultOnNilArg0 : true , symEffect : "Write" } , // store double flot
{ name : "FMOVSstore" , argLength : 3 , reg : fpstore , asm : "FMOVS" , aux : "SymOff" , typ : "Mem" , faultOnNilArg0 : true , symEffect : "Write" } , // store single float
2018-09-14 16:30:54 -04:00
// Stores using index and base registers
2020-03-20 09:59:53 -07:00
// Stores to arg[0] + arg[1]
{ name : "MOVBstoreidx" , argLength : 4 , reg : gpstoreidx , asm : "MOVB" , typ : "Mem" } , // store bye
{ name : "MOVHstoreidx" , argLength : 4 , reg : gpstoreidx , asm : "MOVH" , typ : "Mem" } , // store half word
{ name : "MOVWstoreidx" , argLength : 4 , reg : gpstoreidx , asm : "MOVW" , typ : "Mem" } , // store word
{ name : "MOVDstoreidx" , argLength : 4 , reg : gpstoreidx , asm : "MOVD" , typ : "Mem" } , // store double word
{ name : "FMOVDstoreidx" , argLength : 4 , reg : fpstoreidx , asm : "FMOVD" , typ : "Mem" } , // store double float
{ name : "FMOVSstoreidx" , argLength : 4 , reg : fpstoreidx , asm : "FMOVS" , typ : "Mem" } , // store single float
{ name : "MOVHBRstoreidx" , argLength : 4 , reg : gpstoreidx , asm : "MOVHBR" , typ : "Mem" } , // store half word reversed byte using index reg
{ name : "MOVWBRstoreidx" , argLength : 4 , reg : gpstoreidx , asm : "MOVWBR" , typ : "Mem" } , // store word reversed byte using index reg
{ name : "MOVDBRstoreidx" , argLength : 4 , reg : gpstoreidx , asm : "MOVDBR" , typ : "Mem" } , // store double word reversed byte using index reg
2018-09-14 16:30:54 -04:00
2018-03-01 11:40:36 -05:00
// The following ops store 0 into arg0+aux+auxint arg1=mem
{ name : "MOVBstorezero" , argLength : 2 , reg : gpstorezero , asm : "MOVB" , aux : "SymOff" , typ : "Mem" , faultOnNilArg0 : true , symEffect : "Write" } , // store zero 1 byte
{ name : "MOVHstorezero" , argLength : 2 , reg : gpstorezero , asm : "MOVH" , aux : "SymOff" , typ : "Mem" , faultOnNilArg0 : true , symEffect : "Write" } , // store zero 2 bytes
{ name : "MOVWstorezero" , argLength : 2 , reg : gpstorezero , asm : "MOVW" , aux : "SymOff" , typ : "Mem" , faultOnNilArg0 : true , symEffect : "Write" } , // store zero 4 bytes
{ name : "MOVDstorezero" , argLength : 2 , reg : gpstorezero , asm : "MOVD" , aux : "SymOff" , typ : "Mem" , faultOnNilArg0 : true , symEffect : "Write" } , // store zero 8 bytes
{ name : "MOVDaddr" , argLength : 1 , reg : regInfo { inputs : [ ] regMask { sp | sb | gp } , outputs : [ ] regMask { gp } } , aux : "SymOff" , asm : "MOVD" , rematerializeable : true , symEffect : "Addr" } , // arg0 + auxInt + aux.(*gc.Sym), arg0=SP/SB/GP
2016-07-06 13:32:52 -07:00
2016-10-05 13:21:09 -07:00
{ name : "MOVDconst" , argLength : 0 , reg : gp01 , aux : "Int64" , asm : "MOVD" , typ : "Int64" , rematerializeable : true } , //
{ name : "FMOVDconst" , argLength : 0 , reg : fp01 , aux : "Float64" , asm : "FMOVD" , rematerializeable : true } , //
{ name : "FMOVSconst" , argLength : 0 , reg : fp01 , aux : "Float32" , asm : "FMOVS" , rematerializeable : true } , //
2016-06-24 14:37:17 -05:00
{ name : "FCMPU" , argLength : 2 , reg : fp2cr , asm : "FCMPU" , typ : "Flags" } ,
{ name : "CMP" , argLength : 2 , reg : gp2cr , asm : "CMP" , typ : "Flags" } , // arg0 compare to arg1
{ name : "CMPU" , argLength : 2 , reg : gp2cr , asm : "CMPU" , typ : "Flags" } , // arg0 compare to arg1
{ name : "CMPW" , argLength : 2 , reg : gp2cr , asm : "CMPW" , typ : "Flags" } , // arg0 compare to arg1
{ name : "CMPWU" , argLength : 2 , reg : gp2cr , asm : "CMPWU" , typ : "Flags" } , // arg0 compare to arg1
2016-08-02 13:17:09 -07:00
{ name : "CMPconst" , argLength : 1 , reg : gp1cr , asm : "CMP" , aux : "Int64" , typ : "Flags" } ,
{ name : "CMPUconst" , argLength : 1 , reg : gp1cr , asm : "CMPU" , aux : "Int64" , typ : "Flags" } ,
{ name : "CMPWconst" , argLength : 1 , reg : gp1cr , asm : "CMPW" , aux : "Int32" , typ : "Flags" } ,
{ name : "CMPWUconst" , argLength : 1 , reg : gp1cr , asm : "CMPWU" , aux : "Int32" , typ : "Flags" } ,
2016-06-24 14:37:17 -05:00
2019-09-12 09:22:07 -04:00
// ISEL auxInt values 0=LT 1=GT 2=EQ arg2 ? arg0 : arg1
// ISEL auxInt values 4=GE 5=LE 6=NE arg2 ? arg1 : arg0
// ISELB special case where arg0, arg1 values are 0, 1 for boolean result
{ name : "ISEL" , argLength : 3 , reg : crgp21 , asm : "ISEL" , aux : "Int32" , typ : "Int32" } , // see above
{ name : "ISELB" , argLength : 2 , reg : crgp11 , asm : "ISEL" , aux : "Int32" , typ : "Int32" } , // see above
2016-06-24 14:37:17 -05:00
// pseudo-ops
2016-08-10 11:44:57 -07:00
{ name : "Equal" , argLength : 1 , reg : crgp } , // bool, true flags encode x==y false otherwise.
{ name : "NotEqual" , argLength : 1 , reg : crgp } , // bool, true flags encode x!=y false otherwise.
{ name : "LessThan" , argLength : 1 , reg : crgp } , // bool, true flags encode x<y false otherwise.
{ name : "FLessThan" , argLength : 1 , reg : crgp } , // bool, true flags encode x<y false otherwise.
{ name : "LessEqual" , argLength : 1 , reg : crgp } , // bool, true flags encode x<=y false otherwise.
{ name : "FLessEqual" , argLength : 1 , reg : crgp } , // bool, true flags encode x<=y false otherwise; PPC <= === !> which is wrong for NaN
{ name : "GreaterThan" , argLength : 1 , reg : crgp } , // bool, true flags encode x>y false otherwise.
{ name : "FGreaterThan" , argLength : 1 , reg : crgp } , // bool, true flags encode x>y false otherwise.
{ name : "GreaterEqual" , argLength : 1 , reg : crgp } , // bool, true flags encode x>=y false otherwise.
{ name : "FGreaterEqual" , argLength : 1 , reg : crgp } , // bool, true flags encode x>=y false otherwise.; PPC >= === !< which is wrong for NaN
2016-07-26 09:24:18 -07:00
// Scheduler ensures LoweredGetClosurePtr occurs only in entry block,
// and sorts it to the very beginning of the block to prevent other
// use of the closure pointer.
2018-02-28 16:30:07 -05:00
{ name : "LoweredGetClosurePtr" , reg : regInfo { outputs : [ ] regMask { ctxt } } , zeroWidth : true } ,
2016-07-26 09:24:18 -07:00
2017-10-09 15:33:29 -04:00
// LoweredGetCallerSP returns the SP of the caller of the current function.
{ name : "LoweredGetCallerSP" , reg : gp01 , rematerializeable : true } ,
2018-05-02 14:25:00 +08:00
// LoweredGetCallerPC evaluates to the PC to which its "caller" will return.
// I.e., if f calls g "calls" getcallerpc,
// the result should be the PC within f that g will return to.
// See runtime/stubs.go for a more detailed discussion.
{ name : "LoweredGetCallerPC" , reg : gp01 , rematerializeable : true } ,
2016-07-26 09:24:18 -07:00
//arg0=ptr,arg1=mem, returns void. Faults if ptr is nil.
2016-09-27 14:39:27 -07:00
{ name : "LoweredNilCheck" , argLength : 2 , reg : regInfo { inputs : [ ] regMask { gp | sp | sb } , clobbers : tmp } , clobberFlags : true , nilCheck : true , faultOnNilArg0 : true } ,
2017-03-13 14:39:17 -04:00
// Round ops to block fused-multiply-add extraction.
2018-02-28 16:30:07 -05:00
{ name : "LoweredRound32F" , argLength : 1 , reg : fp11 , resultInArg0 : true , zeroWidth : true } ,
{ name : "LoweredRound64F" , argLength : 1 , reg : fp11 , resultInArg0 : true , zeroWidth : true } ,
2016-07-26 09:24:18 -07:00
2020-06-12 13:48:26 -04:00
{ name : "CALLstatic" , argLength : 1 , reg : regInfo { clobbers : callerSave } , aux : "CallOff" , clobberFlags : true , call : true } , // call static function aux.(*obj.LSym). arg0=mem, auxint=argsize, returns mem
2017-09-11 10:39:24 -04:00
{ name : "CALLclosure" , argLength : 3 , reg : regInfo { inputs : [ ] regMask { callptr , ctxt , 0 } , clobbers : callerSave } , aux : "Int64" , clobberFlags : true , call : true } , // call function via closure. arg0=codeptr, arg1=closure, arg2=mem, auxint=argsize, returns mem
{ name : "CALLinter" , argLength : 2 , reg : regInfo { inputs : [ ] regMask { callptr } , clobbers : callerSave } , aux : "Int64" , clobberFlags : true , call : true } , // call fn by pointer. arg0=codeptr, arg1=mem, auxint=argsize, returns mem
2016-07-26 09:24:18 -07:00
2016-07-27 13:54:07 -07:00
// large or unaligned zeroing
// arg0 = address of memory to zero (in R3, changed as side effect)
// returns mem
2017-03-13 10:16:30 -04:00
//
// a loop is generated when there is more than one iteration
// needed to clear 4 doublewords
//
2019-10-04 16:03:36 -04:00
// XXLXOR VS32,VS32,VS32
2017-03-13 10:16:30 -04:00
// MOVD $len/32,R31
// MOVD R31,CTR
2019-10-04 16:03:36 -04:00
// MOVD $16,R31
2017-03-13 10:16:30 -04:00
// loop:
2019-10-04 16:03:36 -04:00
// STXVD2X VS32,(R0)(R3)
// STXVD2X VS32,(R31),R3)
2017-03-13 10:16:30 -04:00
// ADD R3,32
// BC loop
// remaining doubleword clears generated as needed
// MOVD R0,(R3)
// MOVD R0,8(R3)
// MOVD R0,16(R3)
// MOVD R0,24(R3)
// one or more of these to clear remainder < 8 bytes
// MOVW R0,n1(R3)
// MOVH R0,n2(R3)
// MOVB R0,n3(R3)
2016-07-27 13:54:07 -07:00
{
name : "LoweredZero" ,
aux : "Int64" ,
2017-03-13 10:16:30 -04:00
argLength : 2 ,
2016-07-27 13:54:07 -07:00
reg : regInfo {
2020-03-30 15:23:19 -04:00
inputs : [ ] regMask { buildReg ( "R20" ) } ,
clobbers : buildReg ( "R20" ) ,
2016-07-27 13:54:07 -07:00
} ,
2016-09-13 17:01:01 -07:00
clobberFlags : true ,
typ : "Mem" ,
faultOnNilArg0 : true ,
2019-10-28 00:50:39 -04:00
unsafePoint : true ,
2016-07-27 13:54:07 -07:00
} ,
2020-03-30 15:23:19 -04:00
{
name : "LoweredZeroShort" ,
aux : "Int64" ,
argLength : 2 ,
reg : regInfo {
inputs : [ ] regMask { gp } } ,
typ : "Mem" ,
faultOnNilArg0 : true ,
unsafePoint : true ,
} ,
{
name : "LoweredQuadZeroShort" ,
aux : "Int64" ,
argLength : 2 ,
reg : regInfo {
inputs : [ ] regMask { gp } ,
} ,
typ : "Mem" ,
faultOnNilArg0 : true ,
unsafePoint : true ,
} ,
{
name : "LoweredQuadZero" ,
aux : "Int64" ,
argLength : 2 ,
reg : regInfo {
inputs : [ ] regMask { buildReg ( "R20" ) } ,
clobbers : buildReg ( "R20" ) ,
} ,
clobberFlags : true ,
typ : "Mem" ,
faultOnNilArg0 : true ,
unsafePoint : true ,
} ,
2019-10-04 16:03:36 -04:00
// R31 is temp register
2017-03-30 11:07:36 -04:00
// Loop code:
2019-10-04 16:03:36 -04:00
// MOVD len/32,R31 set up loop ctr
// MOVD R31,CTR
// MOVD $16,R31 index register
2017-03-30 11:07:36 -04:00
// loop:
2019-10-04 16:03:36 -04:00
// LXVD2X (R0)(R4),VS32
// LXVD2X (R31)(R4),VS33
// ADD R4,$32 increment src
// STXVD2X VS32,(R0)(R3)
// STXVD2X VS33,(R31)(R3)
// ADD R3,$32 increment dst
// BC 16,0,loop branch ctr
// For this purpose, VS32 and VS33 are treated as
// scratch registers. Since regalloc does not
// track vector registers, even if it could be marked
// as clobbered it would have no effect.
// TODO: If vector registers are managed by regalloc
// mark these as clobbered.
//
2017-03-30 11:07:36 -04:00
// Bytes not moved by this loop are moved
// with a combination of the following instructions,
// starting with the largest sizes and generating as
// many as needed, using the appropriate offset value.
2019-10-04 16:03:36 -04:00
// MOVD n(R4),R14
// MOVD R14,n(R3)
// MOVW n1(R4),R14
// MOVW R14,n1(R3)
// MOVH n2(R4),R14
// MOVH R14,n2(R3)
// MOVB n3(R4),R14
// MOVB R14,n3(R3)
2016-07-27 13:54:07 -07:00
{
name : "LoweredMove" ,
aux : "Int64" ,
2017-03-30 11:07:36 -04:00
argLength : 3 ,
2016-07-27 13:54:07 -07:00
reg : regInfo {
2020-03-30 15:23:19 -04:00
inputs : [ ] regMask { buildReg ( "R20" ) , buildReg ( "R21" ) } ,
clobbers : buildReg ( "R20 R21" ) ,
2016-07-27 13:54:07 -07:00
} ,
2016-09-13 17:01:01 -07:00
clobberFlags : true ,
typ : "Mem" ,
faultOnNilArg0 : true ,
faultOnNilArg1 : true ,
2019-10-28 00:50:39 -04:00
unsafePoint : true ,
2016-07-27 13:54:07 -07:00
} ,
2020-03-30 15:23:19 -04:00
{
name : "LoweredMoveShort" ,
aux : "Int64" ,
argLength : 3 ,
reg : regInfo {
inputs : [ ] regMask { gp , gp } ,
} ,
typ : "Mem" ,
faultOnNilArg0 : true ,
faultOnNilArg1 : true ,
unsafePoint : true ,
} ,
// The following is similar to the LoweredMove, but uses
// LXV instead of LXVD2X, which does not require an index
// register and will do 4 in a loop instead of only.
{
name : "LoweredQuadMove" ,
aux : "Int64" ,
argLength : 3 ,
reg : regInfo {
inputs : [ ] regMask { buildReg ( "R20" ) , buildReg ( "R21" ) } ,
clobbers : buildReg ( "R20 R21" ) ,
} ,
clobberFlags : true ,
typ : "Mem" ,
faultOnNilArg0 : true ,
faultOnNilArg1 : true ,
unsafePoint : true ,
} ,
{
name : "LoweredQuadMoveShort" ,
aux : "Int64" ,
argLength : 3 ,
reg : regInfo {
inputs : [ ] regMask { gp , gp } ,
} ,
typ : "Mem" ,
faultOnNilArg0 : true ,
faultOnNilArg1 : true ,
unsafePoint : true ,
} ,
2016-08-02 13:17:09 -07:00
2019-10-23 10:20:49 -04:00
{ name : "LoweredAtomicStore8" , argLength : 3 , reg : gpstore , typ : "Mem" , aux : "Int64" , faultOnNilArg0 : true , hasSideEffects : true } ,
2018-08-06 15:36:16 -05:00
{ name : "LoweredAtomicStore32" , argLength : 3 , reg : gpstore , typ : "Mem" , aux : "Int64" , faultOnNilArg0 : true , hasSideEffects : true } ,
{ name : "LoweredAtomicStore64" , argLength : 3 , reg : gpstore , typ : "Mem" , aux : "Int64" , faultOnNilArg0 : true , hasSideEffects : true } ,
2017-02-10 17:45:12 -05:00
2019-03-28 14:58:06 -04:00
{ name : "LoweredAtomicLoad8" , argLength : 2 , reg : gpload , typ : "UInt8" , aux : "Int64" , clobberFlags : true , faultOnNilArg0 : true } ,
2018-08-06 15:36:16 -05:00
{ name : "LoweredAtomicLoad32" , argLength : 2 , reg : gpload , typ : "UInt32" , aux : "Int64" , clobberFlags : true , faultOnNilArg0 : true } ,
{ name : "LoweredAtomicLoad64" , argLength : 2 , reg : gpload , typ : "Int64" , aux : "Int64" , clobberFlags : true , faultOnNilArg0 : true } ,
{ name : "LoweredAtomicLoadPtr" , argLength : 2 , reg : gpload , typ : "Int64" , aux : "Int64" , clobberFlags : true , faultOnNilArg0 : true } ,
2017-02-10 17:45:12 -05:00
// atomic add32, 64
// SYNC
// LDAR (Rarg0), Rout
// ADD Rarg1, Rout
// STDCCC Rout, (Rarg0)
// BNE -3(PC)
// ISYNC
// return new sum
{ name : "LoweredAtomicAdd32" , argLength : 3 , reg : gpxchg , resultNotInArgs : true , clobberFlags : true , faultOnNilArg0 : true , hasSideEffects : true } ,
{ name : "LoweredAtomicAdd64" , argLength : 3 , reg : gpxchg , resultNotInArgs : true , clobberFlags : true , faultOnNilArg0 : true , hasSideEffects : true } ,
// atomic exchange32, 64
// SYNC
// LDAR (Rarg0), Rout
// STDCCC Rarg1, (Rarg0)
// BNE -2(PC)
// ISYNC
// return old val
{ name : "LoweredAtomicExchange32" , argLength : 3 , reg : gpxchg , resultNotInArgs : true , clobberFlags : true , faultOnNilArg0 : true , hasSideEffects : true } ,
{ name : "LoweredAtomicExchange64" , argLength : 3 , reg : gpxchg , resultNotInArgs : true , clobberFlags : true , faultOnNilArg0 : true , hasSideEffects : true } ,
// atomic compare and swap.
// arg0 = pointer, arg1 = old value, arg2 = new value, arg3 = memory. auxint must be zero.
// if *arg0 == arg1 {
// *arg0 = arg2
// return (true, memory)
// } else {
// return (false, memory)
// }
// SYNC
// LDAR (Rarg0), Rtmp
// CMP Rarg1, Rtmp
// BNE 3(PC)
// STDCCC Rarg2, (Rarg0)
// BNE -4(PC)
// CBNZ Rtmp, -4(PC)
// CSET EQ, Rout
2018-08-06 15:36:16 -05:00
{ name : "LoweredAtomicCas64" , argLength : 4 , reg : gpcas , resultNotInArgs : true , aux : "Int64" , clobberFlags : true , faultOnNilArg0 : true , hasSideEffects : true } ,
{ name : "LoweredAtomicCas32" , argLength : 4 , reg : gpcas , resultNotInArgs : true , aux : "Int64" , clobberFlags : true , faultOnNilArg0 : true , hasSideEffects : true } ,
2017-02-10 17:45:12 -05:00
// atomic 8 and/or.
// *arg0 &= (|=) arg1. arg2=mem. returns memory. auxint must be zero.
// LBAR (Rarg0), Rtmp
// AND/OR Rarg1, Rtmp
// STBCCC Rtmp, (Rarg0), Rtmp
// BNE Rtmp, -3(PC)
{ name : "LoweredAtomicAnd8" , argLength : 3 , reg : gpstore , asm : "AND" , faultOnNilArg0 : true , hasSideEffects : true } ,
{ name : "LoweredAtomicOr8" , argLength : 3 , reg : gpstore , asm : "OR" , faultOnNilArg0 : true , hasSideEffects : true } ,
2017-11-15 14:54:24 -08:00
// LoweredWB invokes runtime.gcWriteBarrier. arg0=destptr, arg1=srcptr, arg2=mem, aux=runtime.gcWriteBarrier
cmd/compile, runtime: mark R12 clobbered for write barrier call on PPC64
When external linking, for large binaries, the external linker
may insert a trampoline for the write barrier call, which looks
0000000005a98cc8 <__long_branch_runtime.gcWriteBarrier>:
5a98cc8: 86 01 82 3d addis r12,r2,390
5a98ccc: d8 bd 8c e9 ld r12,-16936(r12)
5a98cd0: a6 03 89 7d mtctr r12
5a98cd4: 20 04 80 4e bctr
It clobbers R12 (and CTR, which is never live across a call).
As at compile time we don't know whether the binary is big and
what link mode will be used, I think we need to mark R12 as
clobbered for write barrier call. For extra safety (future-proof)
we mark caller-saved register that cannot be used for function
arguments, which includes R11, as potentially clobbered as well.
Fixes #40851.
Change-Id: Iedd901c5072f1127cc59b0a48cfeb4aaec81b519
Reviewed-on: https://go-review.googlesource.com/c/go/+/248917
Run-TryBot: Cherry Zhang <cherryyz@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Austin Clements <austin@google.com>
2020-08-17 19:06:19 -04:00
// It preserves R0 through R17 (except special registers R1, R2, R11, R12, R13), g, and its arguments R20 and R21,
2017-11-15 14:54:24 -08:00
// but may clobber anything else, including R31 (REGTMP).
cmd/compile, runtime: mark R12 clobbered for write barrier call on PPC64
When external linking, for large binaries, the external linker
may insert a trampoline for the write barrier call, which looks
0000000005a98cc8 <__long_branch_runtime.gcWriteBarrier>:
5a98cc8: 86 01 82 3d addis r12,r2,390
5a98ccc: d8 bd 8c e9 ld r12,-16936(r12)
5a98cd0: a6 03 89 7d mtctr r12
5a98cd4: 20 04 80 4e bctr
It clobbers R12 (and CTR, which is never live across a call).
As at compile time we don't know whether the binary is big and
what link mode will be used, I think we need to mark R12 as
clobbered for write barrier call. For extra safety (future-proof)
we mark caller-saved register that cannot be used for function
arguments, which includes R11, as potentially clobbered as well.
Fixes #40851.
Change-Id: Iedd901c5072f1127cc59b0a48cfeb4aaec81b519
Reviewed-on: https://go-review.googlesource.com/c/go/+/248917
Run-TryBot: Cherry Zhang <cherryyz@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Austin Clements <austin@google.com>
2020-08-17 19:06:19 -04:00
{ name : "LoweredWB" , argLength : 3 , reg : regInfo { inputs : [ ] regMask { buildReg ( "R20" ) , buildReg ( "R21" ) } , clobbers : ( callerSave &^ buildReg ( "R0 R3 R4 R5 R6 R7 R8 R9 R10 R14 R15 R16 R17 R20 R21 g" ) ) | buildReg ( "R31" ) } , clobberFlags : true , aux : "Sym" , symEffect : "None" } ,
2017-11-15 14:54:24 -08:00
2019-02-06 14:12:36 -08:00
// There are three of these functions so that they can have three different register inputs.
// When we check 0 <= c <= cap (A), then 0 <= b <= c (B), then 0 <= a <= b (C), we want the
// default registers to match so we don't need to copy registers around unnecessarily.
2020-04-27 15:58:16 -04:00
{ name : "LoweredPanicBoundsA" , argLength : 3 , aux : "Int64" , reg : regInfo { inputs : [ ] regMask { r5 , r6 } } , typ : "Mem" , call : true } , // arg0=idx, arg1=len, arg2=mem, returns memory. AuxInt contains report code (see PanicBounds in genericOps.go).
{ name : "LoweredPanicBoundsB" , argLength : 3 , aux : "Int64" , reg : regInfo { inputs : [ ] regMask { r4 , r5 } } , typ : "Mem" , call : true } , // arg0=idx, arg1=len, arg2=mem, returns memory. AuxInt contains report code (see PanicBounds in genericOps.go).
{ name : "LoweredPanicBoundsC" , argLength : 3 , aux : "Int64" , reg : regInfo { inputs : [ ] regMask { r3 , r4 } } , typ : "Mem" , call : true } , // arg0=idx, arg1=len, arg2=mem, returns memory. AuxInt contains report code (see PanicBounds in genericOps.go).
2019-02-06 14:12:36 -08:00
2016-08-02 13:17:09 -07:00
// (InvertFlags (CMP a b)) == (CMP b a)
// So if we want (LessThan (CMP a b)) but we can't do that because a is a constant,
// then we do (LessThan (InvertFlags (CMP b a))) instead.
// Rewrites will convert this to (GreaterThan (CMP b a)).
// InvertFlags is a pseudo-op which can't appear in assembly output.
{ name : "InvertFlags" , argLength : 1 } , // reverse direction of arg0
// Constant flag values. For any comparison, there are 3 possible
// outcomes: either the three from the signed total order (<,==,>)
// or the three from the unsigned total order, depending on which
// comparison operation was used (CMP or CMPU -- PPC is different from
// the other architectures, which have a single comparison producing
// both signed and unsigned comparison results.)
// These ops are for temporary use by rewrite rules. They
// cannot appear in the generated assembly.
2020-08-20 15:06:06 -05:00
{ name : "FlagEQ" } , // equal
{ name : "FlagLT" } , // signed < or unsigned <
{ name : "FlagGT" } , // signed > or unsigned >
2016-06-24 14:37:17 -05:00
}
blocks := [ ] blockData {
2019-08-12 20:19:58 +01:00
{ name : "EQ" , controls : 1 } ,
{ name : "NE" , controls : 1 } ,
{ name : "LT" , controls : 1 } ,
{ name : "LE" , controls : 1 } ,
{ name : "GT" , controls : 1 } ,
{ name : "GE" , controls : 1 } ,
{ name : "FLT" , controls : 1 } ,
{ name : "FLE" , controls : 1 } ,
{ name : "FGT" , controls : 1 } ,
{ name : "FGE" , controls : 1 } ,
2016-06-24 14:37:17 -05:00
}
archs = append ( archs , arch {
name : "PPC64" ,
pkg : "cmd/internal/obj/ppc64" ,
genfile : "../../ppc64/ssa.go" ,
ops : ops ,
blocks : blocks ,
regnames : regNamesPPC64 ,
gpregmask : gp ,
fpregmask : fp ,
framepointerreg : int8 ( num [ "SP" ] ) ,
2016-10-06 15:06:45 -04:00
linkreg : - 1 , // not used
2016-06-24 14:37:17 -05:00
} )
}