{ David Zhang 2007/01/15 $Id: ncpumat.pas,v 1.23 2005/02/14 17:13:10 peter Exp $ Copyright (c) 1998-2002 by Florian Klaempfl Generate MIPSel assembler for math nodes This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. **************************************************************************** } unit ncpumat; {$i fpcdefs.inc} interface uses symtype, node, nmat, ncgmat, cgbase; type tMIPSELmoddivnode = class(tmoddivnode) procedure pass_generate_code;override; end; tMIPSELshlshrnode = class(tcgshlshrnode) procedure second_64bit;override; { everything will be handled in pass_2 } function first_shlshr64bitint: tnode; override; end; tMIPSELnotnode = class(tcgnotnode) procedure second_boolean; override; end; TMIPSunaryminusnode = class(tcgunaryminusnode) procedure second_float; override; end; implementation uses globtype, systems, cutils, verbose, globals, symconst, symdef, aasmbase, aasmcpu, aasmtai, aasmdata, defutil, procinfo, cgobj, hlcgobj, pass_2, ncon, cpubase, ncgutil, cgcpu, cgutils; {***************************************************************************** TMipselMODDIVNODE *****************************************************************************} const ops_div: array[boolean] of tasmop = (A_DIVU, A_DIV); procedure tMIPSELmoddivnode.pass_generate_code; var power: longint; tmpreg, numerator, divider: tregister; hl,hl2: tasmlabel; begin secondpass(left); secondpass(right); location_reset(location,LOC_REGISTER,def_cgsize(resultdef)); location.register:=cg.GetIntRegister(current_asmdata.CurrAsmList,OS_INT); { put numerator in register } hlcg.location_force_reg(current_asmdata.CurrAsmList, left.location, left.resultdef, left.resultdef, True); numerator := left.location.Register; if (nodetype = divn) and (right.nodetype = ordconstn) then begin if ispowerof2(tordconstnode(right).Value.svalue, power) then begin tmpreg := cg.GetIntRegister(current_asmdata.CurrAsmList, OS_INT); cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, OP_SAR, OS_INT, 31, numerator, tmpreg); { if signed, tmpreg=right value-1, otherwise 0 } cg.a_op_const_reg(current_asmdata.CurrAsmList, OP_AND, OS_INT, tordconstnode(right).Value.svalue - 1, tmpreg); { add left value } cg.a_op_reg_reg(current_asmdata.CurrAsmList, OP_ADD, OS_INT, numerator, tmpreg); cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, OP_SAR, OS_INT, aword(power), tmpreg, location.register); end else cg.g_div_const_reg_reg(current_asmdata.CurrAsmList,def_cgsize(resultdef), tordconstnode(right).value.svalue,numerator,location.register); end else begin { load divider in a register if necessary } hlcg.location_force_reg(current_asmdata.CurrAsmList, right.location, right.resultdef, right.resultdef, True); divider := right.location.Register; { GAS performs division in delay slot: bne denom,$zero,.L1 div $zero,numerator,denom break 7 .L1: mflo result We can't yet do the same without prior fixing the spilling code: if registers require spilling, loads can be inserted before 'div', resulting in invalid code. } current_asmdata.CurrAsmList.Concat(taicpu.op_reg_reg_reg(ops_div[is_signed(resultdef)],NR_R0,numerator,divider)); { Check for zero denominator, omit if dividing by constant (constants are checked earlier) } if (right.nodetype<>ordconstn) then begin current_asmdata.getjumplabel(hl); cg.a_cmp_reg_reg_label(current_asmdata.CurrAsmList,OS_INT,OC_NE,divider,NR_R0,hl); current_asmdata.CurrAsmList.Concat(taicpu.op_const(A_BREAK,7)); cg.a_label(current_asmdata.CurrAsmList,hl); end; { Dividing low(longint) by -1 will overflow } if is_signed(right.resultdef) and (cs_check_overflow in current_settings.localswitches) then begin current_asmdata.getjumplabel(hl2); current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg_const(A_ADDIU,NR_R1,NR_R0,-1)); cg.a_cmp_reg_reg_label(current_asmdata.CurrAsmList,OS_INT,OC_NE,divider,NR_R1,hl2); current_asmdata.CurrAsmList.concat(taicpu.op_reg_const(A_LUI,NR_R1,$8000)); cg.a_cmp_reg_reg_label(current_asmdata.CurrAsmList,OS_INT,OC_NE,numerator,NR_R1,hl2); current_asmdata.CurrAsmList.concat(taicpu.op_const(A_BREAK,6)); cg.a_label(current_asmdata.CurrAsmList,hl2); end; if (nodetype=modn) then current_asmdata.CurrAsmList.concat(taicpu.op_reg(A_MFHI,location.register)) else current_asmdata.CurrAsmList.concat(taicpu.op_reg(A_MFLO,location.register)); end; end; {***************************************************************************** TMIPSelSHLRSHRNODE *****************************************************************************} function TMIPSELShlShrNode.first_shlshr64bitint: TNode; begin { 64bit without constants need a helper } if is_64bit(left.resultdef) and (right.nodetype <> ordconstn) then begin Result := inherited first_shlshr64bitint; exit; end; Result := nil; end; procedure tMIPSELshlshrnode.second_64bit; var hregister, hreg64hi, hreg64lo: tregister; op: topcg; shiftval: aword; const ops: array [boolean] of topcg = (OP_SHR,OP_SHL); begin { 64bit without constants need a helper, and is already replaced in pass1 } if (right.nodetype <> ordconstn) then internalerror(200405301); location_reset(location, LOC_REGISTER, def_cgsize(resultdef)); { load left operator in a register } hlcg.location_force_reg(current_asmdata.CurrAsmList, left.location, left.resultdef, resultdef, true); hreg64hi := left.location.register64.reghi; hreg64lo := left.location.register64.reglo; shiftval := tordconstnode(right).Value.svalue and 63; op := ops[nodetype=shln]; if shiftval > 31 then begin if nodetype = shln then begin location.register64.reglo:=NR_R0; location.register64.reghi:=cg.GetIntRegister(current_asmdata.CurrAsmList,OS_32); { if shiftval and 31 = 0, it will optimize to MOVE } cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, OP_SHL, OS_32, shiftval and 31, hreg64lo, location.register64.reghi); end else begin location.register64.reghi:=NR_R0; location.register64.reglo:=cg.GetIntRegister(current_asmdata.CurrAsmList,OS_32); cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, OP_SHR, OS_32, shiftval and 31, hreg64hi, location.register64.reglo); end; end else begin location.register64.reglo:=cg.GetIntRegister(current_asmdata.CurrAsmList,OS_32); location.register64.reghi:=cg.GetIntRegister(current_asmdata.CurrAsmList,OS_32); hregister := cg.getintregister(current_asmdata.CurrAsmList, OS_32); cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, op, OS_32, shiftval, hreg64hi, location.register64.reghi); cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, op, OS_32, shiftval, hreg64lo, location.register64.reglo); if shiftval <> 0 then begin if nodetype = shln then begin cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, OP_SHR, OS_32, 32-shiftval, hreg64lo, hregister); cg.a_op_reg_reg_reg(current_asmdata.CurrAsmList, OP_OR, OS_32, hregister, location.register64.reghi, location.register64.reghi); end else begin cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, OP_SHL, OS_32, 32-shiftval, hreg64hi, hregister); cg.a_op_reg_reg_reg(current_asmdata.CurrAsmList, OP_OR, OS_32, hregister, location.register64.reglo, location.register64.reglo); end; end; end; end; {***************************************************************************** TMIPSelNOTNODE *****************************************************************************} procedure tMIPSELnotnode.second_boolean; var tmpreg : TRegister; begin secondpass(left); if not handle_locjump then begin case left.location.loc of LOC_REGISTER, LOC_CREGISTER, LOC_REFERENCE, LOC_CREFERENCE, LOC_SUBSETREG,LOC_CSUBSETREG,LOC_SUBSETREF,LOC_CSUBSETREF: begin hlcg.location_force_reg(current_asmdata.CurrAsmList, left.location, left.resultdef, left.resultdef, True); location_reset(location,LOC_FLAGS,OS_NO); location.resflags.reg2:=NR_R0; location.resflags.cond:=OC_EQ; if is_64bit(resultdef) then begin tmpreg:=cg.GetIntRegister(current_asmdata.CurrAsmList,OS_INT); { OR low and high parts together } current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg_reg(A_OR,tmpreg,left.location.register64.reglo,left.location.register64.reghi)); location.resflags.reg1:=tmpreg; end else location.resflags.reg1:=left.location.register; end; else internalerror(2003042401); end; end; end; {***************************************************************************** TMIPSunaryminusnode *****************************************************************************} procedure TMIPSunaryminusnode.second_float; begin secondpass(left); hlcg.location_force_fpureg(current_asmdata.CurrAsmList,left.location,left.resultdef,true); location_reset(location,LOC_FPUREGISTER,def_cgsize(resultdef)); location.register:=cg.getfpuregister(current_asmdata.CurrAsmList,location.size); case location.size of OS_F32: current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg(A_NEG_s,location.register,left.location.register)); OS_F64: current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg(A_NEG_d,location.register,left.location.register)); else internalerror(2013030501); end; end; begin cmoddivnode := tMIPSELmoddivnode; cshlshrnode := tMIPSELshlshrnode; cnotnode := tMIPSELnotnode; cunaryminusnode := TMIPSunaryminusnode; end.