cgcpu.pas 54 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
7127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427
  1. {
  2. Copyright (c) 2014 by Jonas Maebe
  3. This unit implements the code generator for Xtensa
  4. This program is free software; you can redistribute it and/or modify
  5. it under the terms of the GNU General Public License as published by
  6. the Free Software Foundation; either version 2 of the License, or
  7. (at your option) any later version.
  8. This program is distributed in the hope that it will be useful,
  9. but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  11. GNU General Public License for more details.
  12. You should have received a copy of the GNU General Public License
  13. along with this program; if not, write to the Free Software
  14. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  15. ****************************************************************************
  16. }
  17. unit cgcpu;
  18. {$i fpcdefs.inc}
  19. interface
  20. uses
  21. globtype,parabase,
  22. cgbase,cgutils,cgobj,
  23. aasmbase,aasmtai,aasmdata,aasmcpu,
  24. cpubase,cpuinfo,
  25. node,symconst,SymType,symdef,
  26. rgcpu,
  27. cg64f32;
  28. type
  { Xtensa implementation of the low-level code generator interface.
    Every method marked "override" replaces the corresponding tcg primitive
    with an Xtensa instruction sequence. }
  tcgcpu=class(tcg)
  private
    { Rewrites ref in place; on return it has no symbol, no index register
      and a zero offset, i.e. it is a plain base-register reference. }
    procedure fixref(list : TAsmList; var ref : treference);
    procedure g_concatcopy_move(list : tasmlist; const Source,dest : treference; len : tcgint);
  public
    { creation/destruction of the int, fpu and special (boolean) register allocators }
    procedure init_register_allocators;override;
    procedure done_register_allocators;override;
    { move instructions }
    procedure a_load_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister);override;
    procedure a_load_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister;const ref: TReference);override;
    procedure a_load_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: TReference; reg: tregister);override;
    procedure a_load_const_reg(list: TAsmList; size: tcgsize; a: tcgint; reg: tregister);override;
    procedure a_loadaddr_ref_reg(list: TAsmList; const ref: TReference; r: tregister);override;
    { arithmetic/logic operations }
    procedure a_op_reg_reg(list: TAsmList; op: topcg; size: tcgsize; src, dst: tregister);override;
    procedure a_op_const_reg(list: TAsmList; op: topcg; size: tcgsize; a: tcgint; reg: tregister);override;
    procedure a_op_reg_reg_reg(list: TAsmList; op: topcg; size: tcgsize; src1, src2, dst: tregister);override;
    procedure a_op_const_reg_reg(list : TAsmList; op : TOpCg; size : tcgsize; a : tcgint; src,dst : tregister);override;
    { calls and jumps }
    procedure a_call_name(list:TAsmList;const s:string; weak: boolean);override;
    procedure a_call_reg(list:TAsmList;Reg:tregister);override;
    procedure a_jmp_name(list: TAsmList; const s: string);override;
    procedure a_jmp_flags(list: TAsmList; const f: TResFlags; l: tasmlabel);override;
    { procedure prologue/epilogue }
    procedure g_proc_entry(list: TAsmList; localsize: longint; nostackframe: boolean);override;
    procedure g_proc_exit(list: TAsmList; parasize: longint; nostackframe: boolean);override;
    { comparison operations }
    procedure a_cmp_const_reg_label(list: TAsmList; size: tcgsize; cmp_op: topcmp; a: tcgint; reg: tregister; l: tasmlabel); override;
    procedure a_cmp_reg_reg_label(list: TAsmList; size: tcgsize; cmp_op: topcmp; reg1, reg2: tregister; l: tasmlabel);override;
    procedure a_jmp_always(list: TAsmList; l: TAsmLabel);override;
    procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: tresflags; reg: TRegister);override;
    procedure g_concatcopy(list : TAsmList; const source,dest : treference; len : tcgint);override;
    { floating point loads/stores }
    procedure a_loadfpu_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister);override;
    procedure a_loadfpu_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister);override;
    procedure a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference);override;
    { Xtensa-specific helper (not an override); called after every emitted
      arithmetic operation in this unit with the operation, size and
      destination register }
    procedure maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
    procedure g_overflowcheck(list: TAsmList; const Loc:tlocation; def:tdef);override;
  end;
  { 64 bit operations for Xtensa, built on the generic
    "64 bit on a 32 bit cpu" code generator tcg64f32. }
  tcg64fxtensa = class(tcg64f32)
    procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
    procedure a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);override;
    procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
    procedure a_op64_reg_reg_reg(list : TAsmList; op : TOpCG;size : tcgsize; regsrc1,regsrc2,regdst : tregister64);override;
    { The declarations below are disabled; the first two merely repeat the
      active a_op64_reg_reg_reg declaration above. }
    //procedure a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);override;
    //procedure a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);override;
    //procedure a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
    //procedure a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
    //procedure a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);override;
    //procedure a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);override;
  end;
  76. procedure create_codegen;
  const
    { Lookup table from a generic operation (topcg) to the Xtensa opcode
      used for it by a_op_reg_reg_reg.  The entries must stay in the
      declaration order of topcg, which is defined outside this unit.
      NOTE(review): A_NONE presumably marks operations that have no direct
      single-instruction form here (some of them, such as OP_NOT, are
      expanded by hand in the implementation) - confirm before relying on it. }
    TOpCG2AsmOp: array[topcg] of TAsmOp = (
      A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MULL,A_MULL,A_NEG,A_NONE,A_OR,A_SRA,A_SLL,A_SRL,A_SUB,A_XOR,A_NONE,A_NONE
    );
  81. {
  82. );TOpCG2AsmOpReg: array[topcg] of TAsmOp = (
  83. A_NONE,A_MOV,A_ADD,A_AND,A_UDIV,A_SDIV,A_MUL,A_MUL,A_NEG,A_MVN,A_ORR,A_ASRV,A_LSLV,A_LSRV,A_SUB,A_EOR,A_NONE,A_RORV
  84. );
  85. TOpCG2AsmOpImm: array[topcg] of TAsmOp = (
  86. A_NONE,A_MOV,A_ADD,A_AND,A_UDIV,A_SDIV,A_MUL,A_MUL,A_NEG,A_MVN,A_ORR,A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR
  87. );
  88. TOpCmp2AsmCond: array[topcmp] of TAsmCond = (C_NONE,C_EQ,C_GT,
  89. C_LT,C_GE,C_LE,C_NE,C_LS,C_CC,C_CS,C_HI
  90. );
  91. }
  92. implementation
  93. uses
  94. globals,verbose,systems,cutils,
  95. paramgr,fmodule,
  96. symtable,symsym,
  97. tgobj,
  98. procinfo,cpupi;
  const
    { Lookup table from a generic comparison (TOpCmp) to an Xtensa branch
      condition.  The entries must stay in the declaration order of TOpCmp,
      which is defined outside this unit.
      NOTE(review): C_None presumably marks comparisons without a direct
      Xtensa condition, which the users of this table have to handle
      themselves (e.g. by swapping operands) - confirm against the
      comparison routines. }
    TOpCmp2AsmCond: array[TOpCmp] of TAsmCond = (
      C_None,
      C_EQ,
      C_None,
      C_LT,
      C_GE,
      C_None,
      C_NE,
      C_None,
      C_LTU,
      C_GEU,
      C_None
    );
  { Creates the register allocators for the integer, floating point and
    special (boolean) register files.  a0 and a1 are never handed to the
    integer allocator; under the call0 ABI a8 and a15 are kept out of it
    as well. }
  procedure tcgcpu.init_register_allocators;
    begin
      inherited init_register_allocators;

      { integer registers: the usable set depends on the ABI }
      case target_info.abi of
        abi_xtensa_call0:
          rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
            [RS_A2,RS_A3,RS_A4,RS_A5,RS_A6,RS_A7,RS_A9,
             RS_A10,RS_A11,RS_A12,RS_A13,RS_A14],
            first_int_imreg,[]);
        else
          rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
            [RS_A2,RS_A3,RS_A4,RS_A5,RS_A6,RS_A7,RS_A8,RS_A9,
             RS_A10,RS_A11,RS_A12,RS_A13,RS_A14,RS_A15],
            first_int_imreg,[]);
      end;

      { floating point registers f0..f15 }
      rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
        [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7,
         RS_F8,RS_F9,RS_F10,RS_F11,RS_F12,RS_F13,RS_F14,RS_F15],
        first_fpu_imreg,[]);

      { boolean registers b0..b15 }
      rg[R_SPECIALREGISTER]:=trgcpu.create(R_SPECIALREGISTER,R_SUBNONE,
        [RS_B0,RS_B1,RS_B2,RS_B3,RS_B4,RS_B5,RS_B6,RS_B7,
         RS_B8,RS_B9,RS_B10,RS_B11,RS_B12,RS_B13,RS_B14,RS_B15],
        first_flag_imreg,[]);
    end;
  { Releases the three register allocators created by
    init_register_allocators, then lets the ancestor clean up. }
  procedure tcgcpu.done_register_allocators;
    const
      owned_regtypes : array[0..2] of TRegisterType =
        (R_INTREGISTER,R_FPUREGISTER,R_SPECIALREGISTER);
    var
      i : longint;
    begin
      for i:=low(owned_regtypes) to high(owned_regtypes) do
        rg[owned_regtypes[i]].free;
      inherited done_register_allocators;
    end;
  { Copies reg1 into reg2, zero- or sign-extending (or truncating) according
    to fromsize/tosize.  When no conversion instruction is needed and the
    registers differ, a plain MOV is emitted and reported to the register
    allocator so it can be coalesced. }
  procedure tcgcpu.a_load_reg_reg(list : TAsmList; fromsize,tosize : tcgsize;
    reg1,reg2 : tregister);

    { sign-extends reg1 into reg2, signbit being the index of the sign bit }
    procedure emit_sign_extend(signbit : longint);
      begin
        if CPUXTENSA_HAS_SEXT in cpu_capabilities[current_settings.cputype] then
          list.concat(taicpu.op_reg_reg_const(A_SEXT,reg2,reg1,signbit))
        else
          begin
            { no SEXT available: shift the sign bit to bit 31 and back }
            list.concat(taicpu.op_reg_reg_const(A_SLLI,reg2,reg1,31-signbit));
            list.concat(taicpu.op_reg_reg_const(A_SRAI,reg2,reg2,31-signbit));
          end;
      end;

    var
      converted : Boolean;
      movinstr : taicpu;
    begin
      if (tcgsize2size[fromsize]>32) or (tcgsize2size[tosize]>32) or (fromsize=OS_NO) or (tosize=OS_NO) then
        internalerror(2020030710);

      converted:=false;
      if tosize<>fromsize then
        begin
          { when narrowing (or only changing signedness) the target size
            decides which extension is applied }
          if tcgsize2size[tosize]<=tcgsize2size[fromsize] then
            fromsize:=tosize;
          converted:=true;
          case fromsize of
            OS_8:
              list.concat(taicpu.op_reg_reg_const_const(A_EXTUI,reg2,reg1,0,8));
            OS_16:
              list.concat(taicpu.op_reg_reg_const_const(A_EXTUI,reg2,reg1,0,16));
            OS_S8:
              begin
                emit_sign_extend(7);
                { a signed byte widened to an unsigned word keeps only 16 bits }
                if tosize=OS_16 then
                  list.concat(taicpu.op_reg_reg_const_const(A_EXTUI,reg2,reg2,0,16));
              end;
            OS_S16:
              emit_sign_extend(15);
            else
              converted:=false;
          end;
        end;

      if (reg1<>reg2) and not converted then
        begin
          { same size, only a register mov required }
          movinstr:=taicpu.op_reg_reg(A_MOV,reg2,reg1);
          list.Concat(movinstr);
          { Notify the register allocator that we have written a move
            instruction so it can try to eliminate it. }
          add_move_instruction(movinstr);
        end;
    end;
  { Stores reg to ref using the store instruction matching tosize.
    References the store instruction cannot encode directly (symbol, index
    register, offset negative, too large or misaligned) are first reduced
    to a plain base register by fixref.  fromsize does not influence the
    generated code. }
  procedure tcgcpu.a_load_reg_ref(list : TAsmList; fromsize,tosize : tcgsize;
    reg : tregister; const ref : TReference);
    var
      storeop : TAsmOp;
      maxoffset,
      granule : longint;
      addr : treference;
    begin
      { pick the store opcode together with its offset limit and alignment }
      case tosize of
        OS_8,
        OS_S8:
          begin
            storeop:=A_S8I;
            maxoffset:=255;
            granule:=1;
          end;
        OS_16,
        OS_S16:
          begin
            storeop:=A_S16I;
            maxoffset:=510;
            granule:=2;
          end;
        OS_32,
        OS_S32:
          begin
            storeop:=A_S32I;
            maxoffset:=1020;
            granule:=4;
          end;
        else
          InternalError(2020030804);
      end;

      addr:=ref;
      if assigned(addr.symbol) or
         (addr.index<>NR_NO) or
         (addr.offset<0) or
         (addr.offset>maxoffset) or
         (addr.offset mod granule<>0) then
        fixref(list,addr);

      list.concat(taicpu.op_reg_ref(storeop,reg,addr));
    end;
  { Loads a value of size fromsize from ref into reg and converts it to
    tosize.  Signed bytes are loaded with the unsigned byte load and
    sign-extended afterwards. }
  procedure tcgcpu.a_load_ref_reg(list : TAsmList; fromsize,tosize : tcgsize;
    const ref : TReference; reg : tregister);
    var
      addr : treference;
      loadop : TAsmOp;
      maxoffset,
      granule : longint;
    begin
      { pick the load opcode together with its offset limit and alignment }
      case fromsize of
        OS_8,
        OS_S8:
          begin
            loadop:=A_L8UI;
            maxoffset:=255;
            granule:=1;
          end;
        OS_16,
        OS_S16:
          begin
            if fromsize=OS_16 then
              loadop:=A_L16UI
            else
              loadop:=A_L16SI;
            maxoffset:=510;
            granule:=2;
          end;
        { 64 bit sizes only happen if tosize is smaller than fromsize, so
          only the low 32 bit of the 64 bit value have to be considered }
        OS_32,
        OS_S32,
        OS_64,
        OS_S64:
          begin
            loadop:=A_L32I;
            maxoffset:=1020;
            granule:=4;
          end;
        else
          internalerror(2020030801);
      end;

      addr:=ref;
      if assigned(addr.symbol) or
         (addr.index<>NR_NO) or
         (addr.offset<0) or
         (addr.offset>maxoffset) or
         (addr.offset mod granule<>0) then
        fixref(list,addr);

      list.concat(taicpu.op_reg_ref(loadop,reg,addr));

      { the byte load is unsigned: sign-extend by hand when widening }
      if (fromsize=OS_S8) and not(tosize in [OS_S8,OS_8]) then
        begin
          if CPUXTENSA_HAS_SEXT in cpu_capabilities[current_settings.cputype] then
            list.concat(taicpu.op_reg_reg_const(A_SEXT,reg,reg,7))
          else
            begin
              list.concat(taicpu.op_reg_reg_const(A_SLLI,reg,reg,24));
              list.concat(taicpu.op_reg_reg_const(A_SRAI,reg,reg,24));
            end;
        end;

      { any remaining size adjustment is done register to register }
      if (fromsize<>tosize) and (not (tosize in [OS_SINT,OS_INT])) then
        a_load_reg_reg(list,fromsize,tosize,reg,reg);
    end;
  { Loads the constant a into reg: MOVI for values in -2048..2047,
    otherwise the value is placed in the procedure's local data and
    fetched with L32R. }
  procedure tcgcpu.a_load_const_reg(list : TAsmList; size : tcgsize;
    a : tcgint; reg : tregister);
    var
      literalref : treference;
      literallabel : TAsmLabel;
    begin
      if (a>=-2048) and (a<=2047) then
        begin
          list.Concat(taicpu.op_reg_const(A_MOVI,reg,a));
          exit;
        end;

      { emit "label: .long a" into the local data of the current procedure }
      current_asmdata.getjumplabel(literallabel);
      cg.a_label(current_procinfo.aktlocaldata,literallabel);
      current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));

      { ... and load it pc-relative }
      reference_reset(literalref,4,[]);
      literalref.symbol:=literallabel;
      list.concat(taicpu.op_reg_ref(A_L32R,reg,literalref));
    end;
  { Reduces ref to a form every load/store can encode: on return ref has
    only a base register, no index, no symbol and a zero offset.

    - A symbol, or an offset outside -2048..2047, is materialised through a
      32 bit entry in the procedure's local data that is loaded with L32R.
    - A smaller non-zero offset is added with ADDI (when a base register
      exists and the offset fits -128..127) or loaded with MOVI.
    - Finally base and index are summed into a single register.

    Fix compared to the previous version: the ADDI shortcut is only taken
    when ref.base is a real register; without a base the offset is loaded
    with MOVI instead of emitting ADDI with NR_NO as source operand. }
  procedure tcgcpu.fixref(list : TAsmList;var ref : treference);

    { folds the register "addend" (holding the symbol address and/or the
      offset) into the register part of ref }
    procedure merge_register(addend : tregister);
      begin
        if ref.base=NR_NO then
          ref.base:=addend
        else if ref.index=NR_NO then
          ref.index:=addend
        else
          begin
            { base and index are both taken: pre-add the base }
            list.concat(taicpu.op_reg_reg_reg(A_ADD,addend,ref.base,addend));
            ref.base:=addend;
          end;
      end;

    var
      tmpreg : tregister;
      tmpref : treference;
      l : tasmlabel;
    begin
      if assigned(ref.symbol) or (ref.offset<-2048) or (ref.offset>2047) then
        begin
          { create consts entry }
          reference_reset(tmpref,4,[]);
          current_asmdata.getjumplabel(l);
          cg.a_label(current_procinfo.aktlocaldata,l);
          if assigned(ref.symbol) then
            current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset))
          else if ref.offset<>0 then
            current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ref.offset));

          { load consts entry }
          tmpreg:=getintregister(list,OS_INT);
          tmpref.symbol:=l;
          list.concat(taicpu.op_reg_ref(A_L32R,tmpreg,tmpref));
          merge_register(tmpreg);
        end
      else if ref.offset<>0 then
        begin
          tmpreg:=getintregister(list,OS_INT);
          if (ref.base<>NR_NO) and (ref.offset>=-128) and (ref.offset<=127) then
            begin
              { small offset on top of an existing base: one ADDI is enough }
              list.concat(taicpu.op_reg_reg_const(A_ADDI,tmpreg,ref.base,ref.offset));
              ref.base:=tmpreg;
            end
          else
            begin
              list.concat(taicpu.op_reg_const(A_MOVI,tmpreg,ref.offset));
              merge_register(tmpreg);
            end;
        end;

      { collapse base+index into a single base register }
      if ref.index<>NR_NO then
        begin
          if ref.base<>NR_NO then
            begin
              tmpreg:=getintregister(list,OS_INT);
              list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,ref.index));
              ref.base:=tmpreg;
            end
          else
            ref.base:=ref.index;
          ref.index:=NR_NO;
        end;

      ref.offset:=0;
      ref.symbol:=nil;
    end;
  { Computes the effective address described by ref into register r. }
  procedure tcgcpu.a_loadaddr_ref_reg(list : TAsmList;
    const ref : TReference; r : tregister);
    var
      addr : treference;
      movinstr : taicpu;
    begin
      addr:=ref;

      { Be sure to have a base register }
      if addr.base=NR_NO then
        begin
          addr.base:=addr.index;
          addr.index:=NR_NO;
        end;

      { symbolic references are resolved to a plain base register first }
      if assigned(addr.symbol) then
        fixref(list,addr);

      { expect a base here if there is an index }
      if (addr.base=NR_NO) and (addr.index<>NR_NO) then
        internalerror(200312022);

      if addr.index<>NR_NO then
        begin
          { base + index (+ offset) }
          a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,addr.base,addr.index,r);
          if addr.offset<>0 then
            a_op_const_reg_reg(list,OP_ADD,OS_ADDR,addr.offset,r,r);
        end
      else if addr.base=NR_NO then
        { absolute address }
        a_load_const_reg(list,OS_ADDR,addr.offset,r)
      else if addr.offset<>0 then
        { base + offset }
        a_op_const_reg_reg(list,OP_ADD,OS_ADDR,addr.offset,addr.base,r)
      else
        begin
          { base only: a register move the allocator may remove }
          movinstr:=taicpu.op_reg_reg(A_MOV,r,addr.base);
          list.concat(movinstr);
          add_move_instruction(movinstr);
        end;
    end;
  { Two operand form: dst := dst op src, respectively dst := op src for the
    unary operations OP_NEG and OP_NOT. }
  procedure tcgcpu.a_op_reg_reg(list : TAsmList; op : topcg; size : tcgsize; src,dst : tregister);
    var
      allones : TRegister;
    begin
      case op of
        OP_NEG:
          begin
            list.concat(taicpu.op_reg_reg(A_NEG,dst,src));
            maybeadjustresult(list,OP_NEG,size,dst);
          end;
        OP_NOT:
          begin
            { not x = x xor -1 }
            allones:=getintregister(list,size);
            list.concat(taicpu.op_reg_const(A_MOVI,allones,-1));
            list.concat(taicpu.op_reg_reg_reg(A_XOR,dst,allones,src));
            maybeadjustresult(list,OP_NOT,size,dst);
          end;
        else
          a_op_reg_reg_reg(list,op,size,src,dst,dst);
      end;
    end;
  { dst := src op a.  Uses immediate instruction forms where the constant
    fits; otherwise the constant is loaded into a temporary register and the
    three register form is used. }
  procedure tcgcpu.a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister);

    { emits dst := src + value for value in -32896..32639, using one ADDI
      when value fits -128..127 and ADDMI+ADDI otherwise; shown is the
      value printed in the EXTDEBUG comment }
    procedure emit_add_immediate(value,shown : tcgint);
      begin
        if (value>=-128) and (value<=127) then
          list.concat(taicpu.op_reg_reg_const(A_ADDI,dst,src,value))
        else
          begin
{$ifdef EXTDEBUG}
            list.concat(tai_comment.Create(strpnew('Value: '+tostr(shown))));
{$endif EXTDEBUG}
            { upper part rounded to a multiple of 256, signed low byte as rest }
            list.concat(taicpu.op_reg_reg_const(A_ADDMI,dst,src,Smallint((value+128) and $ff00)));
            list.concat(taicpu.op_reg_reg_const(A_ADDI,dst,dst,Shortint(value and $ff)));
          end;
      end;

    var
      shiftcount : longint;
      constreg : TRegister;
    begin
      optimize_op_const(size, op, a);

      { operations which degenerated into a move }
      if op=OP_NONE then
        begin
          if src <> dst then
            a_load_reg_reg(list, size, size, src, dst);
          exit;
        end;
      if op=OP_MOVE then
        begin
          a_load_const_reg(list, size, a, dst);
          exit;
        end;

      { there could be added some more sophisticated optimizations }
      if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
        a_op_reg_reg(list,OP_NEG,size,src,dst)
      { we do this here instead in the peephole optimizer because
        it saves us a register }
      else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,shiftcount) then
        a_op_const_reg_reg(list,OP_SHL,size,shiftcount,src,dst)
      else if (op=OP_ADD) and (a>=-128-32768) and (a<=127+32512) then
        emit_add_immediate(a,a)
      else if (op=OP_SUB) and (a>=-127-32512) and (a<=128+32768) then
        { subtracting a is adding -a }
        emit_add_immediate(-a,a)
      else if (op=OP_SHL) and (a>=1) and (a<=31) then
        list.concat(taicpu.op_reg_reg_const(A_SLLI,dst,src,a))
      else if (op=OP_SAR) and (a>=0) and (a<=31) then
        list.concat(taicpu.op_reg_reg_const(A_SRAI,dst,src,a))
      else if (op=OP_SHR) and (a>=0) and (a<=15) then
        list.concat(taicpu.op_reg_reg_const(A_SRLI,dst,src,a))
      else if (op=OP_SHR) and (a>15) and (a<=31) then
        { larger logical right shifts are done as a bit field extract }
        list.concat(taicpu.op_reg_reg_const_const(A_EXTUI,dst,src,a,32-a))
      else
        begin
          constreg:=getintregister(list,size);
          a_load_const_reg(list,size,a,constreg);
          a_op_reg_reg_reg(list,op,size,constreg,src,dst);
        end;

      maybeadjustresult(list,op,size,dst);
    end;
  { reg := reg op a; simply the three operand form with source and
    destination being the same register. }
  procedure tcgcpu.a_op_const_reg(list : TAsmList; op : topcg;
    size : tcgsize; a : tcgint; reg : tregister);
    begin
      a_op_const_reg_reg(list,op,size,a,reg,reg);
    end;
  { Three operand form: dst := src2 op src1.

    - OP_MOVE copies src1 to dst.
    - OP_NOT and OP_NEG are unary and operate on src1.
    - Shifts take the shift count from src1 (set up with SSL/SSR) and shift
      src2.
    - Everything else maps to a single instruction via TOpCG2AsmOp.

    Fix compared to the previous version: OP_NOT only loaded -1 into a
    temporary register and never wrote dst; it now emits the XOR with the
    all-ones register, like a_op_reg_reg does. }
  procedure tcgcpu.a_op_reg_reg_reg(list : TAsmList; op : topcg;
    size : tcgsize; src1,src2,dst : tregister);
    var
      tmpreg : TRegister;
    begin
      case op of
        OP_MOVE:
          begin
            a_load_reg_reg(list,size,size,src1,dst);
            { a plain move needs no result adjustment }
            exit;
          end;
        OP_NOT:
          begin
            { not x = x xor -1 }
            tmpreg:=getintregister(list,size);
            list.concat(taicpu.op_reg_const(A_MOVI,tmpreg,-1));
            list.concat(taicpu.op_reg_reg_reg(A_XOR,dst,tmpreg,src1));
          end;
        OP_NEG:
          list.concat(taicpu.op_reg_reg(A_NEG,dst,src1));
        OP_SAR,
        OP_SHL,
        OP_SHR:
          begin
            { the shift count is passed through the shift amount register }
            if op=OP_SHL then
              list.concat(taicpu.op_reg(A_SSL,src1))
            else
              list.concat(taicpu.op_reg(A_SSR,src1));
            list.concat(taicpu.op_reg_reg(TOpCG2AsmOp[op],dst,src2));
          end;
        else
          list.concat(taicpu.op_reg_reg_reg(TOpCG2AsmOp[op],dst,src2,src1));
      end;
      maybeadjustresult(list,op,size,dst);
    end;
  { Emits a call to the routine named s, using the call instruction selected
    by the current procedure info; weak requests a weak symbol reference. }
  procedure tcgcpu.a_call_name(list : TAsmList; const s : string;
    weak : boolean);
    var
      target : TAsmSymbol;
    begin
      if weak then
        target:=current_asmdata.WeakRefAsmSymbol(s,AT_FUNCTION)
      else
        target:=current_asmdata.RefAsmSymbol(s,AT_FUNCTION);
      list.concat(taicpu.op_sym(txtensaprocinfo(current_procinfo).callins,target));
    end;
  { Emits an indirect call through Reg, using the register call instruction
    selected by the current procedure info. }
  procedure tcgcpu.a_call_reg(list : TAsmList; Reg : tregister);
    var
      callinstr : taicpu;
    begin
      callinstr:=taicpu.op_reg(txtensaprocinfo(current_procinfo).callxins,reg);
      list.concat(callinstr);
    end;
  { Emits an unconditional jump to the routine named s. }
  procedure tcgcpu.a_jmp_name(list : TAsmList; const s : string);
    var
      jump : taicpu;
    begin
      { for now, we use A15 here, however, this is not safe as it might
        contain an argument }
      jump:=TAiCpu.op_sym_reg(A_J,current_asmdata.RefAsmSymbol(s,AT_FUNCTION),NR_A15);
      { if destination is too far for J then assembler can convert to JX }
      jump.oppostfix:=PF_L;
      jump.is_jmp:=true;
      list.Concat(jump);
    end;
  { Branches to l depending on the flag described by f.  Only available on
    cpus with the boolean option; otherwise an internal error is raised. }
  procedure tcgcpu.a_jmp_flags(list: TAsmList; const f: TResFlags; l: tasmlabel);
    var
      branch : taicpu;
    begin
      if not(CPUXTENSA_HAS_BOOLEAN_OPTION in cpu_capabilities[current_settings.cputype]) then
        Internalerror(2020070401)
      else
        begin
          { branch on the boolean register holding the flag }
          branch:=taicpu.op_reg_sym(A_B,f.register,l);
          branch.condition:=flags_to_cond(f.flag);
          list.concat(branch);
        end;
    end;
  { Emits the procedure prologue.

    list         - instruction list the prologue is appended to
    localsize    - size of the local variables in bytes
    nostackframe - when true, nothing is emitted at all

    call0 ABI:    the stack pointer is lowered by the locals plus the
                  register save area, then the frame pointer (a15, if used)
                  and every used non-volatile register are stored at the top
                  of the new frame.
    windowed ABI: a single ENTRY instruction, or ENTRY plus an explicit
                  stack pointer adjustment for frames larger than 32760
                  bytes. }
  procedure tcgcpu.g_proc_entry(list : TAsmList; localsize : longint;
    nostackframe : boolean);
    var
      ref : treference;
      r : byte;
      regs : tcpuregisterset;
      { NOTE(review): stackmisalignment and regoffset are never used in this routine }
      stackmisalignment : pint;
      regoffset : LongInt;
      stack_parameters : Boolean;
      registerarea : PtrInt;
      l : TAsmLabel;
    begin
      LocalSize:=align(LocalSize,4);
      stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
      { call instruction does not put anything on the stack }
      registerarea:=0;
      if not(nostackframe) then
        begin
          { registers used by this procedure which are not volatile, i.e. which have to be preserved }
          regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
          a_reg_alloc(list,NR_STACK_POINTER_REG);
          case target_info.abi of
            abi_xtensa_call0:
              begin
                { a15 serves as frame pointer and a0 is overwritten by calls, so both need saving }
                if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
                  Include(regs,RS_A15);
                if pi_do_call in current_procinfo.flags then
                  Include(regs,RS_A0);
                { four bytes of save area per saved register }
                if regs<>[] then
                  begin
                    for r:=RS_A0 to RS_A15 do
                      if r in regs then
                        inc(registerarea,4);
                  end;
                inc(localsize,registerarea);
                if LocalSize<>0 then
                  begin
                    localsize:=align(localsize,current_settings.alignment.localalignmax);
                    { NOTE(review): the stack pointer was already marked as allocated above }
                    a_reg_alloc(list,NR_STACK_POINTER_REG);
                    { NOTE(review): elsewhere in this unit ADDI is only emitted for
                      immediates in -128..127; larger frames presumably rely on the
                      assembler relaxing this instruction - confirm }
                    list.concat(taicpu.op_reg_reg_const(A_ADDI,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,-localsize));
                  end;
                { ref walks downwards from the top of the new frame }
                reference_reset(ref,4,[]);
                ref.base:=NR_STACK_POINTER_REG;
                ref.offset:=localsize;
                if ref.offset>1024 then
                  begin
                    if ref.offset<=1024+32512 then
                      begin
                        { offset too large for a store: address the save area through a8 instead.
                          NOTE(review): when the low ten bits of the offset are zero, the
                          following dec(ref.offset,4) yields a negative offset - confirm
                          that this is handled }
                        list.concat(taicpu.op_reg_reg_const(A_ADDMI,NR_A8,NR_STACK_POINTER_REG,ref.offset and $fffffc00));
                        ref.offset:=ref.offset and $3ff;
                        ref.base:=NR_A8;
                      end
                    else
                      { fix me! }
                      Internalerror(2020031101);
                  end;
                if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
                  begin
                    { save the old a15 in the topmost slot, then make it the frame pointer }
                    dec(ref.offset,4);
                    list.concat(taicpu.op_reg_ref(A_S32I,NR_A15,ref));
                    a_reg_alloc(list,NR_FRAME_POINTER_REG);
                    list.concat(taicpu.op_reg_reg(A_MOV,NR_A15,NR_STACK_POINTER_REG));
                  end;
                if regs<>[] then
                  begin
                    { a15 was handled above, so start at a14 }
                    for r:=RS_A14 downto RS_A0 do
                      if r in regs then
                        begin
                          dec(ref.offset,4);
                          list.concat(taicpu.op_reg_ref(A_S32I,newreg(R_INTREGISTER,r,R_SUBWHOLE),ref));
                        end;
                  end;
              end;
            abi_xtensa_windowed:
              begin
                if stack_parameters and (pi_estimatestacksize in current_procinfo.flags) then
                  begin
                    { the frame size was estimated up front and must not be exceeded }
                    if localsize>txtensaprocinfo(current_procinfo).stackframesize then
                      internalerror(2020031402)
                    else
                      localsize:=txtensaprocinfo(current_procinfo).stackframesize-registerarea;
                  end
                else
                  begin
                    { default spill area }
                    inc(localsize,4*4);
                    { additional spill area? }
                    if pi_do_call in current_procinfo.flags then
                      inc(localsize,txtensaprocinfo(current_procinfo).maxcall*4);
                    localsize:=align(localsize,current_settings.alignment.localalignmax);
                  end;
                if localsize>32760 then
                  begin
                    { frame too large for ENTRY: enter with 32 bytes, then lower the
                      stack pointer by the remainder, which is loaded from local data }
                    list.concat(taicpu.op_reg_const(A_ENTRY,NR_STACK_POINTER_REG,32));
                    reference_reset(ref,4,[]);
                    current_asmdata.getjumplabel(l);
                    cg.a_label(current_procinfo.aktlocaldata,l);
                    current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(localsize-32)));
                    ref.symbol:=l;
                    list.concat(taicpu.op_reg_ref(A_L32R,NR_A8,ref));
                    list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_A8,NR_STACK_POINTER_REG,NR_A8));
                    list.concat(taicpu.op_reg_reg(A_MOVSP,NR_STACK_POINTER_REG,NR_A8));
                  end
                else
                  list.concat(taicpu.op_reg_const(A_ENTRY,NR_STACK_POINTER_REG,localsize));
              end;
            else
              Internalerror(2020031401);
          end;
        end;
    end;
  { Emits the procedure epilogue.

    list         - instruction list the epilogue is appended to
    parasize     - not used by this implementation
    nostackframe - when true, the call0 epilogue consists of RET only

    windowed ABI: RETW.
    call0 ABI:    recomputes the frame layout exactly like g_proc_entry,
                  reloads the saved registers, releases the frame and
                  returns with RET. }
  procedure tcgcpu.g_proc_exit(list : TAsmList; parasize : longint;
    nostackframe : boolean);
    var
      ref : treference;
      r : byte;
      regs : tcpuregisterset;
      { NOTE(review): stackmisalignment, regoffset and l are never used in this routine }
      stackmisalignment : pint;
      regoffset : LongInt;
      stack_parameters : Boolean;
      registerarea : PtrInt;
      l : TAsmLabel;
      LocalSize: longint;
    begin
      case target_info.abi of
        abi_xtensa_windowed:
          list.Concat(taicpu.op_none(A_RETW));
        abi_xtensa_call0:
          begin
            if not(nostackframe) then
              begin
                { the computations below have to mirror g_proc_entry so that
                  the same frame size and slot offsets are obtained }
                LocalSize:=current_procinfo.calc_stackframe_size;
                LocalSize:=align(LocalSize,4);
                stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
                registerarea:=0;
                regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
                if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
                  Include(regs,RS_A15);
                if pi_do_call in current_procinfo.flags then
                  Include(regs,RS_A0);
                if regs<>[] then
                  begin
                    for r:=RS_A0 to RS_A15 do
                      if r in regs then
                        inc(registerarea,4);
                  end;
                inc(localsize,registerarea);
                if LocalSize<>0 then
                  begin
                    localsize:=align(localsize,current_settings.alignment.localalignmax);
                    // Determine reference mode required to access stack
                    reference_reset(ref,4,[]);
                    ref.base:=NR_STACK_POINTER_REG;
                    ref.offset:=localsize;
                    if ref.offset>1024 then
                      begin
                        if ref.offset<=1024+32512 then
                          begin
                            // allocation done in proc_entry
                            // NOTE(review): a8 is not recomputed here, so this relies on a8
                            // still holding the value set up by the prologue - confirm
                            //list.concat(taicpu.op_reg_reg_const(A_ADDMI,NR_A8,NR_STACK_POINTER_REG,ref.offset and $fffffc00));
                            ref.offset:=ref.offset and $3ff;
                            ref.base:=NR_A8;
                          end
                        else
                          { fix me! }
                          Internalerror(2020031101);
                      end;
                    // restore a15 if used
                    if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
                      begin
                        dec(ref.offset,4);
                        list.concat(taicpu.op_reg_ref(A_L32I,NR_A15,ref));
                        a_reg_dealloc(list,NR_FRAME_POINTER_REG);
                      end;
                    // restore rest of registers
                    if regs<>[] then
                      begin
                        for r:=RS_A14 downto RS_A0 do
                          if r in regs then
                            begin
                              dec(ref.offset,4);
                              list.concat(taicpu.op_reg_ref(A_L32I,newreg(R_INTREGISTER,r,R_SUBWHOLE),ref));
                            end;
                      end;
                    // restore stack pointer
                    // NOTE(review): as in the prologue, localsize may exceed the -128..127
                    // range this unit otherwise uses for ADDI - confirm
                    list.concat(taicpu.op_reg_reg_const(A_ADDI,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,localsize));
                    a_reg_dealloc(list,NR_STACK_POINTER_REG);
                  end;
              end;
            list.Concat(taicpu.op_none(A_RET));
          end
        else
          Internalerror(2020031403);
      end;
    end;
  { Emits a conditional branch to l that compares reg against the constant a.

    Three immediate forms are emitted directly:
      - a=0 with EQ/NE/LT/GTE        -> branch with an ..Z condition, no immediate
      - a accepted by is_b4const and
        EQ/NE/LT/GTE                 -> branch with an ..I condition and immediate
      - a accepted by is_b4constu and
        B/AE                         -> branch with an ..UI condition and immediate
    Everything else is delegated to the inherited implementation. }
  procedure tcgcpu.a_cmp_const_reg_label(list: TAsmList; size: tcgsize; cmp_op: topcmp; a: tcgint; reg: tregister; l: tasmlabel);

    { true for the constants accepted by the signed immediate branch forms }
    function is_b4const(v: tcgint): boolean;
      begin
        case v of
          -1,
          1..8,
          10,12,16,32,64,128,256:
            result:=true;
          else
            result:=false;
        end;
      end;

    { true for the constants accepted by the unsigned immediate branch forms }
    function is_b4constu(v: tcgint): boolean;
      begin
        case v of
          2..8,
          10,12,16,32,64,128,256,
          32768,65536:
            result:=true;
          else
            result:=false;
        end;
      end;

    var
      cond: TAsmCond;
      branch: taicpu;
    begin
      branch:=nil;
      if cmp_op in [OC_EQ,OC_NE,OC_LT,OC_GTE] then
        begin
          if a=0 then
            begin
              case cmp_op of
                OC_EQ: cond:=C_EQZ;
                OC_NE: cond:=C_NEZ;
                OC_LT: cond:=C_LTZ;
                OC_GTE: cond:=C_GEZ;
                else
                  Internalerror(2020030801);
              end;
              branch:=taicpu.op_reg_sym(A_B,reg,l);
            end
          else if is_b4const(a) then
            begin
              case cmp_op of
                OC_EQ: cond:=C_EQI;
                OC_NE: cond:=C_NEI;
                OC_LT: cond:=C_LTI;
                OC_GTE: cond:=C_GEI;
                else
                  Internalerror(2020030801);
              end;
              branch:=taicpu.op_reg_const_sym(A_B,reg,a,l);
            end;
        end
      else if (cmp_op in [OC_B,OC_AE]) and is_b4constu(a) then
        begin
          case cmp_op of
            OC_B: cond:=C_LTUI;
            OC_AE: cond:=C_GEUI;
            else
              Internalerror(2020030801);
          end;
          branch:=taicpu.op_reg_const_sym(A_B,reg,a,l);
        end;

      if assigned(branch) then
        begin
          branch.condition:=cond;
          list.concat(branch);
        end
      else
        { no immediate form applies }
        inherited a_cmp_const_reg_label(list, size, cmp_op, a, reg, l);
    end;
  { Emits a conditional branch to l comparing reg2 against reg1.

    When TOpCmp2AsmCond has no condition for cmp_op, the comparison is
    mirrored with swap_opcmp and the two registers are exchanged before the
    branch is built.  size is not used here. }
  procedure tcgcpu.a_cmp_reg_reg_label(list : TAsmList; size : tcgsize;
    cmp_op : topcmp; reg1,reg2 : tregister; l : tasmlabel);
    var
      swapped: TRegister;
      branch: taicpu;
    begin
      if TOpCmp2AsmCond[cmp_op]=C_None then
        begin
          { no direct condition: mirror the comparison and its operands }
          swapped:=reg2;
          reg2:=reg1;
          reg1:=swapped;
          cmp_op:=swap_opcmp(cmp_op);
        end;
      branch:=taicpu.op_reg_reg_sym(A_B,reg2,reg1,l);
      branch.condition:=TOpCmp2AsmCond[cmp_op];
      list.concat(branch);
    end;
  { Emits an unconditional jump to l.

    Labels with global binding get the J form with the PF_L postfix and A15
    as an extra register operand; all other labels get a plain J.  The
    instruction is flagged as a jump before it is appended to list. }
  procedure tcgcpu.a_jmp_always(list : TAsmList; l : TAsmLabel);
    var
      jump : taicpu;
    begin
      if l.bind=AB_GLOBAL then
        begin
          { for now, we use A15 here, however, this is not safe as it might
            contain an argument, I have not figured out a solution yet }
          jump:=taicpu.op_sym_reg(A_J,l,NR_A15);
          jump.oppostfix:=PF_L;
        end
      else
        jump:=taicpu.op_sym(A_J,l);
      jump.is_jmp:=true;
      list.concat(jump);
    end;
  { Materialises the flag result f as 0/1 in reg.

    reg is preset to 0, a scratch register is loaded with 1, and a
    conditional move (condition taken from flags_to_cond(f.flag), tested
    register f.register) copies the 1 into reg. }
  procedure tcgcpu.g_flags2reg(list: TAsmList; size: TCgSize; const f: tresflags; reg: TRegister);
    var
      onereg: TRegister;
      condmove: taicpu;
    begin
      { default result }
      a_load_const_reg(list,size,0,reg);
      { value moved in when the condition holds }
      onereg:=getintregister(list,size);
      a_load_const_reg(list,size,1,onereg);
      condmove:=taicpu.op_reg_reg_reg(A_MOV,reg,onereg,f.register);
      condmove.condition:=flags_to_cond(f.flag);
      list.concat(condmove);
    end;
  { Copies len bytes from Source to dest by emitting a call to FPC_MOVE.

    The parameter locations are taken from the system procedure 'MOVE':
    parameter 1 receives the address of Source, parameter 2 the address of
    dest and parameter 3 the byte count.  The volatile integer and FPU
    registers are marked allocated around the call. }
  procedure tcgcpu.g_concatcopy_move(list: tasmlist; const Source, dest: treference; len: tcgint);
    var
      srcpara, dstpara, lenpara: TCGPara;
      movedef: tprocdef;
    begin
      movedef:=search_system_proc('MOVE');
      srcpara.init;
      dstpara.init;
      lenpara.init;
      paramanager.getcgtempparaloc(list, movedef, 1, srcpara);
      paramanager.getcgtempparaloc(list, movedef, 2, dstpara);
      paramanager.getcgtempparaloc(list, movedef, 3, lenpara);

      { parameters are loaded last to first }
      a_load_const_cgpara(list, OS_SINT, len, lenpara);
      a_loadaddr_ref_cgpara(list, dest, dstpara);
      a_loadaddr_ref_cgpara(list, Source, srcpara);
      paramanager.freecgpara(list, lenpara);
      paramanager.freecgpara(list, dstpara);
      paramanager.freecgpara(list, srcpara);

      { the call itself, bracketed by the volatile register sets }
      alloccpuregisters(list, R_INTREGISTER, paramanager.get_volatile_registers_int(pocall_default));
      alloccpuregisters(list, R_FPUREGISTER, paramanager.get_volatile_registers_fpu(pocall_default));
      a_call_name(list, 'FPC_MOVE', false);
      dealloccpuregisters(list, R_FPUREGISTER, paramanager.get_volatile_registers_fpu(pocall_default));
      dealloccpuregisters(list, R_INTREGISTER, paramanager.get_volatile_registers_int(pocall_default));

      lenpara.done;
      dstpara.done;
      srcpara.done;
    end;
  { Copies len bytes from source to dest.

    Strategy, in order:
      1. len > 100 inside a procedure already flagged pi_do_call: call
         FPC_MOVE through g_concatcopy_move.
      2. more than four 32 bit words: a counted load/store loop.
      3. up to four words: straight-line load/store pairs.
      4. remaining bytes: one 16 bit and/or one 8 bit copy.

    Raises internal error 2002072704 when len exceeds high(longint). }
  procedure tcgcpu.g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);
    var
      wordreg, countreg: TRegister;
      src, dst, fixedsrc, fixeddst: TReference;
      looplabel: tasmlabel;
      words, i: aint;

    { a reference can be used as is when it is a plain base(+offset) one }
    function reference_is_reusable(const ref: treference): boolean;
      begin
        result:=(ref.symbol=nil) and (ref.index=NR_NO) and (ref.base<>NR_NO);
      end;

    { picks the reference the copy works on: the fixed reference itself for
      short copies of reusable references, otherwise a fresh reference whose
      base register holds the address of fixed }
    procedure prepare_ref(const fixed: treference; var work: treference);
      begin
        if (words<=4) and reference_is_reusable(fixed) then
          work:=fixed
        else
          begin
            reference_reset(work,sizeof(aint),[]);
            work.base:=GetAddressRegister(list);
            a_loadaddr_ref_reg(list,fixed,work.base);
          end;
      end;

    { copies one item of the given size through a fresh register and moves
      both working offsets on by advance bytes }
    procedure copy_item(size: tcgsize; advance: longint);
      var
        itemreg: TRegister;
      begin
        itemreg:=GetIntRegister(list,OS_INT);
        a_load_ref_reg(list,size,size,src,itemreg);
        a_load_reg_ref(list,size,size,itemreg,dst);
        Inc(src.offset,advance);
        Inc(dst.offset,advance);
      end;

    begin
      fixedsrc:=source;
      fixref(list,fixedsrc);
      fixeddst:=dest;
      fixref(list,fixeddst);
      if len > high(longint) then
        internalerror(2002072704);

      { A call (to FPC_MOVE) needs the outgoing parameter area on the stack,
        which has to be reserved before the second pass.  Other internal
        procedures arrange that by setting pi_do_call during the first pass,
        which is not possible here, so a leaf procedure must stay a leaf:
        the call is only used when pi_do_call is already set.
        The threshold of 100 bytes is an untuned guess. }
      if (len > 100) and
         assigned(current_procinfo) and
         (pi_do_call in current_procinfo.flags) then
        begin
          g_concatcopy_move(list, fixedsrc, fixeddst, len);
          exit;
        end;

      words:=len div 4;
      prepare_ref(fixedsrc,src);
      prepare_ref(fixeddst,dst);

      { counted loop for more than four words }
      if words>4 then
        begin
          countreg:=GetIntRegister(list, OS_INT);
          wordreg:=GetIntRegister(list, OS_INT);
          a_load_const_reg(list, OS_INT, words, countreg);
          current_asmdata.getjumplabel(looplabel);
          a_label(list, looplabel);
          list.concat(taicpu.op_reg_ref(A_L32I, wordreg, src));
          list.concat(taicpu.op_reg_ref(A_S32I, wordreg, dst));
          list.concat(taicpu.op_reg_reg_const(A_ADDI, src.base, src.base, 4));
          list.concat(taicpu.op_reg_reg_const(A_ADDI, dst.base, dst.base, 4));
          list.concat(taicpu.op_reg_reg_const(A_ADDI, countreg, countreg, -1));
          a_cmp_const_reg_label(list,OS_INT,OC_GT,0,countreg,looplabel);
          { keep the registers alive }
          list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
          list.concat(taicpu.op_reg_reg(A_MOV,src.base,src.base));
          list.concat(taicpu.op_reg_reg(A_MOV,dst.base,dst.base));
          len:=len mod 4;
        end;

      { straight-line copy of the (at most four) remaining words }
      words:=len div 4;
      if words>0 then
        begin
          wordreg:=GetIntRegister(list, OS_INT);
          for i:=1 to words do
            begin
              list.concat(taicpu.op_reg_ref(A_L32I, wordreg, src));
              list.concat(taicpu.op_reg_ref(A_S32I, wordreg, dst));
              Inc(src.offset, 4);
              Inc(dst.offset, 4);
            end;
          len:=len mod 4;
        end;

      { for a non-negative len the reductions above leave len below 4, so
        this word-sized case does not trigger; it is kept as in the original }
      if (len and 4)<>0 then
        copy_item(OS_32,4);
      { copy the leftovers }
      if (len and 2)<>0 then
        copy_item(OS_16,2);
      if (len and 1)<>0 then
        copy_item(OS_8,0);
    end;
  { Emits a MOV with the PF_S postfix copying reg1 into reg2.

    Only fromsize OS_32 or OS_F32 is accepted, anything else raises internal
    error 2020032603.  tosize is not inspected. }
  procedure tcgcpu.a_loadfpu_reg_reg(list: TAsmList; fromsize,tosize: tcgsize; reg1, reg2: tregister);
    var
      move: taicpu;
    begin
      if (fromsize<>OS_32) and (fromsize<>OS_F32) then
        InternalError(2020032603);
      move:=taicpu.op_reg_reg(A_MOV,reg2,reg1);
      move.oppostfix:=PF_S;
      list.concat(move);
    end;
  { Loads an FPU register from memory with LSI.

    The reference is used directly only when it has no symbol, no index and
    a word-aligned offset within 0..1020; otherwise it is passed through
    fixref first.  When fromsize and tosize differ, a_loadfpu_reg_reg is
    applied to the loaded register afterwards.
    Only fromsize OS_32 or OS_F32 is accepted (internal error 2020032602). }
  procedure tcgcpu.a_loadfpu_ref_reg(list: TAsmList; fromsize,tosize: tcgsize; const ref: treference; reg: tregister);
    var
      memref: treference;
      usable_as_is: boolean;
    begin
      if (fromsize<>OS_32) and (fromsize<>OS_F32) then
        InternalError(2020032602);
      memref:=ref;
      usable_as_is:=not assigned(memref.symbol) and
        (memref.index=NR_NO) and
        (memref.offset>=0) and (memref.offset<=1020) and (memref.offset mod 4=0);
      if not usable_as_is then
        fixref(list,memref);
      list.concat(taicpu.op_reg_ref(A_LSI,reg,memref));
      if fromsize<>tosize then
        a_loadfpu_reg_reg(list,fromsize,tosize,reg,reg);
    end;
  { Stores an FPU register to memory with SSI.

    The reference is used directly only when it has no symbol, no index and
    a word-aligned offset within 0..1020; otherwise it is passed through
    fixref first.
    Only fromsize OS_32 or OS_F32 is accepted (internal error 2020032604);
    tosize is not inspected. }
  procedure tcgcpu.a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference);
    var
      memref: treference;
      usable_as_is: boolean;
    begin
      if (fromsize<>OS_32) and (fromsize<>OS_F32) then
        InternalError(2020032604);
      memref:=ref;
      usable_as_is:=not assigned(memref.symbol) and
        (memref.index=NR_NO) and
        (memref.offset>=0) and (memref.offset<=1020) and (memref.offset mod 4=0);
      if not usable_as_is then
        fixref(list,memref);
      list.concat(taicpu.op_reg_ref(A_SSI,reg,memref));
    end;
  { Re-normalises dst after an operation on a sub-32-bit size.

    For MUL, SHL, ADD, SUB and NEG on 8 or 16 bit sizes the register is
    reloaded onto itself from OS_32 to size; all other combinations are
    left untouched. }
  procedure tcgcpu.maybeadjustresult(list : TAsmList; op : TOpCg; size : tcgsize; dst : tregister);
    begin
      if not (size in [OS_8,OS_S8,OS_16,OS_S16]) then
        exit;
      if op in [OP_MUL,OP_SHL,OP_ADD,OP_SUB,OP_NEG] then
        a_load_reg_reg(list,OS_32,size,dst,dst);
    end;
  { Overflow check hook: intentionally emits nothing, overflow checking is
    not implemented for this target yet. }
  procedure tcgcpu.g_overflowcheck(list: TAsmList; const Loc: tlocation; def: tdef);
    begin
      { no overflow checking yet }
    end;
  { 64 bit three-operand operation: regdst := regsrc2 op regsrc1.

    Supported operations:
      OP_AND, OP_OR, OP_XOR  - applied independently to both halves.
      OP_ADD, OP_SUB         - low and high halves are computed into
                               temporaries, the carry/borrow out of the low
                               half is folded into the high half with a
                               compare-and-branch, and only then are both
                               halves copied into regdst.
    OP_NEG/OP_NOT raise internal error 2020030810, every other operation
    internal error 2020030813.

    Two's complement addition and subtraction produce the same bit pattern
    for signed and unsigned operands, so size does not select different
    code paths.  Computing into temporaries keeps the sources intact until
    the carry test is done, also when regdst overlaps one of the sources. }
  procedure tcg64fxtensa.a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);
    var
      tmplo, tmphi: TRegister;
      instr: taicpu;
      no_carry: TAsmLabel;
    begin
      case op of
        OP_NEG,
        OP_NOT :
          internalerror(2020030810);
        OP_AND,OP_OR,OP_XOR:
          begin
            cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reglo,regsrc2.reglo,regdst.reglo);
            cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reghi,regsrc2.reghi,regdst.reghi);
          end;
        OP_ADD:
          begin
            tmplo:=cg.GetIntRegister(list,OS_S32);
            tmphi:=cg.GetIntRegister(list,OS_S32);
            list.concat(taicpu.op_reg_reg_reg(A_ADD, tmplo, regsrc2.reglo, regsrc1.reglo));
            list.concat(taicpu.op_reg_reg_reg(A_ADD, tmphi, regsrc2.reghi, regsrc1.reghi));
            { the low sum wrapped around iff it is (unsigned) below one of
              the addends; skip the increment when it did not }
            current_asmdata.getjumplabel(no_carry);
            instr:=taicpu.op_reg_reg_sym(A_B, tmplo, regsrc2.reglo, no_carry);
            instr.condition:=C_GEU;
            list.concat(instr);
            list.concat(taicpu.op_reg_reg_const(A_ADDI, tmphi, tmphi, 1));
            cg.a_label(list,no_carry);
            cg.a_load_reg_reg(list,OS_INT,OS_INT,tmplo,regdst.reglo);
            cg.a_load_reg_reg(list,OS_INT,OS_INT,tmphi,regdst.reghi);
          end;
        OP_SUB:
          begin
            tmplo:=cg.GetIntRegister(list,OS_S32);
            tmphi:=cg.GetIntRegister(list,OS_S32);
            list.concat(taicpu.op_reg_reg_reg(A_SUB, tmplo, regsrc2.reglo, regsrc1.reglo));
            list.concat(taicpu.op_reg_reg_reg(A_SUB, tmphi, regsrc2.reghi, regsrc1.reghi));
            { a borrow happened iff the low difference is (unsigned) above
              the minuend; skip the decrement when it did not }
            current_asmdata.getjumplabel(no_carry);
            instr:=taicpu.op_reg_reg_sym(A_B, regsrc2.reglo, tmplo, no_carry);
            instr.condition:=C_GEU;
            list.concat(instr);
            list.concat(taicpu.op_reg_reg_const(A_ADDI, tmphi, tmphi, -1));
            cg.a_label(list,no_carry);
            cg.a_load_reg_reg(list,OS_INT,OS_INT,tmplo,regdst.reglo);
            cg.a_load_reg_reg(list,OS_INT,OS_INT,tmphi,regdst.reghi);
          end;
        else
          internalerror(2020030813);
      end;
    end;
  { 64 bit two-operand operation.

      OP_NEG : regdst := -regsrc
      OP_NOT : regdst := not regsrc (both halves independently)
      other  : forwarded to a_op64_reg_reg_reg with regdst as second source
               and destination.

    Negation: the low half is simply negated.  The high half of the result
    is -hi when the low half is zero and -hi-1 otherwise (the low half then
    borrows from the high half), so the decremented value has to be selected
    when the negated low half is NOT zero. }
  procedure tcg64fxtensa.a_op64_reg_reg(list : TAsmList; op : TOpCG; size : tcgsize; regsrc,regdst : tregister64);
    var
      tmpreg : TRegister;
      instr : taicpu;
    begin
      case op of
        OP_NEG:
          begin
            tmpreg:=cg.GetIntRegister(list, OS_INT);
            list.concat(taicpu.op_reg_reg(A_NEG,regdst.reglo,regsrc.reglo));
            list.concat(taicpu.op_reg_reg(A_NEG,regdst.reghi,regsrc.reghi));
            { tmpreg := -hi-1, used when the low half is non-zero }
            list.concat(taicpu.op_reg_reg_const(A_ADDI,tmpreg,regdst.reghi,-1));
            instr:=taicpu.op_reg_reg_reg(A_MOV,regdst.reghi,tmpreg,regdst.reglo);
            instr.condition:=C_NEZ;
            list.concat(instr);
          end;
        OP_NOT:
          begin
            cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
            cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
          end;
        else
          a_op64_reg_reg_reg(list,op,size,regsrc,regdst,regdst);
      end;
    end;
  { 64 bit operation with a constant: regdst := regsrc op value.

      OP_AND, OP_OR, OP_XOR - applied to both halves with lo(value)/hi(value).
      OP_ADD                - values in -2048..2047 use an immediate add on
                              the low half plus a carry (value>=0) or borrow
                              (value<0) correction of the high half; other
                              values are loaded into a register pair and
                              forwarded to a_op64_reg_reg_reg.
      OP_SUB                - always goes through a register pair.
    OP_NEG/OP_NOT raise internal error 2020030904, every other operation
    internal error 2020030901.

    The immediate add is computed into temporaries and copied to regdst at
    the end, so both result halves are always written and regsrc stays
    intact until the carry test is done, also when regdst is regsrc. }
  procedure tcg64fxtensa.a_op64_const_reg_reg(list : TAsmList; op : TOpCG; size : tcgsize; value : int64; regsrc,regdst : tregister64);
    var
      tmplo,tmphi : tregister;
      tmpreg64 : tregister64;
      no_carry : TAsmLabel;
      instr : taicpu;
    begin
      case op of
        OP_NEG,
        OP_NOT :
          internalerror(2020030904);
        OP_AND,OP_OR,OP_XOR:
          begin
            cg.a_op_const_reg_reg(list,op,OS_32,aint(lo(value)),regsrc.reglo,regdst.reglo);
            cg.a_op_const_reg_reg(list,op,OS_32,aint(hi(value)),regsrc.reghi,regdst.reghi);
          end;
        OP_ADD:
          begin
            { could do better here (hi(value) in 248..2047), for now we support only the simple cases }
            if (value>=-2048) and (value<=2047) then
              begin
                tmplo:=cg.GetIntRegister(list,OS_S32);
                tmphi:=cg.GetIntRegister(list,OS_S32);
                list.concat(taicpu.op_reg_reg_const(A_ADDI, tmplo, regsrc.reglo, value));
                cg.a_load_reg_reg(list,OS_INT,OS_INT,regsrc.reghi,tmphi);
                current_asmdata.getjumplabel(no_carry);
                if value>=0 then
                  begin
                    { adding a non-negative value: the low half carried iff
                      the sum is (unsigned) below the original low half }
                    instr:=taicpu.op_reg_reg_sym(A_B, tmplo, regsrc.reglo, no_carry);
                    instr.condition:=C_GEU;
                    list.concat(instr);
                    list.concat(taicpu.op_reg_reg_const(A_ADDI, tmphi, tmphi, 1));
                  end
                else
                  begin
                    { adding a negative value subtracts its magnitude: the
                      low half borrowed iff the result is (unsigned) above
                      the original low half }
                    instr:=taicpu.op_reg_reg_sym(A_B, regsrc.reglo, tmplo, no_carry);
                    instr.condition:=C_GEU;
                    list.concat(instr);
                    list.concat(taicpu.op_reg_reg_const(A_ADDI, tmphi, tmphi, -1));
                  end;
                cg.a_label(list,no_carry);
                cg.a_load_reg_reg(list,OS_INT,OS_INT,tmplo,regdst.reglo);
                cg.a_load_reg_reg(list,OS_INT,OS_INT,tmphi,regdst.reghi);
              end
            else
              begin
                tmpreg64.reglo := cg.GetIntRegister(list,OS_S32);
                tmpreg64.reghi := cg.GetIntRegister(list,OS_S32);
                a_load64_const_reg(list,value,tmpreg64);
                a_op64_reg_reg_reg(list,op,size,tmpreg64,regsrc,regdst);
              end;
          end;
        OP_SUB:
          begin
            { for now, we take the simple approach }
            tmpreg64.reglo := cg.GetIntRegister(list,OS_S32);
            tmpreg64.reghi := cg.GetIntRegister(list,OS_S32);
            a_load64_const_reg(list,value,tmpreg64);
            a_op64_reg_reg_reg(list,op,size,tmpreg64,regsrc,regdst);
          end;
        else
          internalerror(2020030901);
      end;
    end;
  { In-place variant of a_op64_const_reg_reg: reg := reg op value. }
  procedure tcg64fxtensa.a_op64_const_reg(list : TAsmList; op : TOpCG; size : tcgsize; value : int64; reg : tregister64);
    begin
      { source and destination are the same register pair }
      a_op64_const_reg_reg(list,op,size,value,reg,reg);
    end;
  1262. {$warnings off}
  { Instantiates the code generator objects of this unit and stores them in
    the cg and cg64 variables. }
  procedure create_codegen;
    begin
      cg:=tcgcpu.Create;
      cg64:=tcg64fxtensa.Create;
    end;
  1268. end.