cgcpu.pas 52 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371
  1. {
  2. Copyright (c) 2014 by Jonas Maebe
  3. This unit implements the code generator for Xtensa
  4. This program is free software; you can redistribute it and/or modify
  5. it under the terms of the GNU General Public License as published by
  6. the Free Software Foundation; either version 2 of the License, or
  7. (at your option) any later version.
  8. This program is distributed in the hope that it will be useful,
  9. but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  11. GNU General Public License for more details.
  12. You should have received a copy of the GNU General Public License
  13. along with this program; if not, write to the Free Software
  14. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  15. ****************************************************************************
  16. }
  17. unit cgcpu;
  18. {$i fpcdefs.inc}
  19. interface
  20. uses
  21. globtype,parabase,
  22. cgbase,cgutils,cgobj,
  23. aasmbase,aasmtai,aasmdata,aasmcpu,
  24. cpubase,cpuinfo,
  25. node,symconst,SymType,symdef,
  26. rgcpu,
  27. cg64f32;
  28. type
  { Xtensa specific implementation of the generic code generator (tcg). }
  tcgcpu=class(tcg)
  private
    { rewrites ref so that only a base register remains
      (symbol, index and offset are folded into registers) }
    procedure fixref(list : TAsmList; var ref : treference);
    procedure g_concatcopy_move(list : tasmlist; const Source,dest : treference; len : tcgint);
  public
    { register allocator life cycle }
    procedure init_register_allocators;override;
    procedure done_register_allocators;override;

    { move instructions }
    procedure a_load_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister);override;
    procedure a_load_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister;const ref: TReference);override;
    procedure a_load_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: TReference; reg: tregister);override;
    procedure a_load_const_reg(list: TAsmList; size: tcgsize; a: tcgint; reg: tregister);override;
    procedure a_loadaddr_ref_reg(list: TAsmList; const ref: TReference; r: tregister);override;

    { arithmetic and logical operations }
    procedure a_op_reg_reg(list: TAsmList; op: topcg; size: tcgsize; src, dst: tregister);override;
    procedure a_op_const_reg(list: TAsmList; op: topcg; size: tcgsize; a: tcgint; reg: tregister);override;
    procedure a_op_reg_reg_reg(list: TAsmList; op: topcg; size: tcgsize; src1, src2, dst: tregister);override;
    procedure a_op_const_reg_reg(list : TAsmList; op : TOpCg; size : tcgsize; a : tcgint; src,dst : tregister);override;

    { calls, jumps and procedure entry/exit code }
    procedure a_call_name(list:TAsmList;const s:string; weak: boolean);override;
    procedure a_call_reg(list:TAsmList;Reg:tregister);override;
    procedure a_jmp_name(list: TAsmList; const s: string);override;
    procedure a_jmp_flags(list: TAsmList; const f: TResFlags; l: tasmlabel);override;
    procedure g_proc_entry(list: TAsmList; localsize: longint; nostackframe: boolean);override;
    procedure g_proc_exit(list: TAsmList; parasize: longint; nostackframe: boolean);override;

    { comparison operations }
    procedure a_cmp_const_reg_label(list: TAsmList; size: tcgsize; cmp_op: topcmp; a: tcgint; reg: tregister; l: tasmlabel); override;
    procedure a_cmp_reg_reg_label(list: TAsmList; size: tcgsize; cmp_op: topcmp; reg1, reg2: tregister; l: tasmlabel);override;
    procedure a_jmp_always(list: TAsmList; l: TAsmLabel);override;
    procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: tresflags; reg: TRegister);override;

    { block copies }
    procedure g_concatcopy(list : TAsmList; const source,dest : treference; len : tcgint);override;

    { floating point register moves }
    procedure a_loadfpu_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister);override;
    procedure a_loadfpu_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister);override;
    procedure a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference);override;

    { called after every emitted operation with the operation, its size
      and the destination register }
    procedure maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
    procedure g_overflowcheck(list: TAsmList; const Loc:tlocation; def:tdef);override;
  end;
  { 64-bit operations for Xtensa, built on top of the generic
    "64 bit on a 32 bit cpu" code generator (tcg64f32). }
  tcg64fxtensa = class(tcg64f32)
    procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
    procedure a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);override;
    procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
    procedure a_op64_reg_reg_reg(list : TAsmList; op : TOpCG;size : tcgsize; regsrc1,regsrc2,regdst : tregister64);override;
    { overrides that are currently disabled: }
    //procedure a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
    //procedure a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
    //procedure a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);override;
    //procedure a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);override;
  end;
  76. procedure create_codegen;
  const
    { Xtensa opcode used for each generic operation; A_NONE marks operations
      that have no entry in this table.
      NOTE(review): the per-entry labels assume the usual declaration order
      of topcg in cgbase - confirm against that unit. }
    TOpCG2AsmOp: array[topcg] of TAsmOp = (
      A_NONE,   { OP_NONE }
      A_MOV,    { OP_MOVE }
      A_ADD,    { OP_ADD  }
      A_AND,    { OP_AND  }
      A_NONE,   { OP_DIV  }
      A_NONE,   { OP_IDIV }
      A_MULL,   { OP_IMUL }
      A_MULL,   { OP_MUL  }
      A_NEG,    { OP_NEG  }
      A_NONE,   { OP_NOT  }
      A_OR,     { OP_OR   }
      A_SRA,    { OP_SAR  }
      A_SLL,    { OP_SHL  }
      A_SRL,    { OP_SHR  }
      A_SUB,    { OP_SUB  }
      A_XOR,    { OP_XOR  }
      A_NONE,   { OP_ROL  }
      A_NONE    { OP_ROR  }
    );

    {
      Disabled tables, kept for reference only. They use mnemonics that do
      not occur anywhere else in this unit.

      TOpCG2AsmOpReg: array[topcg] of TAsmOp = (
        A_NONE,A_MOV,A_ADD,A_AND,A_UDIV,A_SDIV,A_MUL,A_MUL,A_NEG,A_MVN,A_ORR,A_ASRV,A_LSLV,A_LSRV,A_SUB,A_EOR,A_NONE,A_RORV
      );
      TOpCG2AsmOpImm: array[topcg] of TAsmOp = (
        A_NONE,A_MOV,A_ADD,A_AND,A_UDIV,A_SDIV,A_MUL,A_MUL,A_NEG,A_MVN,A_ORR,A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR
      );
      TOpCmp2AsmCond: array[topcmp] of TAsmCond = (C_NONE,C_EQ,C_GT,
        C_LT,C_GE,C_LE,C_NE,C_LS,C_CC,C_CS,C_HI
      );
    }
  92. implementation
  93. uses
  94. globals,verbose,systems,cutils,
  95. paramgr,fmodule,
  96. symtable,symsym,
  97. tgobj,
  98. procinfo,cpupi;
  const
    { Branch condition used for each generic comparison; C_None marks
      comparisons without an entry in this table.
      NOTE(review): the per-entry labels assume the usual declaration order
      of TOpCmp in cgbase - confirm against that unit. }
    TOpCmp2AsmCond: array[TOpCmp] of TAsmCond = (
      C_None,   { OC_NONE }
      C_EQ,     { OC_EQ   }
      C_None,   { OC_GT   }
      C_LT,     { OC_LT   }
      C_GE,     { OC_GTE  }
      C_None,   { OC_LTE  }
      C_NE,     { OC_NE   }
      C_None,   { OC_BE   }
      C_LTU,    { OC_B    }
      C_GEU,    { OC_AE   }
      C_None    { OC_A    }
    );
  { Creates the register allocators for the integer (A), floating point (F)
    and special (B) register files. }
  procedure tcgcpu.init_register_allocators;
    begin
      inherited init_register_allocators;

      case target_info.abi of
        abi_xtensa_call0:
          { a8 and a15 are kept out of the allocatable set for call0 }
          rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
            [RS_A2,RS_A3,RS_A4,RS_A5,RS_A6,RS_A7,RS_A9,
             RS_A10,RS_A11,RS_A12,RS_A13,RS_A14],
            first_int_imreg,[]);
        else
          { every other ABI may allocate a2..a15 }
          rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
            [RS_A2,RS_A3,RS_A4,RS_A5,RS_A6,RS_A7,RS_A8,RS_A9,
             RS_A10,RS_A11,RS_A12,RS_A13,RS_A14,RS_A15],
            first_int_imreg,[]);
      end;

      rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
        [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7,
         RS_F8,RS_F9,RS_F10,RS_F11,RS_F12,RS_F13,RS_F14,RS_F15],
        first_fpu_imreg,[]);

      rg[R_SPECIALREGISTER]:=trgcpu.create(R_SPECIALREGISTER,R_SUBNONE,
        [RS_B0,RS_B1,RS_B2,RS_B3,RS_B4,RS_B5,RS_B6,RS_B7,
         RS_B8,RS_B9,RS_B10,RS_B11,RS_B12,RS_B13,RS_B14,RS_B15],
        first_flag_imreg,[]);
    end;
  { Releases the three allocators created by init_register_allocators and
    then lets the inherited implementation finish the cleanup. }
  procedure tcgcpu.done_register_allocators;
    begin
      { integer registers }
      rg[R_INTREGISTER].free;
      { floating point registers }
      rg[R_FPUREGISTER].free;
      { special (B) registers }
      rg[R_SPECIALREGISTER].free;

      inherited done_register_allocators;
    end;
  { Copies reg1 into reg2, zero or sign extending the value when fromsize
    and tosize differ. A plain MOV is only emitted when no extension
    instruction was generated and the registers differ. }
  procedure tcgcpu.a_load_reg_reg(list : TAsmList; fromsize,tosize : tcgsize;
    reg1,reg2 : tregister);

    { sign extends the low "bits" bits of reg1 into reg2, using SEXT when the
      cpu offers it and a shift left/arithmetic shift right pair otherwise }
    procedure sign_extend_low_bits(bits : longint);
      begin
        if CPUXTENSA_HAS_SEXT in cpu_capabilities[current_settings.cputype] then
          list.concat(taicpu.op_reg_reg_const(A_SEXT,reg2,reg1,bits-1))
        else
          begin
            list.concat(taicpu.op_reg_reg_const(A_SLLI,reg2,reg1,32-bits));
            list.concat(taicpu.op_reg_reg_const(A_SRAI,reg2,reg2,32-bits));
          end;
      end;

    var
      converted : Boolean;
      movinstr : taicpu;
    begin
      if (tcgsize2size[fromsize]>32) or (tcgsize2size[tosize]>32) or (fromsize=OS_NO) or (tosize=OS_NO) then
        internalerror(2020030710);

      converted:=tosize<>fromsize;
      if converted then
        begin
          { when narrowing (or keeping the width) the target size decides
            which extension is applied }
          if tcgsize2size[tosize]<=tcgsize2size[fromsize] then
            fromsize:=tosize;
          case fromsize of
            OS_8:
              list.concat(taicpu.op_reg_reg_const_const(A_EXTUI,reg2,reg1,0,8));
            OS_S8:
              begin
                sign_extend_low_bits(8);
                { a signed byte stored in an unsigned 16 bit value: cut off
                  the upper half again }
                if tosize=OS_16 then
                  list.concat(taicpu.op_reg_reg_const_const(A_EXTUI,reg2,reg2,0,16));
              end;
            OS_16:
              list.concat(taicpu.op_reg_reg_const_const(A_EXTUI,reg2,reg1,0,16));
            OS_S16:
              sign_extend_low_bits(16);
            else
              { nothing emitted, fall back to the plain move below }
              converted:=false;
          end;
        end;

      if (reg1<>reg2) and not converted then
        begin
          movinstr:=taicpu.op_reg_reg(A_MOV,reg2,reg1);
          list.Concat(movinstr);
          { tell the register allocator about the move so it can try to
            coalesce it away }
          add_move_instruction(movinstr);
        end;
    end;
  { Stores reg to the memory location ref using the store instruction that
    matches tosize. References the instruction cannot encode directly are
    first simplified with fixref. }
  procedure tcgcpu.a_load_reg_ref(list : TAsmList; fromsize,tosize : tcgsize;
    reg : tregister; const ref : TReference);
    var
      storeop : TAsmOp;
      maxoffset,
      granularity : longint;
      target : treference;
    begin
      if TCGSize2Size[FromSize]>=TCGSize2Size[ToSize] then
        FromSize:=ToSize;

      { pick the store opcode together with the largest offset and the
        offset granularity it accepts }
      case tosize of
        OS_8,OS_S8:
          begin
            storeop:=A_S8I;
            maxoffset:=255;
            granularity:=1;
          end;
        OS_16,OS_S16:
          begin
            storeop:=A_S16I;
            maxoffset:=510;
            granularity:=2;
          end;
        OS_32,OS_S32:
          begin
            storeop:=A_S32I;
            maxoffset:=1020;
            granularity:=4;
          end;
        else
          InternalError(2020030804);
      end;

      target:=ref;
      if assigned(target.symbol) or
         (target.index<>NR_NO) or
         (target.offset<0) or
         (target.offset>maxoffset) or
         (target.offset mod granularity<>0) then
        fixref(list,target);

      list.concat(taicpu.op_reg_ref(storeop,reg,target));
    end;
  { Loads a value of size fromsize from ref into reg and converts it to
    tosize. References the load instruction cannot encode directly are first
    simplified with fixref. }
  procedure tcgcpu.a_load_ref_reg(list : TAsmList; fromsize,tosize : tcgsize;
    const ref : TReference; reg : tregister);
    var
      source : treference;
      loadop : TAsmOp;
      maxoffset,
      granularity : longint;
    begin
      { pick the load opcode together with the largest offset and the offset
        granularity it accepts }
      case fromsize of
        OS_8,
        OS_S8:
          begin
            { signed bytes are loaded with L8UI as well and sign extended
              below }
            loadop:=A_L8UI;
            maxoffset:=255;
            granularity:=1;
          end;
        OS_16:
          begin
            loadop:=A_L16UI;
            maxoffset:=510;
            granularity:=2;
          end;
        OS_S16:
          begin
            loadop:=A_L16SI;
            maxoffset:=510;
            granularity:=2;
          end;
        { 64 bit sizes only show up when tosize is smaller than fromsize, so
          only the low 32 bit are loaded }
        OS_64,OS_S64,
        OS_32,OS_S32:
          begin
            loadop:=A_L32I;
            maxoffset:=1020;
            granularity:=4;
          end;
        else
          internalerror(2020030801);
      end;

      source:=ref;
      if assigned(source.symbol) or
         (source.index<>NR_NO) or
         (source.offset<0) or
         (source.offset>maxoffset) or
         (source.offset mod granularity<>0) then
        fixref(list,source);

      list.concat(taicpu.op_reg_ref(loadop,reg,source));

      { sign extend a signed byte unless the target is a byte as well }
      if (fromsize=OS_S8) and not(tosize in [OS_S8,OS_8]) then
        begin
          if CPUXTENSA_HAS_SEXT in cpu_capabilities[current_settings.cputype] then
            list.concat(taicpu.op_reg_reg_const(A_SEXT,reg,reg,7))
          else
            begin
              list.concat(taicpu.op_reg_reg_const(A_SLLI,reg,reg,24));
              list.concat(taicpu.op_reg_reg_const(A_SRAI,reg,reg,24));
            end;
        end;

      { remaining size conversion is done in the register }
      if (fromsize<>tosize) and not(tosize in [OS_SINT,OS_INT]) then
        a_load_reg_reg(list,fromsize,tosize,reg,reg);
    end;
  { Loads the constant a into reg: values from -2048 to 2047 use MOVI, all
    other values are placed in the procedure's local data and fetched with
    L32R. }
  procedure tcgcpu.a_load_const_reg(list : TAsmList; size : tcgsize;
    a : tcgint; reg : tregister);
    var
      poolref : treference;
      poollabel : TAsmLabel;
    begin
      if (a>=-2048) and (a<=2047) then
        begin
          list.Concat(taicpu.op_reg_const(A_MOVI,reg,a));
          exit;
        end;

      { emit "label: .long a" into the local data of the current procedure }
      reference_reset(poolref,4,[]);
      current_asmdata.getjumplabel(poollabel);
      cg.a_label(current_procinfo.aktlocaldata,poollabel);
      current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(a)));

      { and load it through the label }
      poolref.symbol:=poollabel;
      list.concat(taicpu.op_reg_ref(A_L32R,reg,poolref));
    end;
  { Simplifies ref until it only consists of a base register: a symbol
    and/or offset is materialised in a register, base and index are added
    together, and on exit ref.index=NR_NO, ref.offset=0 and ref.symbol=nil. }
  procedure tcgcpu.fixref(list : TAsmList;var ref : treference);

    { makes reg part of ref: it becomes the base if there is none, else the
      index if there is none, else it is added to the base first }
    procedure merge_register(reg : tregister);
      begin
        if ref.base=NR_NO then
          ref.base:=reg
        else if ref.index=NR_NO then
          ref.index:=reg
        else
          begin
            list.concat(taicpu.op_reg_reg_reg(A_ADD,reg,ref.base,reg));
            ref.base:=reg;
          end;
      end;

    var
      hreg : tregister;
      poolref : treference;
      poollabel : tasmlabel;
    begin
      if assigned(ref.symbol) or (ref.offset<-2048) or (ref.offset>2047) then
        begin
          { symbol address or large offset: create an entry in the local
            data of the procedure ... }
          reference_reset(poolref,4,[]);
          current_asmdata.getjumplabel(poollabel);
          cg.a_label(current_procinfo.aktlocaldata,poollabel);
          if assigned(ref.symbol) then
            current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(ref.symbol,ref.offset))
          else if ref.offset<>0 then
            current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(ref.offset));

          { ... and load it with L32R }
          hreg:=getintregister(list,OS_INT);
          poolref.symbol:=poollabel;
          list.concat(taicpu.op_reg_ref(A_L32R,hreg,poolref));
          merge_register(hreg);
        end
      else if ref.offset<>0 then
        begin
          hreg:=getintregister(list,OS_INT);
          if (ref.offset>=-128) and (ref.offset<=127) then
            begin
              { small offset: add it straight to the base.
                NOTE(review): ref.base is used without checking it against
                NR_NO here - confirm callers always pass a base in this case }
              list.concat(taicpu.op_reg_reg_const(A_ADDI,hreg,ref.base,ref.offset));
              ref.base:=hreg;
            end
          else
            begin
              list.concat(taicpu.op_reg_const(A_MOVI,hreg,ref.offset));
              merge_register(hreg);
            end;
        end;

      { collapse base+index into a single base register }
      if ref.index<>NR_NO then
        begin
          if ref.base=NR_NO then
            ref.base:=ref.index
          else
            begin
              hreg:=getintregister(list,OS_INT);
              list.concat(taicpu.op_reg_reg_reg(A_ADD,hreg,ref.base,ref.index));
              ref.base:=hreg;
            end;
          ref.index:=NR_NO;
        end;

      ref.offset:=0;
      ref.symbol:=nil;
    end;
  { Computes the address described by ref and stores it in r. }
  procedure tcgcpu.a_loadaddr_ref_reg(list : TAsmList;
    const ref : TReference; r : tregister);
    var
      addr : treference;
      movinstr : taicpu;
    begin
      addr:=ref;

      { without a base register the index takes over that role }
      if addr.base=NR_NO then
        begin
          addr.base:=addr.index;
          addr.index:=NR_NO;
        end;

      { symbols are resolved by fixref }
      if assigned(addr.symbol) then
        fixref(list,addr);

      { an index without a base must not occur at this point }
      if (addr.base=NR_NO) and (addr.index<>NR_NO) then
        internalerror(200312022);

      if addr.index<>NR_NO then
        begin
          { r:=base+index(+offset) }
          a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,addr.base,addr.index,r);
          if addr.offset<>0 then
            a_op_const_reg_reg(list,OP_ADD,OS_ADDR,addr.offset,r,r);
          exit;
        end;

      if addr.base=NR_NO then
        { absolute address }
        a_load_const_reg(list,OS_ADDR,addr.offset,r)
      else if addr.offset<>0 then
        { r:=base+offset }
        a_op_const_reg_reg(list,OP_ADD,OS_ADDR,addr.offset,addr.base,r)
      else
        begin
          { r:=base; registered so the register allocator can remove it }
          movinstr:=taicpu.op_reg_reg(A_MOV,r,addr.base);
          list.concat(movinstr);
          add_move_instruction(movinstr);
        end;
    end;
  { Two operand form of an operation: dst:=dst op src. The unary operations
    OP_NEG and OP_NOT compute dst from src instead. }
  procedure tcgcpu.a_op_reg_reg(list : TAsmList; op : topcg; size : tcgsize; src,dst : tregister);
    var
      allones : TRegister;
    begin
      case op of
        OP_NEG:
          begin
            list.concat(taicpu.op_reg_reg(A_NEG,dst,src));
            maybeadjustresult(list,OP_NEG,size,dst);
          end;
        OP_NOT:
          begin
            { not x = x xor -1 }
            allones:=getintregister(list,size);
            list.concat(taicpu.op_reg_const(A_MOVI,allones,-1));
            list.concat(taicpu.op_reg_reg_reg(A_XOR,dst,allones,src));
            maybeadjustresult(list,OP_NOT,size,dst);
          end;
        else
          { everything else goes through the three operand form }
          a_op_reg_reg_reg(list,op,size,src,dst,dst);
      end;
    end;
  { Emits dst:=src op a, using immediate instruction forms where the
    constant allows it and a temporary register otherwise. }
  procedure tcgcpu.a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister);

    { dst:=src+value as an ADDMI followed by an ADDI }
    procedure add_in_two_steps(value : tcgint);
      begin
        list.concat(taicpu.op_reg_reg_const(A_ADDMI,dst,src,Smallint((value+128) and $ff00)));
        list.concat(taicpu.op_reg_reg_const(A_ADDI,dst,dst,Shortint(value and $ff)));
      end;

    var
      shiftcount : longint;
      constreg : TRegister;
    begin
      optimize_op_const(size, op, a);

      { operations the optimisation reduced to a plain copy or load }
      if op=OP_NONE then
        begin
          if src <> dst then
            a_load_reg_reg(list, size, size, src, dst);
          exit;
        end
      else if op=OP_MOVE then
        begin
          a_load_const_reg(list, size, a, dst);
          exit;
        end;

      { there could be added some more sophisticated optimizations }
      if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
        a_op_reg_reg(list,OP_NEG,size,src,dst)
      { multiplication by a power of two is done here rather than in the
        peephole optimizer because it saves a register }
      else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,shiftcount) then
        a_op_const_reg_reg(list,OP_SHL,size,shiftcount,src,dst)
      { additions: single ADDI, or ADDMI+ADDI for larger constants }
      else if (op=OP_ADD) and (a>=-128) and (a<=127) then
        list.concat(taicpu.op_reg_reg_const(A_ADDI,dst,src,a))
      else if (op=OP_ADD) and (a>=-128-32768) and (a<=127+32512) then
        begin
{$ifdef EXTDEBUG}
          list.concat(tai_comment.Create(strpnew('Value: '+tostr(a))));
{$endif EXTDEBUG}
          add_in_two_steps(a);
        end
      { subtractions are additions of the negated constant }
      else if (op=OP_SUB) and (a>=-127) and (a<=128) then
        list.concat(taicpu.op_reg_reg_const(A_ADDI,dst,src,-a))
      else if (op=OP_SUB) and (a>=-127-32512) and (a<=128+32768) then
        begin
{$ifdef EXTDEBUG}
          list.concat(tai_comment.Create(strpnew('Value: '+tostr(a))));
{$endif EXTDEBUG}
          add_in_two_steps(-a);
        end
      { shifts by a constant amount }
      else if (op=OP_SHL) and (a>=1) and (a<=31) then
        list.concat(taicpu.op_reg_reg_const(A_SLLI,dst,src,a))
      else if (op=OP_SAR) and (a>=0) and (a<=31) then
        list.concat(taicpu.op_reg_reg_const(A_SRAI,dst,src,a))
      else if (op=OP_SHR) and (a>=0) and (a<=15) then
        list.concat(taicpu.op_reg_reg_const(A_SRLI,dst,src,a))
      { larger logical right shifts extract the remaining upper bits }
      else if (op=OP_SHR) and (a>15) and (a<=31) then
        list.concat(taicpu.op_reg_reg_const_const(A_EXTUI,dst,src,a,32-a))
      { and with a mask of 1..16 consecutive low bits is a bit field extract }
      else if (op=OP_AND) and (63-BsrQWord(a)+PopCnt(QWord(a))=64) and (PopCnt(QWord(a))<=16) then
        list.concat(taicpu.op_reg_reg_const_const(A_EXTUI,dst,src,0,PopCnt(QWord(a))))
      else
        begin
          { generic case: load the constant and use the register form }
          constreg:=getintregister(list,size);
          a_load_const_reg(list,size,a,constreg);
          a_op_reg_reg_reg(list,op,size,constreg,src,dst);
        end;

      maybeadjustresult(list,op,size,dst);
    end;
  { reg:=reg op a; simply the three operand form with source and
    destination being the same register }
  procedure tcgcpu.a_op_const_reg(list : TAsmList; op : topcg; size : tcgsize; a : tcgint; reg : tregister);
    begin
      a_op_const_reg_reg(list,op,size,a,reg,reg);
    end;
  { Emits dst:=src2 op src1.

    - OP_NOT and OP_NEG are unary and compute dst from src1.
    - Shifts take the shift amount from src1 (via SSL/SSR) and shift src2.
    - OP_MOVE copies src1 to dst.
    - All other operations use the opcode from TOpCG2AsmOp.

    Fix: the OP_NOT case used to load -1 into a temporary register without
    ever combining it with the source, so dst was never written. It now
    emits the XOR with the all-ones value, the same sequence a_op_reg_reg
    uses. }
  procedure tcgcpu.a_op_reg_reg_reg(list : TAsmList; op : topcg;
    size : tcgsize; src1,src2,dst : tregister);
    var
      allones : TRegister;
    begin
      case op of
        OP_NOT:
          begin
            { not x = x xor -1 }
            allones:=getintregister(list,size);
            list.concat(taicpu.op_reg_const(A_MOVI,allones,-1));
            list.concat(taicpu.op_reg_reg_reg(A_XOR,dst,allones,src1));
            maybeadjustresult(list,op,size,dst);
          end;
        OP_NEG:
          begin
            list.concat(taicpu.op_reg_reg(A_NEG,dst,src1));
            maybeadjustresult(list,op,size,dst);
          end;
        OP_SAR,OP_SHL,OP_SHR:
          begin
            { set up the shift amount from src1, then shift src2 }
            if op=OP_SHL then
              list.concat(taicpu.op_reg(A_SSL,src1))
            else
              list.concat(taicpu.op_reg(A_SSR,src1));
            list.concat(taicpu.op_reg_reg(TOpCG2AsmOp[op],dst,src2));
            maybeadjustresult(list,op,size,dst);
          end;
        OP_MOVE:
          a_load_reg_reg(list,size,size,src1,dst);
        else
          begin
            list.concat(taicpu.op_reg_reg_reg(TOpCG2AsmOp[op],dst,src2,src1));
            maybeadjustresult(list,op,size,dst);
          end;
      end;
    end;
  { Calls the routine named s with the call instruction selected by the
    current procedure info; weak selects a weak symbol reference. }
  procedure tcgcpu.a_call_name(list : TAsmList; const s : string;
    weak : boolean);
    var
      target : TAsmSymbol;
    begin
      if weak then
        target:=current_asmdata.WeakRefAsmSymbol(s,AT_FUNCTION)
      else
        target:=current_asmdata.RefAsmSymbol(s,AT_FUNCTION);
      list.concat(taicpu.op_sym(txtensaprocinfo(current_procinfo).callins,target));
    end;
  { Calls the routine whose address is in Reg, using the indirect call
    instruction selected by the current procedure info. }
  procedure tcgcpu.a_call_reg(list : TAsmList; Reg : tregister);
    begin
      list.concat(
        taicpu.op_reg(txtensaprocinfo(current_procinfo).callxins,reg));
    end;
  { Jumps to the routine named s. }
  procedure tcgcpu.a_jmp_name(list : TAsmList; const s : string);
    var
      jump : taicpu;
    begin
      { A15 is passed as the register operand for now; this is not safe as
        A15 might contain an argument }
      jump:=TAiCpu.op_sym_reg(A_J,current_asmdata.RefAsmSymbol(s,AT_FUNCTION),NR_A15);
      { with the L postfix the assembler can convert the jump to JX if the
        destination is too far away for J }
      jump.oppostfix:=PF_L;
      jump.is_jmp:=true;
      list.Concat(jump);
    end;
  { Branches to l depending on the flag described by f. Only available on
    cpus with CPUXTENSA_HAS_BOOLEAN_OPTION; on any other cpu this is an
    internal error. }
  procedure tcgcpu.a_jmp_flags(list: TAsmList; const f: TResFlags; l: tasmlabel);
    var
      branch: taicpu;
    begin
      if not(CPUXTENSA_HAS_BOOLEAN_OPTION in cpu_capabilities[current_settings.cputype]) then
        Internalerror(2020070401)
      else
        begin
          { conditional branch on the register holding the flag }
          branch:=taicpu.op_reg_sym(A_B,f.register,l);
          branch.condition:=flags_to_cond(f.flag);
          list.concat(branch);
        end;
    end;
  { Generates the procedure prologue.

    call0 ABI: lowers the stack pointer by the (aligned) local size plus the
    register save area, stores the old frame pointer (a15) and the used
    non-volatile registers at the top of the new frame and, if a frame
    pointer is used, sets it up.

    windowed ABI: emits ENTRY; frames larger than 32760 bytes get a fixed
    ENTRY of 32 bytes and the rest is subtracted explicitly via MOVSP. }
  procedure tcgcpu.g_proc_entry(list : TAsmList; localsize : longint;
    nostackframe : boolean);
    var
      saveref : treference;
      regidx : byte;
      savedregs : tcpuregisterset;
      stack_parameters : Boolean;
      registerarea : PtrInt;
      poollabel : TAsmLabel;
    begin
      LocalSize:=align(LocalSize,4);
      stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
      { call instruction does not put anything on the stack }
      registerarea:=0;

      if nostackframe then
        begin
          { the windowed ABI still needs its ENTRY instruction }
          if target_info.abi=abi_xtensa_windowed then
            list.concat(taicpu.op_reg_const(A_ENTRY,NR_STACK_POINTER_REG,16));
          exit;
        end;

      savedregs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
      a_reg_alloc(list,NR_STACK_POINTER_REG);

      case target_info.abi of
        abi_xtensa_call0:
          begin
            { the frame pointer and the return address need saving too }
            if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
              Include(savedregs,RS_A15);
            if pi_do_call in current_procinfo.flags then
              Include(savedregs,RS_A0);

            { four bytes for every register that gets saved }
            for regidx:=RS_A0 to RS_A15 do
              if regidx in savedregs then
                inc(registerarea,4);
            inc(localsize,registerarea);

            if LocalSize<>0 then
              begin
                localsize:=align(localsize,current_settings.alignment.localalignmax);
                a_reg_alloc(list,NR_STACK_POINTER_REG);
                list.concat(taicpu.op_reg_reg_const(A_ADDI,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,-localsize));
              end;

            { registers are stored downwards starting at the top of the frame }
            reference_reset(saveref,4,[]);
            saveref.base:=NR_STACK_POINTER_REG;
            saveref.offset:=localsize;
            if saveref.offset>1024+32512 then
              { fix me! }
              Internalerror(2020031101)
            else if saveref.offset>1024 then
              begin
                { top of the frame is out of reach of a store offset: address
                  it through a8.
                  NOTE(review): after this split the remaining offset can be
                  smaller than the register save area, so the decrements
                  below may go negative - verify }
                list.concat(taicpu.op_reg_reg_const(A_ADDMI,NR_A8,NR_STACK_POINTER_REG,saveref.offset and $fffffc00));
                saveref.offset:=saveref.offset and $3ff;
                saveref.base:=NR_A8;
              end;

            if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
              begin
                { save the old a15, then make it the frame pointer }
                dec(saveref.offset,4);
                list.concat(taicpu.op_reg_ref(A_S32I,NR_A15,saveref));
                a_reg_alloc(list,NR_FRAME_POINTER_REG);
                list.concat(taicpu.op_reg_reg(A_MOV,NR_A15,NR_STACK_POINTER_REG));
              end;

            for regidx:=RS_A14 downto RS_A0 do
              if regidx in savedregs then
                begin
                  dec(saveref.offset,4);
                  list.concat(taicpu.op_reg_ref(A_S32I,newreg(R_INTREGISTER,regidx,R_SUBWHOLE),saveref));
                end;
          end;
        abi_xtensa_windowed:
          begin
            if stack_parameters and (pi_estimatestacksize in current_procinfo.flags) then
              begin
                { the frame size was fixed in advance and must be big enough }
                if localsize>txtensaprocinfo(current_procinfo).stackframesize then
                  internalerror(2020031402)
                else
                  localsize:=txtensaprocinfo(current_procinfo).stackframesize-registerarea;
              end
            else
              begin
                { default spill area }
                inc(localsize,4*4);
                { additional spill area? }
                if pi_do_call in current_procinfo.flags then
                  inc(localsize,txtensaprocinfo(current_procinfo).maxcall*4);
                localsize:=align(localsize,current_settings.alignment.localalignmax);
              end;

            if localsize<=32760 then
              list.concat(taicpu.op_reg_const(A_ENTRY,NR_STACK_POINTER_REG,localsize))
            else
              begin
                { ENTRY with a small fixed frame, the remainder is loaded
                  from the local data and subtracted from the stack pointer }
                list.concat(taicpu.op_reg_const(A_ENTRY,NR_STACK_POINTER_REG,32));
                reference_reset(saveref,4,[]);
                current_asmdata.getjumplabel(poollabel);
                cg.a_label(current_procinfo.aktlocaldata,poollabel);
                current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(longint(localsize-32)));
                saveref.symbol:=poollabel;
                list.concat(taicpu.op_reg_ref(A_L32R,NR_A8,saveref));
                list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_A8,NR_STACK_POINTER_REG,NR_A8));
                list.concat(taicpu.op_reg_reg(A_MOVSP,NR_STACK_POINTER_REG,NR_A8));
              end;
          end;
        else
          Internalerror(2020031401);
      end;
    end;
  { Generates the procedure epilogue.

    windowed ABI: a single RETW.

    call0 ABI: recomputes the frame layout the same way g_proc_entry does,
    reloads the saved a15 and the saved non-volatile registers from the top
    of the frame, releases the frame and returns with RET.

    Fix: for frames larger than 1024 bytes the saved registers are addressed
    through a8. The instruction computing a8 used to be left out here on the
    assumption that the value set up in the prologue is still intact, but a8
    is not protected in between (it is outside the call0 allocatable set and
    can be overwritten by calls made in the body). a8 is now recomputed from
    the stack pointer before it is used. }
  procedure tcgcpu.g_proc_exit(list : TAsmList; parasize : longint;
    nostackframe : boolean);
    var
      restoreref : treference;
      regidx : byte;
      savedregs : tcpuregisterset;
      stack_parameters : Boolean;
      registerarea : PtrInt;
      LocalSize : longint;
    begin
      case target_info.abi of
        abi_xtensa_windowed:
          list.Concat(taicpu.op_none(A_RETW));
        abi_xtensa_call0:
          begin
            if not(nostackframe) then
              begin
                LocalSize:=current_procinfo.calc_stackframe_size;
                LocalSize:=align(LocalSize,4);
                stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
                registerarea:=0;

                { same register set and save area size as in g_proc_entry }
                savedregs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
                if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
                  Include(savedregs,RS_A15);
                if pi_do_call in current_procinfo.flags then
                  Include(savedregs,RS_A0);
                for regidx:=RS_A0 to RS_A15 do
                  if regidx in savedregs then
                    inc(registerarea,4);
                inc(localsize,registerarea);

                if LocalSize<>0 then
                  begin
                    localsize:=align(localsize,current_settings.alignment.localalignmax);

                    { determine the reference required to access the top of
                      the frame }
                    reference_reset(restoreref,4,[]);
                    restoreref.base:=NR_STACK_POINTER_REG;
                    restoreref.offset:=localsize;
                    if restoreref.offset>1024 then
                      begin
                        if restoreref.offset<=1024+32512 then
                          begin
                            { out of reach of a load offset: address it
                              through a8, which has to be set up again here }
                            list.concat(taicpu.op_reg_reg_const(A_ADDMI,NR_A8,NR_STACK_POINTER_REG,restoreref.offset and $fffffc00));
                            restoreref.offset:=restoreref.offset and $3ff;
                            restoreref.base:=NR_A8;
                          end
                        else
                          { fix me! }
                          Internalerror(2020031102);
                      end;

                    { restore a15 if it was used as frame pointer }
                    if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
                      begin
                        dec(restoreref.offset,4);
                        list.concat(taicpu.op_reg_ref(A_L32I,NR_A15,restoreref));
                        a_reg_dealloc(list,NR_FRAME_POINTER_REG);
                      end;

                    { restore the remaining registers in the order they were
                      saved }
                    for regidx:=RS_A14 downto RS_A0 do
                      if regidx in savedregs then
                        begin
                          dec(restoreref.offset,4);
                          list.concat(taicpu.op_reg_ref(A_L32I,newreg(R_INTREGISTER,regidx,R_SUBWHOLE),restoreref));
                        end;

                    { release the frame }
                    list.concat(taicpu.op_reg_reg_const(A_ADDI,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,localsize));
                    a_reg_dealloc(list,NR_STACK_POINTER_REG);
                  end;
              end;
            list.Concat(taicpu.op_none(A_RET));
          end;
        else
          Internalerror(2020031403);
      end;
    end;
  { Emits a conditional branch to label l that compares register reg with the
    constant a using cmp_op.

    Three immediate forms are handled here:
      - a=0 with OC_EQ/OC_NE/OC_LT/OC_GTE      -> branch with a *Z condition
      - a accepted by is_b4const, same ops     -> branch with a *I condition
      - a accepted by is_b4constu, OC_B/OC_AE  -> branch with a *UI condition
    Everything else is delegated to the inherited implementation. }
  procedure tcgcpu.a_cmp_const_reg_label(list: TAsmList; size: tcgsize; cmp_op: topcmp; a: tcgint; reg: tregister; l: tasmlabel);

    { true if v is one of the constants accepted for the signed
      compare-with-immediate branches }
    function is_b4const(v: tcgint): boolean;
      begin
        case v of
          -1,
          1..8,
          10,12,16,32,64,128,256:
            result:=true;
          else
            result:=false;
        end;
      end;

    { true if v is one of the constants accepted for the unsigned
      compare-with-immediate branches }
    function is_b4constu(v: tcgint): boolean;
      begin
        case v of
          2..8,
          10,12,16,32,64,128,256,
          32768,65536:
            result:=true;
          else
            result:=false;
        end;
      end;

    { attaches the condition to the branch instruction and appends it to list }
    procedure emit_branch(branch: taicpu; cond: TAsmCond);
      begin
        branch.condition:=cond;
        list.concat(branch);
      end;

    const
      signed_ops = [OC_EQ,OC_NE,OC_LT,OC_GTE];
    var
      cond: TAsmCond;
    begin
      if (a=0) and (cmp_op in signed_ops) then
        begin
          { compare against zero }
          case cmp_op of
            OC_EQ:  cond:=C_EQZ;
            OC_NE:  cond:=C_NEZ;
            OC_LT:  cond:=C_LTZ;
            OC_GTE: cond:=C_GEZ;
            else
              Internalerror(2020030801);
          end;
          emit_branch(taicpu.op_reg_sym(A_B,reg,l),cond);
        end
      else if is_b4const(a) and (cmp_op in signed_ops) then
        begin
          { compare against an encodable signed immediate }
          case cmp_op of
            OC_EQ:  cond:=C_EQI;
            OC_NE:  cond:=C_NEI;
            OC_LT:  cond:=C_LTI;
            OC_GTE: cond:=C_GEI;
            else
              Internalerror(2020030801);
          end;
          emit_branch(taicpu.op_reg_const_sym(A_B,reg,a,l),cond);
        end
      else if is_b4constu(a) and (cmp_op in [OC_B,OC_AE]) then
        begin
          { compare against an encodable unsigned immediate }
          case cmp_op of
            OC_B:  cond:=C_LTUI;
            OC_AE: cond:=C_GEUI;
            else
              Internalerror(2020030801);
          end;
          emit_branch(taicpu.op_reg_const_sym(A_B,reg,a,l),cond);
        end
      else
        inherited a_cmp_const_reg_label(list, size, cmp_op, a, reg, l);
    end;
  { Emits a conditional branch to label l comparing two registers.

    If TOpCmp2AsmCond has no condition for cmp_op (C_None), the comparison
    is replaced by swap_opcmp(cmp_op) and the two register operands are
    exchanged. }
  procedure tcgcpu.a_cmp_reg_reg_label(list : TAsmList; size : tcgsize;
    cmp_op : topcmp; reg1,reg2 : tregister; l : tasmlabel);
    var
      branch: taicpu;
    begin
      if TOpCmp2AsmCond[cmp_op]<>C_None then
        { directly encodable: operands are emitted as reg2, reg1 }
        branch:=taicpu.op_reg_reg_sym(A_B,reg2,reg1,l)
      else
        begin
          { use the swapped comparison with the operands exchanged }
          cmp_op:=swap_opcmp(cmp_op);
          branch:=taicpu.op_reg_reg_sym(A_B,reg1,reg2,l);
        end;
      branch.condition:=TOpCmp2AsmCond[cmp_op];
      list.concat(branch);
    end;
  { Emits an unconditional jump to label l.

    Labels bound as AB_GLOBAL get a J instruction with the PF_L postfix and
    A15 as additional register operand; all other labels get a plain J. }
  procedure tcgcpu.a_jmp_always(list : TAsmList; l : TAsmLabel);
    var
      jump : taicpu;
    begin
      if l.bind=AB_GLOBAL then
        begin
          { for now, we use A15 here, however, this is not safe as it might
            contain an argument, I have not figured out a solution yet }
          jump:=taicpu.op_sym_reg(A_J,l,NR_A15);
          jump.oppostfix:=PF_L;
        end
      else
        jump:=taicpu.op_sym(A_J,l);
      jump.is_jmp:=true;
      list.concat(jump);
    end;
  { Materialises the flags f as 0/1 in reg.

    reg is preloaded with 0, a temporary register with 1, and a conditional
    move (condition derived from f.flag, tested on f.register) copies the
    temporary into reg. }
  procedure tcgcpu.g_flags2reg(list: TAsmList; size: TCgSize; const f: tresflags; reg: TRegister);
    var
      onereg: TRegister;
      condmove: taicpu;
    begin
      { default result }
      a_load_const_reg(list,size,0,reg);

      { value moved in when the condition holds }
      onereg:=getintregister(list,size);
      a_load_const_reg(list,size,1,onereg);

      condmove:=taicpu.op_reg_reg_reg(A_MOV,reg,onereg,f.register);
      condmove.condition:=flags_to_cond(f.flag);
      list.concat(condmove);
    end;
  { Copies len bytes from Source to dest by generating a call to FPC_MOVE.

    The parameter locations are taken from the system procedure 'MOVE';
    parameter 1 receives the address of Source, parameter 2 the address of
    dest and parameter 3 the byte count. }
  procedure tcgcpu.g_concatcopy_move(list: tasmlist; const Source, dest: treference; len: tcgint);
    var
      srcpara, dstpara, lenpara: TCGPara;
      movedef: tprocdef;
    begin
      movedef:=search_system_proc('MOVE');

      srcpara.init;
      dstpara.init;
      lenpara.init;
      paramanager.getcgtempparaloc(list, movedef, 1, srcpara);
      paramanager.getcgtempparaloc(list, movedef, 2, dstpara);
      paramanager.getcgtempparaloc(list, movedef, 3, lenpara);

      { parameters are loaded last to first }
      a_load_const_cgpara(list, OS_SINT, len, lenpara);
      a_loadaddr_ref_cgpara(list, dest, dstpara);
      a_loadaddr_ref_cgpara(list, Source, srcpara);
      paramanager.freecgpara(list, lenpara);
      paramanager.freecgpara(list, dstpara);
      paramanager.freecgpara(list, srcpara);

      { the volatile integer and fpu registers are allocated around the call }
      alloccpuregisters(list, R_INTREGISTER, paramanager.get_volatile_registers_int(pocall_default));
      alloccpuregisters(list, R_FPUREGISTER, paramanager.get_volatile_registers_fpu(pocall_default));
      a_call_name(list, 'FPC_MOVE', false);
      dealloccpuregisters(list, R_FPUREGISTER, paramanager.get_volatile_registers_fpu(pocall_default));
      dealloccpuregisters(list, R_INTREGISTER, paramanager.get_volatile_registers_int(pocall_default));

      lenpara.done;
      dstpara.done;
      srcpara.done;
    end;
  { Copies len bytes from source to dest.

    Strategy:
      - len > 100 and the current procedure already performs calls:
        delegate to g_concatcopy_move (call to FPC_MOVE)
      - more than four 32 bit words: generate a word copy loop
      - up to four words: generate unrolled L32I/S32I pairs
      - the remaining bytes are copied with 16 and 8 bit moves

    Raises internalerror(2002072704) if len exceeds high(longint). }
  procedure tcgcpu.g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);
    var
      wordreg, tailreg, counterreg: TRegister;
      srcref, dstref, fixedsrc, fixeddst: TReference;
      looplabel: tasmlabel;
      wordcount, i: aint;

    { a reference can be used as is (without loading its address into a new
      register) if it has a base register but neither index nor symbol }
    function reference_is_reusable(const ref: treference): boolean;
      begin
        result:=(ref.base<>NR_NO) and (ref.index=NR_NO) and
          (ref.symbol=nil);
      end;

    begin
      fixedsrc:=source;
      fixref(list,fixedsrc);
      fixeddst:=dest;
      fixref(list,fixeddst);

      if len > high(longint) then
        internalerror(2002072704);

      { A call (to FPC_MOVE) requires the outgoing parameter area to be properly
        allocated on stack. This can only be done before set_first_temp_offset
        (the original note names tmipsprocinfo), i.e. before secondpass. Other
        internal procedures request a correct stack frame by setting pi_do_call
        during firstpass, but for this particular one it is impossible.
        Therefore, if the current procedure is a leaf one, we have to leave it
        that way. }
      { anybody wants to determine a good value here :)? }
      if (len > 100) and
         assigned(current_procinfo) and
         (pi_do_call in current_procinfo.flags) then
        begin
          g_concatcopy_move(list, fixedsrc, fixeddst, len);
          exit;
        end;

      wordcount := len div 4;

      { source: reuse the reference for short copies, otherwise load its
        address into a fresh address register }
      if (wordcount<=4) and reference_is_reusable(fixedsrc) then
        srcref:=fixedsrc
      else
        begin
          reference_reset(srcref,sizeof(aint),[]);
          srcref.base := GetAddressRegister(list);
          a_loadaddr_ref_reg(list, fixedsrc, srcref.base);
        end;

      { destination: same treatment }
      if (wordcount<=4) and reference_is_reusable(fixeddst) then
        dstref:=fixeddst
      else
        begin
          reference_reset(dstref,sizeof(aint),[]);
          dstref.base := GetAddressRegister(list);
          a_loadaddr_ref_reg(list, fixeddst, dstref.base);
        end;

      { word copy loop }
      if wordcount > 4 then
        begin
          counterreg := GetIntRegister(list, OS_INT);
          wordreg := GetIntRegister(list, OS_INT);
          a_load_const_reg(list, OS_INT, wordcount, counterreg);
          current_asmdata.getjumplabel(looplabel);
          a_label(list, looplabel);
          list.concat(taicpu.op_reg_ref(A_L32I, wordreg, srcref));
          list.concat(taicpu.op_reg_ref(A_S32I, wordreg, dstref));
          list.concat(taicpu.op_reg_reg_const(A_ADDI, srcref.base, srcref.base, 4));
          list.concat(taicpu.op_reg_reg_const(A_ADDI, dstref.base, dstref.base, 4));
          list.concat(taicpu.op_reg_reg_const(A_ADDI, counterreg, counterreg, -1));
          a_cmp_const_reg_label(list,OS_INT,OC_GT,0,counterreg,looplabel);
          { keep the registers alive }
          list.concat(taicpu.op_reg_reg(A_MOV,counterreg,counterreg));
          list.concat(taicpu.op_reg_reg(A_MOV,srcref.base,srcref.base));
          list.concat(taicpu.op_reg_reg(A_MOV,dstref.base,dstref.base));
          len := len mod 4;
        end;

      { unrolled word copies for whatever whole words are left }
      wordcount := len div 4;
      if wordcount > 0 then
        begin
          wordreg := GetIntRegister(list, OS_INT);
          for i := 1 to wordcount do
            begin
              list.concat(taicpu.op_reg_ref(A_L32I, wordreg, srcref));
              list.concat(taicpu.op_reg_ref(A_S32I, wordreg, dstref));
              Inc(srcref.offset, 4);
              Inc(dstref.offset, 4);
            end;
          len := len mod 4;
        end;

      { one more word if bit 2 of the remaining length is set }
      if (len and 4) <> 0 then
        begin
          tailreg := GetIntRegister(list, OS_INT);
          a_load_ref_reg(list, OS_32, OS_32, srcref, tailreg);
          a_load_reg_ref(list, OS_32, OS_32, tailreg, dstref);
          Inc(srcref.offset, 4);
          Inc(dstref.offset, 4);
        end;

      { copy the leftovers: a half word ... }
      if (len and 2) <> 0 then
        begin
          tailreg := GetIntRegister(list, OS_INT);
          a_load_ref_reg(list, OS_16, OS_16, srcref, tailreg);
          a_load_reg_ref(list, OS_16, OS_16, tailreg, dstref);
          Inc(srcref.offset, 2);
          Inc(dstref.offset, 2);
        end;

      { ... and a final byte }
      if (len and 1) <> 0 then
        begin
          tailreg := GetIntRegister(list, OS_INT);
          a_load_ref_reg(list, OS_8, OS_8, srcref, tailreg);
          a_load_reg_ref(list, OS_8, OS_8, tailreg, dstref);
        end;
    end;
  { Copies floating point register reg1 to reg2 using MOV with the PF_S
    postfix.

    Only OS_32 and OS_F32 are accepted as fromsize; any other size raises
    InternalError(2020032603). tosize is not inspected. }
  procedure tcgcpu.a_loadfpu_reg_reg(list: TAsmList; fromsize,tosize: tcgsize; reg1, reg2: tregister);
    var
      move: taicpu;
    begin
      if (fromsize<>OS_32) and (fromsize<>OS_F32) then
        InternalError(2020032603);

      move:=taicpu.op_reg_reg(A_MOV,reg2,reg1);
      move.oppostfix:=PF_S;
      list.concat(move);
    end;
  { Loads a floating point value from memory reference ref into reg (LSI).

    Only OS_32 and OS_F32 are accepted as fromsize; any other size raises
    InternalError(2020032602). The reference is passed through fixref unless
    it is already symbol free, index free and has a 4 byte aligned offset in
    0..1020. If fromsize and tosize differ, a_loadfpu_reg_reg is invoked on
    reg afterwards. }
  procedure tcgcpu.a_loadfpu_ref_reg(list: TAsmList; fromsize,tosize: tcgsize; const ref: treference; reg: tregister);
    var
      loadref: treference;
      directly_usable: boolean;
    begin
      if (fromsize<>OS_32) and (fromsize<>OS_F32) then
        InternalError(2020032602);

      loadref:=ref;
      directly_usable:=
        (loadref.symbol=nil) and
        (loadref.index=NR_NO) and
        (loadref.offset>=0) and
        (loadref.offset<=1020) and
        (loadref.offset mod 4=0);
      if not directly_usable then
        fixref(list,loadref);

      list.concat(taicpu.op_reg_ref(A_LSI,reg,loadref));

      if fromsize<>tosize then
        a_loadfpu_reg_reg(list,fromsize,tosize,reg,reg);
    end;
  { Stores floating point register reg to memory reference ref (SSI).

    Only OS_32 and OS_F32 are accepted as fromsize; any other size raises
    InternalError(2020032604). The reference is passed through fixref unless
    it is already symbol free, index free and has a 4 byte aligned offset in
    0..1020. tosize is not inspected. }
  procedure tcgcpu.a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference);
    var
      storeref: treference;
      directly_usable: boolean;
    begin
      if (fromsize<>OS_32) and (fromsize<>OS_F32) then
        InternalError(2020032604);

      storeref:=ref;
      directly_usable:=
        (storeref.symbol=nil) and
        (storeref.index=NR_NO) and
        (storeref.offset>=0) and
        (storeref.offset<=1020) and
        (storeref.offset mod 4=0);
      if not directly_usable then
        fixref(list,storeref);

      list.concat(taicpu.op_reg_ref(A_SSI,reg,storeref));
    end;
  { Re-normalises dst after an operation on a sub-word type.

    For OP_MUL, OP_SHL, OP_ADD, OP_SUB and OP_NEG on 8 or 16 bit sizes
    (signed or unsigned) the register is reloaded into itself with a
    conversion from OS_32 to size; for every other combination nothing is
    emitted. }
  procedure tcgcpu.maybeadjustresult(list : TAsmList; op : TOpCg; size : tcgsize; dst : tregister);
    const
      ops_needing_fixup = [OP_MUL,OP_SHL,OP_ADD,OP_SUB,OP_NEG];
      subword_sizes = [OS_8,OS_S8,OS_16,OS_S16];
    begin
      if not(op in ops_needing_fixup) then
        exit;
      if size in subword_sizes then
        a_load_reg_reg(list,OS_32,size,dst,dst);
    end;
  { Overflow checking hook; intentionally generates no code. }
  procedure tcgcpu.g_overflowcheck(list: TAsmList; const Loc: tlocation; def: tdef);
    begin
      { no overflow checking yet }
    end;
  { 64 bit three operand operation: regdst := regsrc2 op regsrc1.

    Supported: OP_AND, OP_OR, OP_XOR (done per 32 bit half), OP_ADD and
    OP_SUB (32 bit operation on each half followed by a conditional +1/-1
    fix-up of the high half).

    Internal errors:
      2020030810 - OP_NEG / OP_NOT (not valid with three operands)
      2020082205 - OP_ADD with regsrc1 sharing its low or high register with regdst
      2020082206 - OP_SUB with regsrc1 sharing its low or high register with regdst
      2020030813 - any other operation }
  procedure tcg64fxtensa.a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);
    var
      skip_fixup: TAsmLabel;
      saved_lo: TRegister;
    begin
      case op of
        OP_NEG,
        OP_NOT:
          internalerror(2020030810);

        OP_AND,OP_OR,OP_XOR:
          begin
            { bitwise operations work independently on both halves }
            cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reglo,regsrc2.reglo,regdst.reglo);
            cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reghi,regsrc2.reghi,regdst.reghi);
          end;

        OP_ADD:
          begin
            { regsrc1.reglo is still needed after the low add }
            if (regsrc1.reglo=regdst.reglo) or (regsrc1.reghi=regdst.reghi) then
              Internalerror(2020082205);

            list.concat(taicpu.op_reg_reg_reg(A_ADD, regdst.reglo, regsrc2.reglo, regsrc1.reglo));
            list.concat(taicpu.op_reg_reg_reg(A_ADD, regdst.reghi, regsrc2.reghi, regsrc1.reghi));

            { the +1 on the high half is skipped when the OC_AE comparison
              of regsrc1.reglo and the low result holds }
            current_asmdata.getjumplabel(skip_fixup);
            cg.a_cmp_reg_reg_label(list,OS_INT,OC_AE, regsrc1.reglo, regdst.reglo, skip_fixup);
            list.concat(taicpu.op_reg_reg_const(A_ADDI, regdst.reghi, regdst.reghi, 1));
            cg.a_label(list,skip_fixup);
          end;

        OP_SUB:
          begin
            if (regsrc1.reglo=regdst.reglo) or (regsrc1.reghi=regdst.reghi) then
              Internalerror(2020082206);

            { we need the original src2 value for the comparison, do not overwrite it }
            if regsrc2.reglo=regdst.reglo then
              begin
                saved_lo:=cg.GetIntRegister(list,OS_S32);
                cg.a_load_reg_reg(list,OS_INT,OS_INT,regsrc2.reglo,saved_lo);
                regsrc2.reglo:=saved_lo;
              end;

            list.concat(taicpu.op_reg_reg_reg(A_SUB, regdst.reglo, regsrc2.reglo, regsrc1.reglo));
            list.concat(taicpu.op_reg_reg_reg(A_SUB, regdst.reghi, regsrc2.reghi, regsrc1.reghi));

            { the -1 on the high half is skipped when the OC_AE comparison
              of regsrc1.reglo and regsrc2.reglo holds }
            current_asmdata.getjumplabel(skip_fixup);
            cg.a_cmp_reg_reg_label(list,OS_INT,OC_AE, regsrc1.reglo, regsrc2.reglo, skip_fixup);
            list.concat(taicpu.op_reg_reg_const(A_ADDI, regdst.reghi, regdst.reghi, -1));
            cg.a_label(list,skip_fixup);
          end;

        else
          internalerror(2020030813);
      end;
    end;
  { 64 bit two operand operation.

    OP_NEG: regdst := -regsrc
    OP_NOT: regdst := not regsrc
    other : regdst := regdst op regsrc (forwarded to a_op64_reg_reg_reg)

    list   - assembler list receiving the instructions
    op     - operation to perform
    size   - operand size, passed through to a_op64_reg_reg_reg
    regsrc - source register pair
    regdst - destination register pair }
  procedure tcg64fxtensa.a_op64_reg_reg(list : TAsmList; op : TOpCG; size : tcgsize; regsrc,regdst : tregister64);
    var
      tmpreg : TRegister;
      instr : taicpu;
    begin
      case op of
        OP_NEG:
          begin
            { -x = (not x) + 1, i.e.
                lo' = -lo
                hi' = -hi      if lo' =  0 (the +1 carries into the high half)
                hi' = -hi - 1  if lo' <> 0
              So compute -hi, prepare -hi-1 in a temporary and select the
              temporary only when the negated low half is non-zero. }
            tmpreg:=cg.GetIntRegister(list, OS_INT);
            list.concat(taicpu.op_reg_reg(A_NEG,regdst.reglo,regsrc.reglo));
            list.concat(taicpu.op_reg_reg(A_NEG,regdst.reghi,regsrc.reghi));
            list.concat(taicpu.op_reg_reg_const(A_ADDI,tmpreg,regdst.reghi,-1));
            instr:=taicpu.op_reg_reg_reg(A_MOV,regdst.reghi,tmpreg,regdst.reglo);
            { must be NEZ: with EQZ the borrow was applied exactly in the one
              case (low half = 0) where it must not be }
            instr.condition:=C_NEZ;
            list.concat(instr);
          end;
        OP_NOT:
          begin
            { bitwise not works independently on both halves }
            cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
            cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
          end;
        else
          a_op64_reg_reg_reg(list,op,size,regsrc,regdst,regdst);
      end;
    end;
  { 64 bit operation with a constant: regdst := regsrc op value.

    list   - assembler list receiving the instructions
    op     - operation to perform
    size   - operand size, passed through to a_op64_reg_reg_reg
    value  - constant operand
    regsrc - source register pair
    regdst - destination register pair

    Supported operations:
      OP_AND/OP_OR/OP_XOR - done per 32 bit half
      OP_ADD              - short sequence for -2048..2047, otherwise the
                            constant is loaded into a register pair
      OP_SHL              - shift counts 1..16 and 32
      OP_SHR              - shift counts 1..15 and 32
      OP_SUB              - constant is loaded into a register pair

    Internal errors:
      2020030904 - OP_NEG / OP_NOT (not valid with a constant operand)
      2020082209 - unsupported OP_SHL count
      2020082210 - unsupported OP_SHR count
      2020030901 - any other operation }
  procedure tcg64fxtensa.a_op64_const_reg_reg(list : TAsmList; op : TOpCG; size : tcgsize; value : int64; regsrc,regdst : tregister64);
    var
      tmpreg64 : tregister64;
      no_carry : TAsmLabel;
      tmpreg: tregister;
    begin
      case op of
        OP_NEG,
        OP_NOT :
          internalerror(2020030904);
        else
          ;
      end;
      case op of
        OP_AND,OP_OR,OP_XOR:
          begin
            cg.a_op_const_reg_reg(list,op,OS_32,aint(lo(value)),regsrc.reglo,regdst.reglo);
            cg.a_op_const_reg_reg(list,op,OS_32,aint(hi(value)),regsrc.reghi,regdst.reghi);
          end;
        OP_ADD:
          begin
            { could do better here (hi(value) in 248..2047), for now we support only the simple cases }
            if (value>=-2048) and (value<=2047) then
              begin
                { we need the original src value for the comparison, do not overwrite it }
                if regsrc.reglo=regdst.reglo then
                  begin
                    tmpreg:=cg.GetIntRegister(list,OS_S32);
                    cg.a_load_reg_reg(list,OS_INT,OS_INT,regsrc.reglo,tmpreg);
                    regsrc.reglo:=tmpreg;
                  end;
                list.concat(taicpu.op_reg_reg_const(A_ADDI, regdst.reglo, regsrc.reglo, value));
                { The high half of the sign extended constant is 0 for
                  value>=0 and $FFFFFFFF (= -1) for value<0; it has to be
                  added to the high half of the source. Previously the high
                  half was only copied, which made e.g. 5 + (-1) come out as
                  $1_00000004. }
                if value<0 then
                  list.concat(taicpu.op_reg_reg_const(A_ADDI, regdst.reghi, regsrc.reghi, -1))
                else
                  list.concat(taicpu.op_reg_reg(A_MOV, regdst.reghi, regsrc.reghi));
                { carry out of the low half occurred iff the low result is
                  (unsigned) below the original low source }
                current_asmdata.getjumplabel(no_carry);
                cg.a_cmp_reg_reg_label(list,OS_INT,OC_AE, regsrc.reglo, regdst.reglo, no_carry);
                list.concat(taicpu.op_reg_reg_const(A_ADDI, regdst.reghi, regdst.reghi, 1));
                cg.a_label(list,no_carry);
              end
            else
              begin
                { general case: materialise the constant and use the register form }
                tmpreg64.reglo := cg.GetIntRegister(list,OS_S32);
                tmpreg64.reghi := cg.GetIntRegister(list,OS_S32);
                a_load64_const_reg(list,value,tmpreg64);
                a_op64_reg_reg_reg(list,op,size,tmpreg64,regsrc,regdst);
              end;
          end;
        OP_SHL:
          begin
            if (value>0) and (value<=16) then
              begin
                { tmpreg := the top "value" bits of the low half, which move
                  into the bottom of the high half }
                tmpreg:=cg.GetIntRegister(list,OS_32);
                list.concat(taicpu.op_reg_reg_const_const(A_EXTUI, tmpreg, regsrc.reglo, 32-value, value));
                list.concat(taicpu.op_reg_reg_const(A_SLLI, regdst.reglo, regsrc.reglo, value));
                list.concat(taicpu.op_reg_reg_const(A_SLLI, regdst.reghi, regsrc.reghi, value));
                list.concat(taicpu.op_reg_reg_reg(A_OR, regdst.reghi, tmpreg, regdst.reghi));
              end
            else if value=32 then
              begin
                { low half becomes the high half, low half is cleared }
                cg.a_load_reg_reg(list,OS_INT,OS_INT,regsrc.reglo,regdst.reghi);
                cg.a_load_const_reg(list,OS_INT,0,regdst.reglo);
              end
            else
              Internalerror(2020082209);
          end;
        OP_SHR:
          begin
            if (value>0) and (value<=15) then
              begin
                { tmpreg := the bottom "value" bits of the high half, moved
                  to the top of a word so they can be or-ed into the low half }
                tmpreg:=cg.GetIntRegister(list,OS_32);
                list.concat(taicpu.op_reg_reg_const(A_SLLI, tmpreg, regsrc.reghi, 32-value));
                list.concat(taicpu.op_reg_reg_const(A_SRLI, regdst.reglo, regsrc.reglo, value));
                list.concat(taicpu.op_reg_reg_reg(A_OR, regdst.reglo, tmpreg, regdst.reglo));
                list.concat(taicpu.op_reg_reg_const(A_SRLI, regdst.reghi, regsrc.reghi, value));
              end
            else if value=32 then
              begin
                { high half becomes the low half, high half is cleared }
                cg.a_load_reg_reg(list,OS_INT,OS_INT,regsrc.reghi,regdst.reglo);
                cg.a_load_const_reg(list,OS_INT,0,regdst.reghi);
              end
            else
              Internalerror(2020082210);
          end;
        OP_SUB:
          begin
            { for now, we take the simple approach }
            tmpreg64.reglo := cg.GetIntRegister(list,OS_S32);
            tmpreg64.reghi := cg.GetIntRegister(list,OS_S32);
            a_load64_const_reg(list,value,tmpreg64);
            a_op64_reg_reg_reg(list,op,size,tmpreg64,regsrc,regdst);
          end;
        else
          internalerror(2020030901);
      end;
    end;
  { 64 bit in-place operation with a constant: reg := reg op value.
    Forwards to a_op64_const_reg_reg with reg as both source and destination. }
  procedure tcg64fxtensa.a_op64_const_reg(list : TAsmList; op : TOpCG; size : tcgsize; value : int64; reg : tregister64);
    begin
      a_op64_const_reg_reg(list, op, size, value, reg, reg);
    end;
  1226. {$warnings off}
  { Instantiates the code generator objects of this unit and stores them in
    the global variables cg (tcgcpu) and cg64 (tcg64fxtensa). }
  procedure create_codegen;
    begin
      cg := tcgcpu.Create;
      cg64 := tcg64fxtensa.Create;
    end;
  1232. end.