cgcpu.pas 52 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389
  1. {
  2. Copyright (c) 2014 by Jonas Maebe
  3. This unit implements the code generator for Xtensa
  4. This program is free software; you can redistribute it and/or modify
  5. it under the terms of the GNU General Public License as published by
  6. the Free Software Foundation; either version 2 of the License, or
  7. (at your option) any later version.
  8. This program is distributed in the hope that it will be useful,
  9. but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  11. GNU General Public License for more details.
  12. You should have received a copy of the GNU General Public License
  13. along with this program; if not, write to the Free Software
  14. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  15. ****************************************************************************
  16. }
  17. unit cgcpu;
  18. {$i fpcdefs.inc}
  19. interface
  20. uses
  21. globtype,parabase,
  22. cgbase,cgutils,cgobj,
  23. aasmbase,aasmtai,aasmdata,aasmcpu,
  24. cpubase,cpuinfo,
  25. node,symconst,SymType,symdef,
  26. rgcpu,
  27. cg64f32;
  28. type
  29. tcgcpu=class(tcg)
  30. private
  31. procedure fixref(list : TAsmList; var ref : treference);
  32. procedure g_concatcopy_move(list : tasmlist; const Source,dest : treference; len : tcgint);
  33. public
  34. procedure init_register_allocators;override;
  35. procedure done_register_allocators;override;
  36. { move instructions }
  37. procedure a_load_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister);override;
  38. procedure a_load_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister;const ref: TReference);override;
  39. procedure a_load_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: TReference; reg: tregister);override;
  40. procedure a_load_const_reg(list: TAsmList; size: tcgsize; a: tcgint; reg: tregister);override;
  41. procedure a_loadaddr_ref_reg(list: TAsmList; const ref: TReference; r: tregister);override;
  42. procedure a_op_reg_reg(list: TAsmList; op: topcg; size: tcgsize; src, dst: tregister);override;
  43. procedure a_op_const_reg(list: TAsmList; op: topcg; size: tcgsize; a: tcgint; reg: tregister);override;
  44. procedure a_op_reg_reg_reg(list: TAsmList; op: topcg; size: tcgsize; src1, src2, dst: tregister);override;
  45. procedure a_op_const_reg_reg(list : TAsmList; op : TOpCg; size : tcgsize; a : tcgint; src,dst : tregister);override;
  46. procedure a_call_name(list:TAsmList;const s:string; weak: boolean);override;
  47. procedure a_call_reg(list:TAsmList;Reg:tregister);override;
  48. procedure a_jmp_name(list: TAsmList; const s: string);override;
  49. procedure a_jmp_flags(list: TAsmList; const f: TResFlags; l: tasmlabel);override;
  50. procedure g_proc_entry(list: TAsmList; localsize: longint; nostackframe: boolean);override;
  51. procedure g_proc_exit(list: TAsmList; parasize: longint; nostackframe: boolean);override;
  52. { comparison operations }
  53. procedure a_cmp_const_reg_label(list: TAsmList; size: tcgsize; cmp_op: topcmp; a: tcgint; reg: tregister; l: tasmlabel); override;
  54. procedure a_cmp_reg_reg_label(list: TAsmList; size: tcgsize; cmp_op: topcmp; reg1, reg2: tregister; l: tasmlabel);override;
  55. procedure a_jmp_always(list: TAsmList; l: TAsmLabel);override;
  56. procedure g_flags2reg(list: TAsmList; size: TCgSize; const f: tresflags; reg: TRegister);override;
  57. procedure g_concatcopy(list : TAsmList; const source,dest : treference; len : tcgint);override;
  58. procedure a_loadfpu_reg_reg(list: TAsmList; fromsize, tosize: tcgsize; reg1, reg2: tregister);override;
  59. procedure a_loadfpu_ref_reg(list: TAsmList; fromsize, tosize: tcgsize; const ref: treference; reg: tregister);override;
  60. procedure a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference);override;
  61. procedure maybeadjustresult(list: TAsmList; op: TOpCg; size: tcgsize; dst: tregister);
  62. procedure g_overflowcheck(list: TAsmList; const Loc:tlocation; def:tdef);override;
  63. function create_data_entry(symbol: TAsmSymbol; offset: asizeint): TAsmLabel;
  64. end;
  65. tcg64fxtensa = class(tcg64f32)
  66. procedure a_op64_reg_reg(list : TAsmList;op:TOpCG;size : tcgsize;regsrc,regdst : tregister64);override;
  67. procedure a_op64_const_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64);override;
  68. procedure a_op64_const_reg(list : TAsmList;op:TOpCG;size : tcgsize;value : int64;reg : tregister64);override;
  69. procedure a_op64_reg_reg_reg(list : TAsmList; op : TOpCG;size : tcgsize; regsrc1,regsrc2,regdst : tregister64);override;
  70. //procedure a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);override;
  71. //procedure a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);override;
  72. //procedure a_op64_const_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;value : int64;regsrc,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  73. //procedure a_op64_reg_reg_reg_checkoverflow(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64;setflags : boolean;var ovloc : tlocation);override;
  74. //procedure a_loadmm_intreg64_reg(list: TAsmList; mmsize: tcgsize; intreg: tregister64; mmreg: tregister);override;
  75. //procedure a_loadmm_reg_intreg64(list: TAsmList; mmsize: tcgsize; mmreg: tregister; intreg: tregister64);override;
  76. end;
  77. procedure create_codegen;
  78. const
  79. TOpCG2AsmOp: array[topcg] of TAsmOp = (
  80. A_NONE,A_MOV,A_ADD,A_AND,A_NONE,A_NONE,A_MULL,A_MULL,A_NEG,A_NONE,A_OR,A_SRA,A_SLL,A_SRL,A_SUB,A_XOR,A_NONE,A_NONE
  81. );
  82. {
  83. );TOpCG2AsmOpReg: array[topcg] of TAsmOp = (
  84. A_NONE,A_MOV,A_ADD,A_AND,A_UDIV,A_SDIV,A_MUL,A_MUL,A_NEG,A_MVN,A_ORR,A_ASRV,A_LSLV,A_LSRV,A_SUB,A_EOR,A_NONE,A_RORV
  85. );
  86. TOpCG2AsmOpImm: array[topcg] of TAsmOp = (
  87. A_NONE,A_MOV,A_ADD,A_AND,A_UDIV,A_SDIV,A_MUL,A_MUL,A_NEG,A_MVN,A_ORR,A_ASR,A_LSL,A_LSR,A_SUB,A_EOR,A_NONE,A_ROR
  88. );
  89. TOpCmp2AsmCond: array[topcmp] of TAsmCond = (C_NONE,C_EQ,C_GT,
  90. C_LT,C_GE,C_LE,C_NE,C_LS,C_CC,C_CS,C_HI
  91. );
  92. }
  93. implementation
  94. uses
  95. globals,verbose,systems,cutils,
  96. paramgr,fmodule,
  97. symtable,symsym,
  98. tgobj,
  99. procinfo,cpupi;
  100. const
  101. TOpCmp2AsmCond: array[TOpCmp] of TAsmCond = (
  102. C_None,
  103. C_EQ,
  104. C_None,
  105. C_LT,
  106. C_GE,
  107. C_None,
  108. C_NE,
  109. C_None,
  110. C_LTU,
  111. C_GEU,
  112. C_None
  113. );
  114. procedure tcgcpu.init_register_allocators;
  115. begin
  116. inherited init_register_allocators;
  117. if target_info.abi = abi_xtensa_call0 then
  118. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  119. [RS_A2,RS_A3,RS_A4,RS_A5,RS_A6,RS_A7,{RS_A8,}RS_A9,
  120. RS_A10,RS_A11,RS_A12,RS_A13,RS_A14{,RS_A15}],first_int_imreg,[])
  121. else
  122. rg[R_INTREGISTER]:=trgintcpu.create(R_INTREGISTER,R_SUBWHOLE,
  123. [RS_A2,RS_A3,RS_A4,RS_A5,RS_A6,RS_A7,RS_A8,RS_A9,
  124. RS_A10,RS_A11,RS_A12,RS_A13,RS_A14,RS_A15],first_int_imreg,[]);
  125. rg[R_FPUREGISTER]:=trgcpu.create(R_FPUREGISTER,R_SUBNONE,
  126. [RS_F0,RS_F1,RS_F2,RS_F3,RS_F4,RS_F5,RS_F6,RS_F7,RS_F8,RS_F9,
  127. RS_F10,RS_F11,RS_F12,RS_F13,RS_F14,RS_F15],first_fpu_imreg,[]);
  128. rg[R_SPECIALREGISTER]:=trgcpu.create(R_SPECIALREGISTER,R_SUBNONE,
  129. [RS_B0,RS_B1,RS_B2,RS_B3,RS_B4,RS_B5,RS_B6,RS_B7,RS_B8,RS_B9,
  130. RS_B10,RS_B11,RS_B12,RS_B13,RS_B14,RS_B15],first_flag_imreg,[]);
  131. end;
  132. procedure tcgcpu.done_register_allocators;
  133. begin
  134. rg[R_INTREGISTER].free;
  135. rg[R_FPUREGISTER].free;
  136. rg[R_SPECIALREGISTER].free;
  137. inherited done_register_allocators;
  138. end;
  139. procedure tcgcpu.a_load_reg_reg(list : TAsmList; fromsize,tosize : tcgsize;
  140. reg1,reg2 : tregister);
  141. var
  142. conv_done : Boolean;
  143. instr : taicpu;
  144. begin
  145. if (tcgsize2size[fromsize]>32) or (tcgsize2size[tosize]>32) or (fromsize=OS_NO) or (tosize=OS_NO) then
  146. internalerror(2020030710);
  147. conv_done:=false;
  148. if tosize<>fromsize then
  149. begin
  150. conv_done:=true;
  151. if tcgsize2size[tosize]<=tcgsize2size[fromsize] then
  152. fromsize:=tosize;
  153. case fromsize of
  154. OS_8:
  155. list.concat(taicpu.op_reg_reg_const_const(A_EXTUI,reg2,reg1,0,8));
  156. OS_S8:
  157. begin
  158. if CPUXTENSA_HAS_SEXT in cpu_capabilities[current_settings.cputype] then
  159. list.concat(taicpu.op_reg_reg_const(A_SEXT,reg2,reg1,7))
  160. else
  161. begin
  162. list.concat(taicpu.op_reg_reg_const(A_SLLI,reg2,reg1,24));
  163. list.concat(taicpu.op_reg_reg_const(A_SRAI,reg2,reg2,24));
  164. end;
  165. if tosize=OS_16 then
  166. list.concat(taicpu.op_reg_reg_const_const(A_EXTUI,reg2,reg2,0,16));
  167. end;
  168. OS_16:
  169. list.concat(taicpu.op_reg_reg_const_const(A_EXTUI,reg2,reg1,0,16));
  170. OS_S16:
  171. if CPUXTENSA_HAS_SEXT in cpu_capabilities[current_settings.cputype] then
  172. list.concat(taicpu.op_reg_reg_const(A_SEXT,reg2,reg1,15))
  173. else
  174. begin
  175. list.concat(taicpu.op_reg_reg_const(A_SLLI,reg2,reg1,16));
  176. list.concat(taicpu.op_reg_reg_const(A_SRAI,reg2,reg2,16));
  177. end;
  178. else
  179. conv_done:=false;
  180. end;
  181. end;
  182. if not conv_done and (reg1<>reg2) then
  183. begin
  184. { same size, only a register mov required }
  185. instr:=taicpu.op_reg_reg(A_MOV,reg2,reg1);
  186. list.Concat(instr);
  187. { Notify the register allocator that we have written a move instruction so
  188. it can try to eliminate it. }
  189. add_move_instruction(instr);
  190. end;
  191. end;
  192. procedure tcgcpu.a_load_reg_ref(list : TAsmList; fromsize,tosize : tcgsize;
  193. reg : tregister; const ref : TReference);
  194. var
  195. op: TAsmOp;
  196. href : treference;
  197. begin
  198. if (TCGSize2Size[FromSize] >= TCGSize2Size[ToSize]) then
  199. FromSize := ToSize;
  200. case tosize of
  201. { signed integer registers }
  202. OS_8,
  203. OS_S8:
  204. op:=A_S8I;
  205. OS_16,
  206. OS_S16:
  207. op:=A_S16I;
  208. OS_32,
  209. OS_S32:
  210. op:=A_S32I;
  211. else
  212. InternalError(2020030804);
  213. end;
  214. href:=ref;
  215. if assigned(href.symbol) or
  216. (href.index<>NR_NO) or
  217. ((op=A_S8I) and ((href.offset<0) or (href.offset>255))) or
  218. ((op=A_S16I) and ((href.offset<0) or (href.offset>510) or (href.offset mod 2<>0))) or
  219. ((op=A_S32I) and ((href.offset<0) or (href.offset>1020) or (href.offset mod 4<>0))) then
  220. fixref(list,href);
  221. list.concat(taicpu.op_reg_ref(op,reg,href));
  222. end;
  223. procedure tcgcpu.a_load_ref_reg(list : TAsmList; fromsize,tosize : tcgsize;
  224. const ref : TReference; reg : tregister);
  225. var
  226. href: treference;
  227. op: TAsmOp;
  228. tmpreg: TRegister;
  229. begin
  230. case fromsize of
  231. OS_8: op:=A_L8UI;
  232. OS_16: op:=A_L16UI;
  233. OS_S8: op:=A_L8UI;
  234. OS_S16: op:=A_L16SI;
  235. OS_64,OS_S64, { This only happens if tosize is smaller than fromsize }
  236. { We can therefore only consider the low 32-bit of the 64bit value }
  237. OS_32,
  238. OS_S32: op:=A_L32I;
  239. else
  240. internalerror(2020030801);
  241. end;
  242. href:=ref;
  243. if assigned(href.symbol) or
  244. (href.index<>NR_NO) or
  245. ((op=A_L8UI) and ((href.offset<0) or (href.offset>255))) or
  246. ((op in [A_L16SI,A_L16UI]) and ((href.offset<0) or (href.offset>510) or (href.offset mod 2<>0))) or
  247. ((op=A_L32I) and ((href.offset<0) or (href.offset>1020) or (href.offset mod 4<>0))) then
  248. fixref(list,href);
  249. list.concat(taicpu.op_reg_ref(op,reg,href));
  250. if (fromsize=OS_S8) and not(tosize in [OS_S8,OS_8]) then
  251. if CPUXTENSA_HAS_SEXT in cpu_capabilities[current_settings.cputype] then
  252. list.concat(taicpu.op_reg_reg_const(A_SEXT,reg,reg,7))
  253. else
  254. begin
  255. list.concat(taicpu.op_reg_reg_const(A_SLLI,reg,reg,24));
  256. list.concat(taicpu.op_reg_reg_const(A_SRAI,reg,reg,24));
  257. end;
  258. if (fromsize<>tosize) and (not (tosize in [OS_SINT,OS_INT])) then
  259. a_load_reg_reg(list,fromsize,tosize,reg,reg);
  260. end;
  261. procedure tcgcpu.a_load_const_reg(list : TAsmList; size : tcgsize;
  262. a : tcgint; reg : tregister);
  263. var
  264. hr : treference;
  265. l : TAsmLabel;
  266. begin
  267. if (a>=-2048) and (a<=2047) then
  268. list.Concat(taicpu.op_reg_const(A_MOVI,reg,a))
  269. else
  270. begin
  271. reference_reset(hr,4,[]);
  272. hr.symbol:=create_data_entry(nil,longint(a));
  273. list.concat(taicpu.op_reg_ref(A_L32R,reg,hr));
  274. end;
  275. end;
  276. procedure tcgcpu.fixref(list : TAsmList;var ref : treference);
  277. var
  278. tmpreg, tmpreg2 : tregister;
  279. tmpref : treference;
  280. l : tasmlabel;
  281. begin
  282. { create consts entry }
  283. if assigned(ref.symbol) or (ref.offset<-2048) or (ref.offset>2047) then
  284. begin
  285. reference_reset(tmpref,4,[]);
  286. tmpreg:=NR_NO;
  287. { load consts entry }
  288. tmpreg:=getintregister(list,OS_INT);
  289. tmpref.symbol:=create_data_entry(ref.symbol,ref.offset);
  290. list.concat(taicpu.op_reg_ref(A_L32R,tmpreg,tmpref));
  291. if ref.base<>NR_NO then
  292. begin
  293. if ref.index<>NR_NO then
  294. begin
  295. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  296. ref.base:=tmpreg;
  297. end
  298. else
  299. ref.index:=tmpreg;
  300. end
  301. else
  302. ref.base:=tmpreg;
  303. end
  304. else if ref.offset<>0 then
  305. begin
  306. tmpreg:=getintregister(list,OS_INT);
  307. if (ref.offset>=-128) and (ref.offset<=127) then
  308. begin
  309. list.concat(taicpu.op_reg_reg_const(A_ADDI,tmpreg,ref.base,ref.offset));
  310. ref.base:=tmpreg;
  311. end
  312. else
  313. begin
  314. list.concat(taicpu.op_reg_const(A_MOVI,tmpreg,ref.offset));
  315. if ref.base<>NR_NO then
  316. begin
  317. if ref.index<>NR_NO then
  318. begin
  319. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,tmpreg));
  320. ref.base:=tmpreg;
  321. end
  322. else
  323. ref.index:=tmpreg;
  324. end
  325. else
  326. ref.base:=tmpreg;
  327. end;
  328. end;
  329. if ref.index<>NR_NO then
  330. begin
  331. if ref.base<>NR_NO then
  332. begin
  333. tmpreg:=getintregister(list,OS_INT);
  334. list.concat(taicpu.op_reg_reg_reg(A_ADD,tmpreg,ref.base,ref.index));
  335. ref.base:=tmpreg;
  336. end
  337. else
  338. ref.base:=ref.index;
  339. ref.index:=NR_NO;
  340. end;
  341. ref.offset:=0;
  342. ref.symbol:=nil;
  343. end;
  344. procedure tcgcpu.a_loadaddr_ref_reg(list : TAsmList;
  345. const ref : TReference; r : tregister);
  346. var
  347. b : byte;
  348. tmpref : treference;
  349. instr : taicpu;
  350. begin
  351. tmpref:=ref;
  352. { Be sure to have a base register }
  353. if tmpref.base=NR_NO then
  354. begin
  355. tmpref.base:=tmpref.index;
  356. tmpref.index:=NR_NO;
  357. end;
  358. if assigned(tmpref.symbol) then
  359. fixref(list,tmpref);
  360. { expect a base here if there is an index }
  361. if (tmpref.base=NR_NO) and (tmpref.index<>NR_NO) then
  362. internalerror(200312022);
  363. if tmpref.index<>NR_NO then
  364. begin
  365. a_op_reg_reg_reg(list,OP_ADD,OS_ADDR,tmpref.base,tmpref.index,r);
  366. if tmpref.offset<>0 then
  367. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,r,r);
  368. end
  369. else
  370. begin
  371. if tmpref.base=NR_NO then
  372. a_load_const_reg(list,OS_ADDR,tmpref.offset,r)
  373. else
  374. if tmpref.offset<>0 then
  375. a_op_const_reg_reg(list,OP_ADD,OS_ADDR,tmpref.offset,tmpref.base,r)
  376. else
  377. begin
  378. instr:=taicpu.op_reg_reg(A_MOV,r,tmpref.base);
  379. list.concat(instr);
  380. add_move_instruction(instr);
  381. end;
  382. end;
  383. end;
  384. procedure tcgcpu.a_op_reg_reg(list : TAsmList; op : topcg; size : tcgsize; src,dst : tregister);
  385. var
  386. tmpreg : TRegister;
  387. begin
  388. if op = OP_NEG then
  389. begin
  390. list.concat(taicpu.op_reg_reg(A_NEG,dst,src));
  391. maybeadjustresult(list,OP_NEG,size,dst);
  392. end
  393. else if op = OP_NOT then
  394. begin
  395. tmpreg:=getintregister(list,size);
  396. list.concat(taicpu.op_reg_const(A_MOVI,tmpreg,-1));
  397. list.concat(taicpu.op_reg_reg_reg(A_XOR,dst,tmpreg,src));
  398. maybeadjustresult(list,OP_NOT,size,dst);
  399. end
  400. else
  401. a_op_reg_reg_reg(list,op,size,src,dst,dst);
  402. end;
  403. procedure tcgcpu.a_op_const_reg_reg(list: TAsmList; op: TOpCg; size: tcgsize; a: tcgint; src, dst: tregister);
  404. var
  405. l1 : longint;
  406. tmpreg : TRegister;
  407. begin
  408. optimize_op_const(size, op, a);
  409. case op of
  410. OP_NONE:
  411. begin
  412. if src <> dst then
  413. a_load_reg_reg(list, size, size, src, dst);
  414. exit;
  415. end;
  416. OP_MOVE:
  417. begin
  418. a_load_const_reg(list, size, a, dst);
  419. exit;
  420. end;
  421. else
  422. ;
  423. end;
  424. { there could be added some more sophisticated optimizations }
  425. if (op in [OP_IMUL,OP_IDIV]) and (a=-1) then
  426. a_op_reg_reg(list,OP_NEG,size,src,dst)
  427. { we do this here instead in the peephole optimizer because
  428. it saves us a register }
  429. else if (op in [OP_MUL,OP_IMUL]) and ispowerof2(a,l1) then
  430. a_op_const_reg_reg(list,OP_SHL,size,l1,src,dst)
  431. else if (op=OP_ADD) and (a>=-128) and (a<=127) then
  432. list.concat(taicpu.op_reg_reg_const(A_ADDI,dst,src,a))
  433. else if (op=OP_ADD) and (a>=-128-32768) and (a<=127+32512) then
  434. begin
  435. {$ifdef EXTDEBUG}
  436. list.concat(tai_comment.Create(strpnew('Value: '+tostr(a))));
  437. {$endif EXTDEBUG}
  438. list.concat(taicpu.op_reg_reg_const(A_ADDMI,dst,src,Smallint((a+128) and $ff00)));
  439. list.concat(taicpu.op_reg_reg_const(A_ADDI,dst,dst,Shortint(a and $ff)));
  440. end
  441. else if (op=OP_SUB) and (a>=-127) and (a<=128) then
  442. list.concat(taicpu.op_reg_reg_const(A_ADDI,dst,src,-a))
  443. else if (op=OP_SUB) and (a>=-127-32512) and (a<=128+32768) then
  444. begin
  445. {$ifdef EXTDEBUG}
  446. list.concat(tai_comment.Create(strpnew('Value: '+tostr(a))));
  447. {$endif EXTDEBUG}
  448. a:=-a;
  449. list.concat(taicpu.op_reg_reg_const(A_ADDMI,dst,src,Smallint((a+128) and $ff00)));
  450. list.concat(taicpu.op_reg_reg_const(A_ADDI,dst,dst,Shortint(a and $ff)));
  451. end
  452. else if (op=OP_SHL) and (a>=1) and (a<=31) then
  453. list.concat(taicpu.op_reg_reg_const(A_SLLI,dst,src,a))
  454. else if (op=OP_SAR) and (a>=0) and (a<=31) then
  455. list.concat(taicpu.op_reg_reg_const(A_SRAI,dst,src,a))
  456. else if (op=OP_SHR) and (a>=0) and (a<=15) then
  457. list.concat(taicpu.op_reg_reg_const(A_SRLI,dst,src,a))
  458. else if (op=OP_SHR) and (a>15) and (a<=31) then
  459. list.concat(taicpu.op_reg_reg_const_const(A_EXTUI,dst,src,a,32-a))
  460. else if (op=OP_AND) and (63-BsrQWord(a)+PopCnt(QWord(a))=64) and (PopCnt(QWord(a))<=16) then
  461. list.concat(taicpu.op_reg_reg_const_const(A_EXTUI,dst,src,0,PopCnt(QWord(a))))
  462. else
  463. begin
  464. tmpreg:=getintregister(list,size);
  465. a_load_const_reg(list,size,a,tmpreg);
  466. a_op_reg_reg_reg(list,op,size,tmpreg,src,dst);
  467. end;
  468. maybeadjustresult(list,op,size,dst);
  469. end;
  470. procedure tcgcpu.a_op_const_reg(list : TAsmList; op : topcg; size : tcgsize; a : tcgint; reg : tregister);
  471. begin
  472. a_op_const_reg_reg(list,op,size,a,reg,reg);
  473. end;
  474. procedure tcgcpu.a_op_reg_reg_reg(list : TAsmList; op : topcg;
  475. size : tcgsize; src1,src2,dst : tregister);
  476. var
  477. tmpreg : TRegister;
  478. begin
  479. if op=OP_NOT then
  480. begin
  481. tmpreg:=getintregister(list,size);
  482. list.concat(taicpu.op_reg_const(A_MOVI,tmpreg,-1));
  483. maybeadjustresult(list,op,size,dst);
  484. end
  485. else if op=OP_NEG then
  486. begin
  487. list.concat(taicpu.op_reg_reg(A_NEG,dst,src1));
  488. maybeadjustresult(list,op,size,dst);
  489. end
  490. else if op in [OP_SAR,OP_SHL,OP_SHR] then
  491. begin
  492. if op=OP_SHL then
  493. list.concat(taicpu.op_reg(A_SSL,src1))
  494. else
  495. list.concat(taicpu.op_reg(A_SSR,src1));
  496. list.concat(taicpu.op_reg_reg(TOpCG2AsmOp[op],dst,src2));
  497. maybeadjustresult(list,op,size,dst);
  498. end
  499. else
  500. case op of
  501. OP_MOVE:
  502. a_load_reg_reg(list,size,size,src1,dst);
  503. else
  504. begin
  505. list.concat(taicpu.op_reg_reg_reg(TOpCG2AsmOp[op],dst,src2,src1));
  506. maybeadjustresult(list,op,size,dst);
  507. end;
  508. end;
  509. end;
  510. procedure tcgcpu.a_call_name(list : TAsmList; const s : string;
  511. weak : boolean);
  512. begin
  513. if not weak then
  514. list.concat(taicpu.op_sym(txtensaprocinfo(current_procinfo).callins,current_asmdata.RefAsmSymbol(s,AT_FUNCTION)))
  515. else
  516. list.concat(taicpu.op_sym(txtensaprocinfo(current_procinfo).callins,current_asmdata.WeakRefAsmSymbol(s,AT_FUNCTION)));
  517. end;
  518. procedure tcgcpu.a_call_reg(list : TAsmList; Reg : tregister);
  519. begin
  520. list.concat(taicpu.op_reg(txtensaprocinfo(current_procinfo).callxins,reg));
  521. end;
  522. procedure tcgcpu.a_jmp_name(list : TAsmList; const s : string);
  523. var
  524. ai : taicpu;
  525. tmpreg: TRegister;
  526. begin
  527. { for now, we use A15 here, however, this is not save as it might contain an argument }
  528. ai:=TAiCpu.op_sym_reg(A_J,current_asmdata.RefAsmSymbol(s,AT_FUNCTION),NR_A15);
  529. ai.oppostfix := PF_L; // if destination is too far for J then assembler can convert to JX
  530. ai.is_jmp:=true;
  531. list.Concat(ai);
  532. end;
  533. procedure tcgcpu.a_jmp_flags(list: TAsmList; const f: TResFlags; l: tasmlabel);
  534. var
  535. instr: taicpu;
  536. begin
  537. if CPUXTENSA_HAS_BOOLEAN_OPTION in cpu_capabilities[current_settings.cputype] then
  538. begin
  539. instr:=taicpu.op_reg_sym(A_B,f.register,l);
  540. instr.condition:=flags_to_cond(f.flag);
  541. list.concat(instr);
  542. end
  543. else
  544. Internalerror(2020070401);
  545. end;
  546. procedure tcgcpu.g_proc_entry(list : TAsmList; localsize : longint;
  547. nostackframe : boolean);
  548. var
  549. ref : treference;
  550. r : byte;
  551. regs : tcpuregisterset;
  552. stackmisalignment : pint;
  553. regoffset : LongInt;
  554. stack_parameters : Boolean;
  555. registerarea : PtrInt;
  556. l : TAsmLabel;
  557. begin
  558. LocalSize:=align(LocalSize,4);
  559. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  560. { call instruction does not put anything on the stack }
  561. registerarea:=0;
  562. if not(nostackframe) then
  563. begin
  564. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  565. a_reg_alloc(list,NR_STACK_POINTER_REG);
  566. case target_info.abi of
  567. abi_xtensa_call0:
  568. begin
  569. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  570. Include(regs,RS_A15);
  571. if pi_do_call in current_procinfo.flags then
  572. Include(regs,RS_A0);
  573. if regs<>[] then
  574. begin
  575. for r:=RS_A0 to RS_A15 do
  576. if r in regs then
  577. inc(registerarea,4);
  578. end;
  579. inc(localsize,registerarea);
  580. if LocalSize<>0 then
  581. begin
  582. localsize:=align(localsize,current_settings.alignment.localalignmax);
  583. a_reg_alloc(list,NR_STACK_POINTER_REG);
  584. list.concat(taicpu.op_reg_reg_const(A_ADDI,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,-localsize));
  585. end;
  586. reference_reset(ref,4,[]);
  587. ref.base:=NR_STACK_POINTER_REG;
  588. ref.offset:=localsize;
  589. if ref.offset>1024 then
  590. begin
  591. if ref.offset<=1024+32512 then
  592. begin
  593. list.concat(taicpu.op_reg_reg_const(A_ADDMI,NR_A8,NR_STACK_POINTER_REG,ref.offset and $fffffc00));
  594. ref.offset:=ref.offset and $3ff;
  595. ref.base:=NR_A8;
  596. end
  597. else
  598. { fix me! }
  599. Internalerror(2020031101);
  600. end;
  601. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  602. begin
  603. dec(ref.offset,4);
  604. list.concat(taicpu.op_reg_ref(A_S32I,NR_A15,ref));
  605. a_reg_alloc(list,NR_FRAME_POINTER_REG);
  606. list.concat(taicpu.op_reg_reg(A_MOV,NR_A15,NR_STACK_POINTER_REG));
  607. end;
  608. if regs<>[] then
  609. begin
  610. for r:=RS_A14 downto RS_A0 do
  611. if r in regs then
  612. begin
  613. dec(ref.offset,4);
  614. list.concat(taicpu.op_reg_ref(A_S32I,newreg(R_INTREGISTER,r,R_SUBWHOLE),ref));
  615. end;
  616. end;
  617. end;
  618. abi_xtensa_windowed:
  619. begin
  620. if stack_parameters and (pi_estimatestacksize in current_procinfo.flags) then
  621. begin
  622. if localsize>txtensaprocinfo(current_procinfo).stackframesize then
  623. internalerror(2020031402)
  624. else
  625. localsize:=txtensaprocinfo(current_procinfo).stackframesize-registerarea;
  626. end
  627. else
  628. begin
  629. { default spill area }
  630. inc(localsize,4*4);
  631. { additional spill area? }
  632. if pi_do_call in current_procinfo.flags then
  633. inc(localsize,txtensaprocinfo(current_procinfo).maxcall*4);
  634. localsize:=align(localsize,current_settings.alignment.localalignmax);
  635. end;
  636. if localsize>32760 then
  637. begin
  638. list.concat(taicpu.op_reg_const(A_ENTRY,NR_STACK_POINTER_REG,32));
  639. reference_reset(ref,4,[]);
  640. ref.symbol:=create_data_entry(nil,longint(localsize-32));
  641. list.concat(taicpu.op_reg_ref(A_L32R,NR_A8,ref));
  642. list.concat(taicpu.op_reg_reg_reg(A_SUB,NR_A8,NR_STACK_POINTER_REG,NR_A8));
  643. list.concat(taicpu.op_reg_reg(A_MOVSP,NR_STACK_POINTER_REG,NR_A8));
  644. end
  645. else
  646. list.concat(taicpu.op_reg_const(A_ENTRY,NR_STACK_POINTER_REG,localsize));
  647. end;
  648. else
  649. Internalerror(2020031401);
  650. end;
  651. end;
  652. end;
  653. procedure tcgcpu.g_proc_exit(list : TAsmList; parasize : longint;
  654. nostackframe : boolean);
  655. var
  656. ref : treference;
  657. r : byte;
  658. regs : tcpuregisterset;
  659. stackmisalignment : pint;
  660. regoffset : LongInt;
  661. stack_parameters : Boolean;
  662. registerarea : PtrInt;
  663. l : TAsmLabel;
  664. LocalSize: longint;
  665. begin
  666. case target_info.abi of
  667. abi_xtensa_windowed:
  668. list.Concat(taicpu.op_none(A_RETW));
  669. abi_xtensa_call0:
  670. begin
  671. if not(nostackframe) then
  672. begin
  673. LocalSize:=current_procinfo.calc_stackframe_size;
  674. LocalSize:=align(LocalSize,4);
  675. stack_parameters:=current_procinfo.procdef.stack_tainting_parameter(calleeside);
  676. registerarea:=0;
  677. regs:=rg[R_INTREGISTER].used_in_proc-paramanager.get_volatile_registers_int(pocall_stdcall);
  678. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  679. Include(regs,RS_A15);
  680. if pi_do_call in current_procinfo.flags then
  681. Include(regs,RS_A0);
  682. if regs<>[] then
  683. begin
  684. for r:=RS_A0 to RS_A15 do
  685. if r in regs then
  686. inc(registerarea,4);
  687. end;
  688. inc(localsize,registerarea);
  689. if LocalSize<>0 then
  690. begin
  691. localsize:=align(localsize,current_settings.alignment.localalignmax);
  692. // Determine reference mode required to access stack
  693. reference_reset(ref,4,[]);
  694. ref.base:=NR_STACK_POINTER_REG;
  695. ref.offset:=localsize;
  696. if ref.offset>1024 then
  697. begin
  698. if ref.offset<=1024+32512 then
  699. begin
  700. // allocation done in proc_entry
  701. //list.concat(taicpu.op_reg_reg_const(A_ADDMI,NR_A8,NR_STACK_POINTER_REG,ref.offset and $fffffc00));
  702. ref.offset:=ref.offset and $3ff;
  703. ref.base:=NR_A8;
  704. end
  705. else
  706. { fix me! }
  707. Internalerror(2020031102);
  708. end;
  709. // restore a15 if used
  710. if current_procinfo.framepointer<>NR_STACK_POINTER_REG then
  711. begin
  712. dec(ref.offset,4);
  713. list.concat(taicpu.op_reg_ref(A_L32I,NR_A15,ref));
  714. a_reg_dealloc(list,NR_FRAME_POINTER_REG);
  715. end;
  716. // restore rest of registers
  717. if regs<>[] then
  718. begin
  719. for r:=RS_A14 downto RS_A0 do
  720. if r in regs then
  721. begin
  722. dec(ref.offset,4);
  723. list.concat(taicpu.op_reg_ref(A_L32I,newreg(R_INTREGISTER,r,R_SUBWHOLE),ref));
  724. end;
  725. end;
  726. // restore stack pointer
  727. list.concat(taicpu.op_reg_reg_const(A_ADDI,NR_STACK_POINTER_REG,NR_STACK_POINTER_REG,localsize));
  728. a_reg_dealloc(list,NR_STACK_POINTER_REG);
  729. end;
  730. end;
  731. list.Concat(taicpu.op_none(A_RET));
  732. end
  733. else
  734. Internalerror(2020031403);
  735. end;
  736. end;
  737. procedure tcgcpu.a_cmp_const_reg_label(list: TAsmList; size: tcgsize; cmp_op: topcmp; a: tcgint; reg: tregister; l: tasmlabel);
  738. function is_b4const(v: tcgint): boolean;
  739. begin
  740. case v of
  741. -1,1,2,3,4,5,6,7,8,
  742. 10,12,16,32,64,128,256:
  743. result:=true;
  744. else
  745. result:=false;
  746. end;
  747. end;
  748. function is_b4constu(v: tcgint): boolean;
  749. begin
  750. case v of
  751. 32768,65536,
  752. 2,3,4,5,6,7,8,
  753. 10,12,16,32,64,128,256:
  754. result:=true;
  755. else
  756. result:=false;
  757. end;
  758. end;
  759. var
  760. op: TAsmCond;
  761. instr: taicpu;
  762. begin
  763. if (a=0) and (cmp_op in [OC_EQ,OC_NE,OC_LT,OC_GTE]) then
  764. begin
  765. case cmp_op of
  766. OC_EQ: op:=C_EQZ;
  767. OC_NE: op:=C_NEZ;
  768. OC_LT: op:=C_LTZ;
  769. OC_GTE: op:=C_GEZ;
  770. else
  771. Internalerror(2020030801);
  772. end;
  773. instr:=taicpu.op_reg_sym(A_B,reg,l);
  774. instr.condition:=op;
  775. list.concat(instr);
  776. end
  777. else if is_b4const(a) and
  778. (cmp_op in [OC_EQ,OC_NE,OC_LT,OC_GTE]) then
  779. begin
  780. case cmp_op of
  781. OC_EQ: op:=C_EQI;
  782. OC_NE: op:=C_NEI;
  783. OC_LT: op:=C_LTI;
  784. OC_GTE: op:=C_GEI;
  785. else
  786. Internalerror(2020030801);
  787. end;
  788. instr:=taicpu.op_reg_const_sym(A_B,reg,a,l);
  789. instr.condition:=op;
  790. list.concat(instr);
  791. end
  792. else if is_b4constu(a) and
  793. (cmp_op in [OC_B,OC_AE]) then
  794. begin
  795. case cmp_op of
  796. OC_B: op:=C_LTUI;
  797. OC_AE: op:=C_GEUI;
  798. else
  799. Internalerror(2020030801);
  800. end;
  801. instr:=taicpu.op_reg_const_sym(A_B,reg,a,l);
  802. instr.condition:=op;
  803. list.concat(instr);
  804. end
  805. else
  806. inherited a_cmp_const_reg_label(list, size, cmp_op, a, reg, l);
  807. end;
  808. procedure tcgcpu.a_cmp_reg_reg_label(list : TAsmList; size : tcgsize;
  809. cmp_op : topcmp; reg1,reg2 : tregister; l : tasmlabel);
  810. var
  811. tmpreg: TRegister;
  812. instr: taicpu;
  813. begin
  814. if TOpCmp2AsmCond[cmp_op]=C_None then
  815. begin
  816. cmp_op:=swap_opcmp(cmp_op);
  817. tmpreg:=reg1;
  818. reg1:=reg2;
  819. reg2:=tmpreg;
  820. end;
  821. instr:=taicpu.op_reg_reg_sym(A_B,reg2,reg1,l);
  822. instr.condition:=TOpCmp2AsmCond[cmp_op];
  823. list.concat(instr);
  824. end;
  825. procedure tcgcpu.a_jmp_always(list : TAsmList; l : TAsmLabel);
  826. var
  827. ai : taicpu;
  828. begin
  829. if l.bind in [AB_GLOBAL] then
  830. begin
  831. { for now, we use A15 here, however, this is not save as it might contain an argument, I have not figured out a
  832. solution yet }
  833. ai:=taicpu.op_sym_reg(A_J,l,NR_A15);
  834. ai.oppostfix := PF_L;
  835. end
  836. else
  837. ai:=taicpu.op_sym(A_J,l);
  838. ai.is_jmp:=true;
  839. list.concat(ai);
  840. end;
  841. procedure tcgcpu.g_flags2reg(list: TAsmList; size: TCgSize; const f: tresflags; reg: TRegister);
  842. var
  843. hregister: TRegister;
  844. instr: taicpu;
  845. begin
  846. a_load_const_reg(list,size,0,reg);
  847. hregister:=getintregister(list,size);
  848. a_load_const_reg(list,size,1,hregister);
  849. instr:=taicpu.op_reg_reg_reg(A_MOV,reg,hregister,f.register);
  850. instr.condition:=flags_to_cond(f.flag);
  851. list.concat(instr);
  852. end;
  853. procedure tcgcpu.g_concatcopy_move(list: tasmlist; const Source, dest: treference; len: tcgint);
  854. var
  855. paraloc1, paraloc2, paraloc3: TCGPara;
  856. pd: tprocdef;
  857. begin
  858. pd:=search_system_proc('MOVE');
  859. paraloc1.init;
  860. paraloc2.init;
  861. paraloc3.init;
  862. paramanager.getcgtempparaloc(list, pd, 1, paraloc1);
  863. paramanager.getcgtempparaloc(list, pd, 2, paraloc2);
  864. paramanager.getcgtempparaloc(list, pd, 3, paraloc3);
  865. a_load_const_cgpara(list, OS_SINT, len, paraloc3);
  866. a_loadaddr_ref_cgpara(list, dest, paraloc2);
  867. a_loadaddr_ref_cgpara(list, Source, paraloc1);
  868. paramanager.freecgpara(list, paraloc3);
  869. paramanager.freecgpara(list, paraloc2);
  870. paramanager.freecgpara(list, paraloc1);
  871. alloccpuregisters(list, R_INTREGISTER, paramanager.get_volatile_registers_int(pocall_default));
  872. alloccpuregisters(list, R_FPUREGISTER, paramanager.get_volatile_registers_fpu(pocall_default));
  873. a_call_name(list, 'FPC_MOVE', false);
  874. dealloccpuregisters(list, R_FPUREGISTER, paramanager.get_volatile_registers_fpu(pocall_default));
  875. dealloccpuregisters(list, R_INTREGISTER, paramanager.get_volatile_registers_int(pocall_default));
  876. paraloc3.done;
  877. paraloc2.done;
  878. paraloc1.done;
  879. end;
  880. procedure tcgcpu.g_concatcopy(list : TAsmList;const source,dest : treference;len : tcgint);
  881. var
  882. tmpreg1, hreg, countreg: TRegister;
  883. src, dst, src2, dst2: TReference;
  884. lab: tasmlabel;
  885. Count, count2: aint;
  886. function reference_is_reusable(const ref: treference): boolean;
  887. begin
  888. result:=(ref.base<>NR_NO) and (ref.index=NR_NO) and
  889. (ref.symbol=nil);
  890. end;
  891. begin
  892. src2:=source;
  893. fixref(list,src2);
  894. dst2:=dest;
  895. fixref(list,dst2);
  896. if len > high(longint) then
  897. internalerror(2002072704);
  898. { A call (to FPC_MOVE) requires the outgoing parameter area to be properly
  899. allocated on stack. This can only be done before tmipsprocinfo.set_first_temp_offset,
  900. i.e. before secondpass. Other internal procedures request correct stack frame
  901. by setting pi_do_call during firstpass, but for this particular one it is impossible.
  902. Therefore, if the current procedure is a leaf one, we have to leave it that way. }
  903. { anybody wants to determine a good value here :)? }
  904. if (len > 100) and
  905. assigned(current_procinfo) and
  906. (pi_do_call in current_procinfo.flags) then
  907. g_concatcopy_move(list, src2, dst2, len)
  908. else
  909. begin
  910. Count := len div 4;
  911. if (count<=4) and reference_is_reusable(src2) then
  912. src:=src2
  913. else
  914. begin
  915. reference_reset(src,sizeof(aint),[]);
  916. { load the address of src2 into src.base }
  917. src.base := GetAddressRegister(list);
  918. a_loadaddr_ref_reg(list, src2, src.base);
  919. end;
  920. if (count<=4) and reference_is_reusable(dst2) then
  921. dst:=dst2
  922. else
  923. begin
  924. reference_reset(dst,sizeof(aint),[]);
  925. { load the address of dst2 into dst.base }
  926. dst.base := GetAddressRegister(list);
  927. a_loadaddr_ref_reg(list, dst2, dst.base);
  928. end;
  929. { generate a loop }
  930. if Count > 4 then
  931. begin
  932. countreg := GetIntRegister(list, OS_INT);
  933. tmpreg1 := GetIntRegister(list, OS_INT);
  934. a_load_const_reg(list, OS_INT, Count, countreg);
  935. current_asmdata.getjumplabel(lab);
  936. a_label(list, lab);
  937. list.concat(taicpu.op_reg_ref(A_L32I, tmpreg1, src));
  938. list.concat(taicpu.op_reg_ref(A_S32I, tmpreg1, dst));
  939. list.concat(taicpu.op_reg_reg_const(A_ADDI, src.base, src.base, 4));
  940. list.concat(taicpu.op_reg_reg_const(A_ADDI, dst.base, dst.base, 4));
  941. list.concat(taicpu.op_reg_reg_const(A_ADDI, countreg, countreg, -1));
  942. a_cmp_const_reg_label(list,OS_INT,OC_GT,0,countreg,lab);
  943. { keep the registers alive }
  944. list.concat(taicpu.op_reg_reg(A_MOV,countreg,countreg));
  945. list.concat(taicpu.op_reg_reg(A_MOV,src.base,src.base));
  946. list.concat(taicpu.op_reg_reg(A_MOV,dst.base,dst.base));
  947. len := len mod 4;
  948. end;
  949. { unrolled loop }
  950. Count := len div 4;
  951. if Count > 0 then
  952. begin
  953. tmpreg1 := GetIntRegister(list, OS_INT);
  954. for count2 := 1 to Count do
  955. begin
  956. list.concat(taicpu.op_reg_ref(A_L32I, tmpreg1, src));
  957. list.concat(taicpu.op_reg_ref(A_S32I, tmpreg1, dst));
  958. Inc(src.offset, 4);
  959. Inc(dst.offset, 4);
  960. end;
  961. len := len mod 4;
  962. end;
  963. if (len and 4) <> 0 then
  964. begin
  965. hreg := GetIntRegister(list, OS_INT);
  966. a_load_ref_reg(list, OS_32, OS_32, src, hreg);
  967. a_load_reg_ref(list, OS_32, OS_32, hreg, dst);
  968. Inc(src.offset, 4);
  969. Inc(dst.offset, 4);
  970. end;
  971. { copy the leftovers }
  972. if (len and 2) <> 0 then
  973. begin
  974. hreg := GetIntRegister(list, OS_INT);
  975. a_load_ref_reg(list, OS_16, OS_16, src, hreg);
  976. a_load_reg_ref(list, OS_16, OS_16, hreg, dst);
  977. Inc(src.offset, 2);
  978. Inc(dst.offset, 2);
  979. end;
  980. if (len and 1) <> 0 then
  981. begin
  982. hreg := GetIntRegister(list, OS_INT);
  983. a_load_ref_reg(list, OS_8, OS_8, src, hreg);
  984. a_load_reg_ref(list, OS_8, OS_8, hreg, dst);
  985. end;
  986. end;
  987. end;
  988. procedure tcgcpu.a_loadfpu_reg_reg(list: TAsmList; fromsize,tosize: tcgsize; reg1, reg2: tregister);
  989. var
  990. ai: taicpu;
  991. begin
  992. if not(fromsize in [OS_32,OS_F32]) then
  993. InternalError(2020032603);
  994. ai := taicpu.op_reg_reg(A_MOV,reg2,reg1);
  995. ai.oppostfix := PF_S;
  996. list.concat(ai);
  997. end;
  998. procedure tcgcpu.a_loadfpu_ref_reg(list: TAsmList; fromsize,tosize: tcgsize; const ref: treference; reg: tregister);
  999. var
  1000. href: treference;
  1001. begin
  1002. if not(fromsize in [OS_32,OS_F32]) then
  1003. InternalError(2020032602);
  1004. href:=ref;
  1005. if assigned(href.symbol) or
  1006. (href.index<>NR_NO) or
  1007. (((href.offset<0) or (href.offset>1020) or (href.offset mod 4<>0))) then
  1008. fixref(list,href);
  1009. list.concat(taicpu.op_reg_ref(A_LSI,reg,href));
  1010. if fromsize<>tosize then
  1011. a_loadfpu_reg_reg(list,fromsize,tosize,reg,reg);
  1012. end;
  1013. procedure tcgcpu.a_loadfpu_reg_ref(list: TAsmList; fromsize, tosize: tcgsize; reg: tregister; const ref: treference);
  1014. var
  1015. href: treference;
  1016. begin
  1017. if not(fromsize in [OS_32,OS_F32]) then
  1018. InternalError(2020032604);
  1019. href:=ref;
  1020. if assigned(href.symbol) or
  1021. (href.index<>NR_NO) or
  1022. (((href.offset<0) or (href.offset>1020) or (href.offset mod 4<>0))) then
  1023. fixref(list,href);
  1024. list.concat(taicpu.op_reg_ref(A_SSI,reg,href));
  1025. end;
  1026. procedure tcgcpu.maybeadjustresult(list : TAsmList; op : TOpCg; size : tcgsize; dst : tregister);
  1027. const
  1028. overflowops = [OP_MUL,OP_SHL,OP_ADD,OP_SUB,OP_NEG];
  1029. begin
  1030. if (op in overflowops) and
  1031. (size in [OS_8,OS_S8,OS_16,OS_S16]) then
  1032. a_load_reg_reg(list,OS_32,size,dst,dst);
  1033. end;
  1034. procedure tcgcpu.g_overflowcheck(list: TAsmList; const Loc: tlocation; def: tdef);
  1035. begin
  1036. { no overflow checking yet }
  1037. end;
  1038. function tcgcpu.create_data_entry(symbol: TAsmSymbol;offset: asizeint): TAsmLabel;
  1039. var
  1040. hp: tai;
  1041. begin
  1042. hp:=tai(current_procinfo.aktlocaldata.first);
  1043. while assigned(hp) do
  1044. begin
  1045. if (hp.typ=ait_label) and assigned(hp.Next) and
  1046. (tai(hp.Next).typ=ait_const) and
  1047. (tai_const(hp.Next).consttype=aitconst_ptr) and
  1048. (tai_const(hp.Next).sym=symbol) and
  1049. (tai_const(hp.Next).endsym=nil) and
  1050. ((assigned(symbol) and (tai_const(hp.Next).symofs=offset)) or
  1051. (not(assigned(symbol)) and (tai_const(hp.Next).value=offset))
  1052. ) then
  1053. begin
  1054. Result:=tai_label(hp).labsym;
  1055. exit;
  1056. end;
  1057. hp:=tai(hp.Next);
  1058. end;
  1059. current_asmdata.getjumplabel(Result);
  1060. cg.a_label(current_procinfo.aktlocaldata,Result);
  1061. if assigned(symbol) then
  1062. current_procinfo.aktlocaldata.concat(tai_const.create_sym_offset(symbol,offset))
  1063. else
  1064. current_procinfo.aktlocaldata.concat(tai_const.Create_32bit(offset));
  1065. end;
  1066. procedure tcg64fxtensa.a_op64_reg_reg_reg(list: TAsmList;op:TOpCG;size : tcgsize;regsrc1,regsrc2,regdst : tregister64);
  1067. var
  1068. instr: taicpu;
  1069. no_carry: TAsmLabel;
  1070. tmpreg: TRegister;
  1071. begin
  1072. case op of
  1073. OP_NEG,
  1074. OP_NOT :
  1075. internalerror(2020030810);
  1076. else
  1077. ;
  1078. end;
  1079. case op of
  1080. OP_AND,OP_OR,OP_XOR:
  1081. begin
  1082. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reglo,regsrc2.reglo,regdst.reglo);
  1083. cg.a_op_reg_reg_reg(list,op,OS_32,regsrc1.reghi,regsrc2.reghi,regdst.reghi);
  1084. end;
  1085. OP_ADD:
  1086. begin
  1087. if (regsrc1.reglo=regdst.reglo) or (regsrc1.reghi=regdst.reghi) then
  1088. Internalerror(2020082205);
  1089. list.concat(taicpu.op_reg_reg_reg(A_ADD, regdst.reglo, regsrc2.reglo, regsrc1.reglo));
  1090. list.concat(taicpu.op_reg_reg_reg(A_ADD, regdst.reghi, regsrc2.reghi, regsrc1.reghi));
  1091. current_asmdata.getjumplabel(no_carry);
  1092. cg.a_cmp_reg_reg_label(list,OS_INT,OC_AE, regsrc1.reglo, regdst.reglo, no_carry);
  1093. list.concat(taicpu.op_reg_reg_const(A_ADDI, regdst.reghi, regdst.reghi, 1));
  1094. cg.a_label(list,no_carry);
  1095. end;
  1096. OP_SUB:
  1097. begin
  1098. if (regsrc1.reglo=regdst.reglo) or (regsrc1.reghi=regdst.reghi) then
  1099. Internalerror(2020082206);
  1100. { we need the original src2 value for the comparison, do not overwrite it }
  1101. if regsrc2.reglo=regdst.reglo then
  1102. begin
  1103. tmpreg:=cg.GetIntRegister(list,OS_S32);
  1104. cg.a_load_reg_reg(list,OS_INT,OS_INT,regsrc2.reglo,tmpreg);
  1105. regsrc2.reglo:=tmpreg;
  1106. end;
  1107. list.concat(taicpu.op_reg_reg_reg(A_SUB, regdst.reglo, regsrc2.reglo, regsrc1.reglo));
  1108. list.concat(taicpu.op_reg_reg_reg(A_SUB, regdst.reghi, regsrc2.reghi, regsrc1.reghi));
  1109. current_asmdata.getjumplabel(no_carry);
  1110. cg.a_cmp_reg_reg_label(list,OS_INT,OC_AE, regsrc1.reglo, regsrc2.reglo, no_carry);
  1111. list.concat(taicpu.op_reg_reg_const(A_ADDI, regdst.reghi, regdst.reghi, -1));
  1112. cg.a_label(list,no_carry);
  1113. end;
  1114. else
  1115. internalerror(2020030813);
  1116. end;
  1117. end;
  1118. procedure tcg64fxtensa.a_op64_reg_reg(list : TAsmList; op : TOpCG; size : tcgsize; regsrc,regdst : tregister64);
  1119. var
  1120. tmpreg : TRegister;
  1121. instr : taicpu;
  1122. begin
  1123. case op of
  1124. OP_NEG:
  1125. begin
  1126. tmpreg:=cg.GetIntRegister(list, OS_INT);
  1127. list.concat(taicpu.op_reg_reg(A_NEG,regdst.reglo,regsrc.reglo));
  1128. list.concat(taicpu.op_reg_reg(A_NEG,regdst.reghi,regsrc.reghi));
  1129. list.concat(taicpu.op_reg_reg_const(A_ADDI,tmpreg,regdst.reghi,-1));
  1130. instr:=taicpu.op_reg_reg_reg(A_MOV,regdst.reghi,tmpreg,regdst.reglo);
  1131. instr.condition:=C_NEZ;
  1132. list.concat(instr);
  1133. end;
  1134. OP_NOT:
  1135. begin
  1136. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reglo,regdst.reglo);
  1137. cg.a_op_reg_reg(list,OP_NOT,OS_INT,regsrc.reghi,regdst.reghi);
  1138. end;
  1139. else
  1140. a_op64_reg_reg_reg(list,op,size,regsrc,regdst,regdst);
  1141. end;
  1142. end;
  1143. procedure tcg64fxtensa.a_op64_const_reg_reg(list : TAsmList; op : TOpCG; size : tcgsize; value : int64; regsrc,regdst : tregister64);
  1144. var
  1145. tmpreg64 : tregister64;
  1146. no_carry : TAsmLabel;
  1147. tmpreg: tregister;
  1148. begin
  1149. case op of
  1150. OP_NEG,
  1151. OP_NOT :
  1152. internalerror(2020030904);
  1153. else
  1154. ;
  1155. end;
  1156. case op of
  1157. OP_AND,OP_OR,OP_XOR:
  1158. begin
  1159. cg.a_op_const_reg_reg(list,op,OS_32,aint(lo(value)),regsrc.reglo,regdst.reglo);
  1160. cg.a_op_const_reg_reg(list,op,OS_32,aint(hi(value)),regsrc.reghi,regdst.reghi);
  1161. end;
  1162. OP_ADD:
  1163. begin
  1164. { could do better here (hi(value) in 248..2047), for now we support only the simple cases }
  1165. if (value>=-2048) and (value<=2047) then
  1166. begin
  1167. { we need the original src value for the comparison, do not overwrite it }
  1168. if regsrc.reglo=regdst.reglo then
  1169. begin
  1170. tmpreg:=cg.GetIntRegister(list,OS_S32);
  1171. cg.a_load_reg_reg(list,OS_INT,OS_INT,regsrc.reglo,tmpreg);
  1172. regsrc.reglo:=tmpreg;
  1173. end;
  1174. list.concat(taicpu.op_reg_reg_const(A_ADDI, regdst.reglo, regsrc.reglo, value));
  1175. list.concat(taicpu.op_reg_reg(A_MOV, regdst.reghi, regsrc.reghi));
  1176. current_asmdata.getjumplabel(no_carry);
  1177. cg.a_cmp_reg_reg_label(list,OS_INT,OC_AE, regsrc.reglo, regdst.reglo, no_carry);
  1178. list.concat(taicpu.op_reg_reg_const(A_ADDI, regdst.reghi, regdst.reghi, 1));
  1179. cg.a_label(list,no_carry);
  1180. end
  1181. else
  1182. begin
  1183. tmpreg64.reglo := cg.GetIntRegister(list,OS_S32);
  1184. tmpreg64.reghi := cg.GetIntRegister(list,OS_S32);
  1185. a_load64_const_reg(list,value,tmpreg64);
  1186. a_op64_reg_reg_reg(list,op,size,tmpreg64,regsrc,regdst);
  1187. end;
  1188. end;
  1189. OP_SHL:
  1190. begin
  1191. if (value>0) and (value<=16) then
  1192. begin
  1193. tmpreg:=cg.GetIntRegister(list,OS_32);
  1194. list.concat(taicpu.op_reg_reg_const_const(A_EXTUI, tmpreg, regsrc.reglo, 32-value, value));
  1195. list.concat(taicpu.op_reg_reg_const(A_SLLI, regdst.reglo, regsrc.reglo, value));
  1196. list.concat(taicpu.op_reg_reg_const(A_SLLI, regdst.reghi, regsrc.reghi, value));
  1197. list.concat(taicpu.op_reg_reg_reg(A_OR, regdst.reghi, tmpreg, regdst.reghi));
  1198. end
  1199. else if value=32 then
  1200. begin
  1201. cg.a_load_reg_reg(list,OS_INT,OS_INT,regsrc.reglo,regdst.reghi);
  1202. cg.a_load_const_reg(list,OS_INT,0,regdst.reglo);
  1203. end
  1204. else
  1205. Internalerror(2020082209);
  1206. end;
  1207. OP_SHR:
  1208. begin
  1209. if (value>0) and (value<=15) then
  1210. begin
  1211. tmpreg:=cg.GetIntRegister(list,OS_32);
  1212. list.concat(taicpu.op_reg_reg_const(A_SLLI, tmpreg, regsrc.reghi, 32-value));
  1213. list.concat(taicpu.op_reg_reg_const(A_SRLI, regdst.reglo, regsrc.reglo, value));
  1214. list.concat(taicpu.op_reg_reg_reg(A_OR, regdst.reglo, tmpreg, regdst.reglo));
  1215. list.concat(taicpu.op_reg_reg_const(A_SRLI, regdst.reghi, regsrc.reghi, value));
  1216. end
  1217. else if value=32 then
  1218. begin
  1219. cg.a_load_reg_reg(list,OS_INT,OS_INT,regsrc.reghi,regdst.reglo);
  1220. cg.a_load_const_reg(list,OS_INT,0,regdst.reghi);
  1221. end
  1222. else
  1223. Internalerror(2020082210);
  1224. end;
  1225. OP_SUB:
  1226. begin
  1227. { for now, we take the simple approach }
  1228. tmpreg64.reglo := cg.GetIntRegister(list,OS_S32);
  1229. tmpreg64.reghi := cg.GetIntRegister(list,OS_S32);
  1230. a_load64_const_reg(list,value,tmpreg64);
  1231. a_op64_reg_reg_reg(list,op,size,tmpreg64,regsrc,regdst);
  1232. end;
  1233. else
  1234. internalerror(2020030901);
  1235. end;
  1236. end;
  1237. procedure tcg64fxtensa.a_op64_const_reg(list : TAsmList; op : TOpCG; size : tcgsize; value : int64; reg : tregister64);
  1238. begin
  1239. a_op64_const_reg_reg(list,op,size,value,reg,reg);
  1240. end;
  1241. {$warnings off}
  1242. procedure create_codegen;
  1243. begin
  1244. cg:=tcgcpu.Create;
  1245. cg64:=tcg64fxtensa.Create;
  1246. end;
  1247. end.