cgutils.pas 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564
  1. {
  2. Copyright (c) 1998-2004 by Florian Klaempfl
  3. Some basic types and constants for the code generation
  4. This program is free software; you can redistribute it and/or modify
  5. it under the terms of the GNU General Public License as published by
  6. the Free Software Foundation; either version 2 of the License, or
  7. (at your option) any later version.
  8. This program is distributed in the hope that it will be useful,
  9. but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  11. GNU General Public License for more details.
  12. You should have received a copy of the GNU General Public License
  13. along with this program; if not, write to the Free Software
  14. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  15. ****************************************************************************
  16. }
  17. { This unit exports some helper routines which are used across the code generator }
  18. unit cgutils;
  19. {$i fpcdefs.inc}
  20. interface
  21. uses
  22. globtype,
  23. cclasses,
  24. aasmbase,
  25. cpubase,cgbase;
  26. const
  27. { implementation of max function using only functionality that can be
  28. evaluated as a constant expression by the compiler -- this is
  29. basically maxcpureg = max(max(first_int_imreg,first_fpu_imreg),first_mm_imreg)-1 }
  30. tmpmaxcpufpuintreg = first_int_imreg + ((first_fpu_imreg - first_int_imreg) * ord(first_int_imreg < first_fpu_imreg));
  31. maxcpuregister = (tmpmaxcpufpuintreg + ((first_mm_imreg - tmpmaxcpufpuintreg) * ord(tmpmaxcpufpuintreg < first_mm_imreg)))-1;
  32. type
  33. { Set type definition for cpuregisters }
  34. tcpuregisterset = set of 0..maxcpuregister;
  35. tcpuregisterarray = array of tsuperregister;
  36. { use record for type-safety; should only be accessed directly by temp
  37. manager }
  38. treftemppos = record
  39. val: asizeint;
  40. end;
  41. {$packset 1}
  42. { a reference may be volatile for reading, writing, or both. E.g., local variables
  43. inside try-blocks are volatile for writes (writes must not be removed, because at
  44. any point an exception may be triggered and then all previous writes to the
  45. variable must have been performed), but not for reads (these variables' values
  46. won't be changed behind the back of the current code just because they're in a
  47. try-block) }
  48. tvolatility = (vol_read,vol_write);
  49. tvolatilityset = set of tvolatility;
  50. {$packset default}
  51. { reference record, reordered for best alignment }
  52. preference = ^treference;
  53. treference = record
  54. offset : asizeint;
  55. symbol,
  56. relsymbol : tasmsymbol;
  57. temppos : treftemppos;
  58. {$if defined(x86)}
  59. segment,
  60. {$endif defined(x86)}
  61. base,
  62. index : tregister;
  63. refaddr : trefaddr;
  64. scalefactor : byte;
  65. {$if defined(riscv32) or defined(riscv64)}
  66. symboldata : tlinkedlistitem;
  67. {$endif riscv32/64}
  68. {$ifdef arm}
  69. symboldata : tlinkedlistitem;
  70. signindex : shortint;
  71. shiftimm : byte;
  72. addressmode : taddressmode;
  73. shiftmode : tshiftmode;
  74. {$endif arm}
  75. {$ifdef aarch64}
  76. symboldata : tlinkedlistitem;
  77. shiftimm : byte;
  78. addressmode : taddressmode;
  79. shiftmode : tshiftmode;
  80. {$endif aarch64}
  81. {$ifdef avr}
  82. addressmode : taddressmode;
  83. {$endif avr}
  84. {$ifdef m68k}
  85. { indexed increment and decrement mode }
  86. { (An)+ and -(An) }
  87. direction : tdirection;
  88. {$endif m68k}
  89. {$ifdef jvm}
  90. arrayreftype: tarrayreftype;
  91. indexbase: tregister;
  92. indexsymbol: tasmsymbol;
  93. indexoffset: aint;
  94. checkcast: boolean;
  95. {$endif jvm}
  96. volatility: tvolatilityset;
  97. alignment : byte;
  98. end;
  99. const
  100. ctempposinvalid: treftemppos = (val: low(treftemppos.val));
  101. type
  102. tsubsetregister = record
  103. subsetreg : tregister;
  104. startbit, bitlen: byte;
  105. subsetregsize: tcgsize;
  106. end;
  107. tsubsetreference = record
  108. ref: treference;
  109. bitindexreg: tregister;
  110. startbit, bitlen: byte;
  111. end;
  112. tlocation = record
  113. loc : TCGLoc;
  114. size : TCGSize;
  115. case TCGLoc of
  116. {$ifdef cpuflags}
  117. LOC_FLAGS : (resflags : tresflags);
  118. {$endif cpuflags}
  119. LOC_CONSTANT : (
  120. case longint of
  121. {$if defined(cpu64bitalu) or defined(cpuhighleveltarget)}
  122. 1 : (value : Int64);
  123. {$else cpu64bitalu or cpuhighleveltarget}
  124. {$ifdef FPC_BIG_ENDIAN}
  125. 1 : (_valuedummy,value : longint);
  126. {$else FPC_BIG_ENDIAN}
  127. 1 : (value : longint);
  128. {$endif FPC_BIG_ENDIAN}
  129. {$endif cpu64bitalu or cpuhighleveltarget}
  130. 2 : (value64 : Int64);
  131. );
  132. LOC_CREFERENCE,
  133. LOC_REFERENCE : (reference : treference);
  134. { segment in reference at the same place as in loc_register }
  135. LOC_REGISTER,
  136. LOC_CREGISTER : (
  137. case longint of
  138. 1 : (register : tregister;
  139. { some x86_64 targets require two function result registers }
  140. registerhi : tregister;
  141. {$ifdef m68k}
  142. { some m68k OSes require that the result is returned in d0 and a0
  143. the second location must be stored here }
  144. registeralias : tregister;
  145. {$endif m68k}
  146. );
  147. {$ifdef cpu64bitalu}
  148. { overlay a 128 Bit register type }
  149. 2 : (register128 : tregister128);
  150. {$else if not defined(cpuhighleveltarget}
  151. { overlay a 64 Bit register type }
  152. 2 : (register64 : tregister64);
  153. {$endif cpu64bitalu and not cpuhighleveltarget}
  154. );
  155. LOC_SUBSETREG,
  156. LOC_CSUBSETREG : (
  157. sreg: tsubsetregister;
  158. );
  159. LOC_SUBSETREF : (
  160. sref: tsubsetreference;
  161. );
  162. LOC_JUMP : (
  163. truelabel, falselabel: tasmlabel;
  164. );
  165. end;
  166. { trerefence handling }
  167. {# Clear to zero a treference }
  168. procedure reference_reset(var ref : treference; alignment: longint; volatility: tvolatilityset);
  169. {# Clear to zero a treference, and set is base address
  170. to base register.
  171. }
  172. procedure reference_reset_base(var ref: treference; base: tregister; offset: asizeint; temppos: treftemppos; alignment: longint; volatility: tvolatilityset);
  173. procedure reference_reset_symbol(var ref: treference;sym: tasmsymbol; offset: asizeint; alignment : longint; volatility: tvolatilityset);
  174. { This routine verifies if two references are the same, and
  175. if so, returns TRUE, otherwise returns false.
  176. }
  177. function references_equal(const sref,dref : treference) : boolean; {$ifdef USEINLINE}inline;{$endif USEINLINE}
  178. { tlocation handling }
  179. { cannot be used for loc_(c)reference, because that one requires an alignment }
  180. procedure location_reset(var l : tlocation;lt:TCGNonRefLoc;lsize:TCGSize);
  181. { for loc_(c)reference }
  182. procedure location_reset_ref(var l : tlocation;lt:TCGRefLoc;lsize:TCGSize; alignment: longint; volatility: tvolatilityset);
  183. { for loc_jump }
  184. procedure location_reset_jump(out l: tlocation; truelab, falselab: tasmlabel);
  185. procedure location_copy(var destloc:tlocation; const sourceloc : tlocation);
  186. procedure location_swap(var destloc,sourceloc : tlocation);
  187. function location_reg2string(const locreg: tlocation): string;
  188. { returns r with the given alignment }
  189. function setalignment(const r : treference;b : byte) : treference;
  190. { Helper function which calculate "magic" values for replacement of division
  191. by constant operation by multiplication. See the "PowerPC compiler developer
  192. manual" for more information.
  193. N is number of bits to handle, functionality tested for values 32 and 64. }
  194. procedure calc_divconst_magic_signed(N: byte; d: aInt; out magic_m: aInt; out magic_s: byte);
  195. procedure calc_divconst_magic_unsigned(N: byte; d: aWord; out magic_m: aWord; out magic_add: boolean; out magic_shift: byte);
  196. { Functions for calculating the multiplicative inverse, or reciprocal, of
  197. a divisor mod 2^N. That is, a number r such that dr = 1 (mod 2^N).
  198. WARNING: d must not be a power of 2 (including 2^0 = 1) }
  199. procedure calc_mul_inverse(N: byte; d: aWord; out reciprocal: aWord; out shift: Byte);
  200. implementation
  201. uses
  202. systems,
  203. verbose,
  204. cgobj;
  205. {****************************************************************************
  206. TReference
  207. ****************************************************************************}
  208. procedure reference_reset(var ref: treference; alignment: longint; volatility: tvolatilityset);
  209. begin
  210. FillChar(ref,sizeof(treference),0);
  211. {$ifdef arm}
  212. ref.signindex:=1;
  213. {$endif arm}
  214. ref.alignment:=alignment;
  215. ref.volatility:=volatility;
  216. ref.temppos:=ctempposinvalid;
  217. end;
  218. procedure reference_reset_base(var ref: treference; base: tregister; offset: asizeint; temppos: treftemppos ; alignment: longint; volatility: tvolatilityset);
  219. begin
  220. reference_reset(ref,alignment,volatility);
  221. ref.base:=base;
  222. ref.offset:=offset;
  223. ref.temppos:=temppos;
  224. end;
  225. procedure reference_reset_symbol(var ref: treference; sym: tasmsymbol; offset: asizeint; alignment: longint; volatility: tvolatilityset);
  226. begin
  227. reference_reset(ref,alignment,volatility);
  228. ref.symbol:=sym;
  229. ref.offset:=offset;
  230. ref.temppos:=ctempposinvalid;
  231. end;
  232. function references_equal(const sref,dref : treference):boolean; {$ifdef USEINLINE}inline;{$endif USEINLINE}
  233. begin
  234. references_equal:=CompareByte(sref,dref,sizeof(treference))=0;
  235. end;
  236. { returns r with the given alignment }
  237. function setalignment(const r : treference;b : byte) : treference;
  238. begin
  239. result:=r;
  240. result.alignment:=b;
  241. end;
  242. {****************************************************************************
  243. TLocation
  244. ****************************************************************************}
  245. procedure location_reset(var l : tlocation;lt:TCGNonRefLoc;lsize:TCGSize);
  246. begin
  247. FillChar(l,sizeof(tlocation),0);
  248. l.loc:=lt;
  249. l.size:=lsize;
  250. if l.loc in [LOC_REFERENCE,LOC_CREFERENCE,LOC_JUMP] then
  251. { call location_reset_ref/jump instead }
  252. internalerror(2009020705);
  253. end;
  254. procedure location_reset_ref(var l: tlocation; lt: TCGRefLoc; lsize: TCGSize; alignment: longint; volatility: tvolatilityset);
  255. begin
  256. FillChar(l,sizeof(tlocation),0);
  257. l.loc:=lt;
  258. l.size:=lsize;
  259. {$ifdef arm}
  260. l.reference.signindex:=1;
  261. {$endif arm}
  262. l.reference.alignment:=alignment;
  263. l.reference.volatility:=volatility;
  264. l.reference.temppos:=ctempposinvalid;
  265. end;
  266. procedure location_reset_jump(out l: tlocation; truelab, falselab: tasmlabel);
  267. begin
  268. FillChar(l,sizeof(tlocation),0);
  269. l.loc:=LOC_JUMP;
  270. l.size:=OS_NO;
  271. l.truelabel:=truelab;
  272. l.falselabel:=falselab;
  273. end;
  274. procedure location_copy(var destloc:tlocation; const sourceloc : tlocation);
  275. begin
  276. destloc:=sourceloc;
  277. end;
  278. procedure location_swap(var destloc,sourceloc : tlocation);
  279. var
  280. swapl : tlocation;
  281. begin
  282. swapl := destloc;
  283. destloc := sourceloc;
  284. sourceloc := swapl;
  285. end;
  286. function location_reg2string(const locreg: tlocation): string;
  287. begin
  288. if not (locreg.loc in [LOC_REGISTER,LOC_CREGISTER,
  289. LOC_MMXREGISTER,LOC_CMMXREGISTER,
  290. LOC_MMREGISTER,LOC_CMMREGISTER,
  291. LOC_FPUREGISTER,LOC_CFPUREGISTER]) then
  292. internalerror(2013122301);
  293. if locreg.loc in [LOC_REGISTER,LOC_CREGISTER] then
  294. begin
  295. case locreg.size of
  296. {$if defined(cpu64bitalu)}
  297. OS_128,OS_S128:
  298. result:=std_regname(locreg.registerhi)+':'+std_regname(locreg.register);
  299. {$elseif defined(cpu32bitalu)}
  300. OS_64,OS_S64:
  301. result:=std_regname(locreg.registerhi)+':'+std_regname(locreg.register);
  302. {$elseif defined(cpu16bitalu)}
  303. OS_64,OS_S64:
  304. if getsupreg(locreg.register)<first_int_imreg then
  305. result:='??:'+std_regname(locreg.registerhi)
  306. +':??:'+std_regname(locreg.register)
  307. else
  308. result:=std_regname(cg.GetNextReg(locreg.registerhi))+':'+std_regname(locreg.registerhi)
  309. +':'+std_regname(cg.GetNextReg(locreg.register))+':'+std_regname(locreg.register);
  310. OS_32,OS_S32:
  311. if getsupreg(locreg.register)<first_int_imreg then
  312. result:='??:'+std_regname(locreg.register)
  313. else
  314. result:=std_regname(cg.GetNextReg(locreg.register))
  315. +':'+std_regname(locreg.register);
  316. {$elseif defined(cpu8bitalu)}
  317. OS_64,OS_S64:
  318. if getsupreg(locreg.register)<first_int_imreg then
  319. result:='??:??:??:'+std_regname(locreg.registerhi)
  320. +':??:??:??:'+std_regname(locreg.register)
  321. else
  322. result:=std_regname(cg.GetNextReg(cg.GetNextReg(cg.GetNextReg(locreg.registerhi))))
  323. +':'+std_regname(cg.GetNextReg(cg.GetNextReg(locreg.registerhi)))
  324. +':'+std_regname(cg.GetNextReg(locreg.registerhi))
  325. +':'+std_regname(locreg.registerhi)
  326. +':'+std_regname(cg.GetNextReg(cg.GetNextReg(cg.GetNextReg(locreg.register))))
  327. +':'+std_regname(cg.GetNextReg(cg.GetNextReg(locreg.register)))
  328. +':'+std_regname(cg.GetNextReg(locreg.register))
  329. +':'+std_regname(locreg.register);
  330. OS_32,OS_S32:
  331. if getsupreg(locreg.register)<first_int_imreg then
  332. result:='??:??:??:'+std_regname(locreg.register)
  333. else
  334. result:=std_regname(cg.GetNextReg(cg.GetNextReg(cg.GetNextReg(locreg.register))))
  335. +':'+std_regname(cg.GetNextReg(cg.GetNextReg(locreg.register)))
  336. +':'+std_regname(cg.GetNextReg(locreg.register))+':'+std_regname(locreg.register);
  337. OS_16,OS_S16:
  338. if getsupreg(locreg.register)<first_int_imreg then
  339. result:='??:'+std_regname(locreg.register)
  340. else
  341. result:=std_regname(cg.GetNextReg(locreg.register))+':'+std_regname(locreg.register);
  342. {$endif}
  343. else
  344. result:=std_regname(locreg.register);
  345. end;
  346. end
  347. else
  348. begin
  349. if locreg.registerhi<>NR_NO then
  350. result:=std_regname(locreg.registerhi)+':'+std_regname(locreg.register)
  351. else
  352. result:=std_regname(locreg.register);
  353. end;
  354. end;
  355. {$push}
  356. {$r-,q-}
  357. procedure calc_divconst_magic_signed(N: byte; d: aInt; out magic_m: aInt; out magic_s: byte);
  358. var
  359. p: aInt;
  360. ad,anc,delta,q1,r1,q2,r2,t: aWord;
  361. two_N_minus_1: aWord;
  362. begin
  363. assert((d<-1) or (d>1));
  364. two_N_minus_1:=aWord(1) shl (N-1);
  365. ad:=abs(d);
  366. t:=two_N_minus_1+(aWord(d) shr (N-1));
  367. anc:=t-1-t mod ad; { absolute value of nc }
  368. p:=(N-1); { initialize p }
  369. q1:=two_N_minus_1 div anc; { initialize q1 = 2**p/abs(nc) }
  370. r1:=two_N_minus_1-q1*anc; { initialize r1 = rem(2**p,abs(nc)) }
  371. q2:=two_N_minus_1 div ad; { initialize q2 = 2**p/abs(d) }
  372. r2:=two_N_minus_1-q2*ad; { initialize r2 = rem(2**p,abs(d)) }
  373. repeat
  374. inc(p);
  375. q1:=2*q1; { update q1 = 2**p/abs(nc) }
  376. r1:=2*r1; { update r1 = rem(2**p/abs(nc)) }
  377. if (r1>=anc) then { must be unsigned comparison }
  378. begin
  379. inc(q1);
  380. dec(r1,anc);
  381. end;
  382. q2:=2*q2; { update q2 = 2p/abs(d) }
  383. r2:=2*r2; { update r2 = rem(2p/abs(d)) }
  384. if (r2>=ad) then { must be unsigned comparison }
  385. begin
  386. inc(q2);
  387. dec(r2,ad);
  388. end;
  389. delta:=ad-r2;
  390. until not ((q1<delta) or ((q1=delta) and (r1=0)));
  391. magic_m:=q2+1;
  392. if (d<0) then
  393. magic_m:=-magic_m; { resulting magic number }
  394. magic_s:=p-N; { resulting shift }
  395. end;
  396. procedure calc_divconst_magic_unsigned(N: byte; d: aWord; out magic_m: aWord; out magic_add: boolean; out magic_shift: byte);
  397. var
  398. p: aInt;
  399. nc,delta,q1,r1,q2,r2,two_N_minus_1 : aWord;
  400. mask: aWord;
  401. begin
  402. two_N_minus_1:=aWord(1) shl (N-1);
  403. magic_add:=false;
  404. {$push}
  405. {$warnings off }
  406. mask:=aWord(not 0) shr ((64-N) and (sizeof(aWord)*8-1));
  407. nc:=(mask-(-d) mod aInt(d));
  408. {$pop}
  409. p:=N-1; { initialize p }
  410. q1:=two_N_minus_1 div nc; { initialize q1 = 2**p/nc }
  411. r1:=two_N_minus_1-q1*nc; { initialize r1 = rem(2**p,nc) }
  412. q2:=(two_N_minus_1-1) div d; { initialize q2 = (2**p-1)/d }
  413. r2:=(two_N_minus_1-1)-q2*d; { initialize r2 = rem((2**p-1),d) }
  414. repeat
  415. inc(p);
  416. if (r1>=(nc-r1)) then
  417. begin
  418. q1:=2*q1+1; { update q1 }
  419. r1:=2*r1-nc; { update r1 }
  420. end
  421. else
  422. begin
  423. q1:=2*q1; { update q1 }
  424. r1:=2*r1; { update r1 }
  425. end;
  426. if ((r2+1)>=(d-r2)) then
  427. begin
  428. if (q2>=(two_N_minus_1-1)) then
  429. magic_add:=true;
  430. q2:=2*q2+1; { update q2 }
  431. r2:=2*r2+1-d; { update r2 }
  432. end
  433. else
  434. begin
  435. if (q2>=two_N_minus_1) then
  436. magic_add:=true;
  437. q2:=2*q2; { update q2 }
  438. r2:=2*r2+1; { update r2 }
  439. end;
  440. delta:=d-1-r2;
  441. until not ((p<(2*N)) and ((q1<delta) or ((q1=delta) and (r1=0))));
  442. magic_m:=(q2+1) and mask; { resulting magic number }
  443. magic_shift:=p-N; { resulting shift }
  444. end;
  445. procedure calc_mul_inverse(N: byte; d: aWord; out reciprocal: aWord; out shift: Byte);
  446. var
  447. mask, oldr, newd, swap_r, swap_d, q: aWord;
  448. begin
  449. { WARNING: d must not be a power of 2 (including 2^0 = 1) }
  450. {$push}
  451. {$warnings off }
  452. if N=(SizeOf(aWord) * 8) then
  453. newd:=0
  454. else
  455. newd:=aWord(1) shl N; { Used later }
  456. mask:=newd-1;
  457. oldr:=mask;
  458. {$pop}
  459. { Trim off powers of 2 so d is an odd number }
  460. {$if defined(cpu64bitalu)}
  461. shift:=BsfQWord(d);
  462. {$elseif defined(cpu32bitalu)}
  463. shift:=BsfDWord(d);
  464. {$elseif defined(cpu16bitalu)}
  465. shift:=BsfWord(d);
  466. {$elseif defined(cpu8bitalu)}
  467. shift:=BsfByte(d);
  468. {$else}
  469. {$error ALU not defined}
  470. {$endif}
  471. if shift = 255 then
  472. { This is a divide by zero that should have been caught earlier }
  473. InternalError(2021091001);
  474. d := d shr shift;
  475. { Calculate reciprocal using the Extended Euclidean Algorithm as
  476. described on page 244 of Hacker's Delight, Second Edition.
  477. x1 = oldr
  478. x2 = reciprocal
  479. x3 = swap_r
  480. v1 = newd
  481. v2 = d
  482. v3 = swap_d
  483. }
  484. newd:=newd-d; { -d }
  485. reciprocal:=1;
  486. repeat
  487. q := newd div d;
  488. swap_d:=(newd-(q*d)) and mask;
  489. newd:=d;
  490. d:=swap_d;
  491. swap_r:=(oldr-(q*reciprocal)) and mask;
  492. oldr:=reciprocal;
  493. reciprocal:=swap_r;
  494. until d<=1;
  495. end;
  496. {$pop}
  497. end.