n386set.pas 38 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943
  1. {
  2. $Id$
  3. Copyright (c) 1998-2002 by Florian Klaempfl
  4. Generate i386 assembler for in set/case nodes
  5. This program is free software; you can redistribute it and/or modify
  6. it under the terms of the GNU General Public License as published by
  7. the Free Software Foundation; either version 2 of the License, or
  8. (at your option) any later version.
  9. This program is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU General Public License for more details.
  13. You should have received a copy of the GNU General Public License
  14. along with this program; if not, write to the Free Software
  15. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  16. ****************************************************************************
  17. }
  18. unit n386set;
  19. {$i fpcdefs.inc}
  20. interface
  21. uses
  22. node,nset,pass_1,ncgset;
  23. type
  24. ti386innode = class(tinnode)
  25. procedure pass_2;override;
  26. function pass_1 : tnode;override;
  27. end;
  28. ti386casenode = class(tcgcasenode)
  29. procedure optimizevalues(var max_linear_list:longint;var max_dist:cardinal);override;
  30. function has_jumptable : boolean;override;
  31. procedure genjumptable(hp : pcaserecord;min_,max_ : longint);override;
  32. procedure genlinearlist(hp : pcaserecord);override;
  33. end;
  34. implementation
  35. uses
  36. globtype,systems,
  37. verbose,globals,
  38. symconst,symdef,defutil,
  39. aasmbase,aasmtai,aasmcpu,
  40. cginfo,cgbase,pass_2,
  41. ncon,
  42. cpubase,cpuinfo,
  43. cga,cgx86,cgobj,tgobj,ncgutil,rgobj;
  44. {*****************************************************************************
  45. TI386INNODE
  46. *****************************************************************************}
  47. function ti386innode.pass_1 : tnode;
  48. begin
  49. result:=nil;
  50. { this is the only difference from the generic version }
  51. expectloc:=LOC_FLAGS;
  52. firstpass(right);
  53. firstpass(left);
  54. if codegenerror then
  55. exit;
  56. left_right_max;
  57. { this is not allways true due to optimization }
  58. { but if we don't set this we get problems with optimizing self code }
  59. if tsetdef(right.resulttype.def).settype<>smallset then
  60. include(current_procinfo.flags,pi_do_call)
  61. else
  62. begin
  63. { a smallset needs maybe an misc. register }
  64. if (left.nodetype<>ordconstn) and
  65. not(right.location.loc in [LOC_CREGISTER,LOC_REGISTER]) and
  66. (right.registers32<1) then
  67. inc(registers32);
  68. end;
  69. end;
  70. procedure ti386innode.pass_2;
  71. type
  72. Tsetpart=record
  73. range : boolean; {Part is a range.}
  74. start,stop : byte; {Start/stop when range; Stop=element when an element.}
  75. end;
  76. var
  77. genjumps,
  78. use_small,
  79. ranges : boolean;
  80. hr,hr2,
  81. pleftreg : tregister;
  82. href : treference;
  83. opsize : topsize;
  84. setparts : array[1..8] of Tsetpart;
  85. i,numparts : byte;
  86. adjustment : longint;
  87. pushedregs : tmaybesave;
  88. l,l2 : tasmlabel;
  89. r : Tregister;
  90. {$ifdef CORRECT_SET_IN_FPC}
  91. AM : tasmop;
  92. {$endif CORRECT_SET_IN_FPC}
  93. function analizeset(Aset:pconstset;is_small:boolean):boolean;
  94. type
  95. byteset=set of byte;
  96. var
  97. compares,maxcompares:word;
  98. i:byte;
  99. begin
  100. if byteset(Aset^)=[] then
  101. {The expression...
  102. if expr in []
  103. ...is allways false. It should be optimized away in the
  104. resulttype pass, and thus never occur here. Since we
  105. do generate wrong code for it, do internalerror.}
  106. internalerror(2002072301);
  107. analizeset:=false;
  108. ranges:=false;
  109. numparts:=0;
  110. compares:=0;
  111. { Lots of comparisions take a lot of time, so do not allow
  112. too much comparisions. 8 comparisions are, however, still
  113. smalller than emitting the set }
  114. if cs_littlesize in aktglobalswitches then
  115. maxcompares:=8
  116. else
  117. maxcompares:=5;
  118. { when smallset is possible allow only 3 compares the smallset
  119. code is for littlesize also smaller when more compares are used }
  120. if is_small then
  121. maxcompares:=3;
  122. for i:=0 to 255 do
  123. if i in byteset(Aset^) then
  124. begin
  125. if (numparts=0) or (i<>setparts[numparts].stop+1) then
  126. begin
  127. {Set element is a separate element.}
  128. inc(compares);
  129. if compares>maxcompares then
  130. exit;
  131. inc(numparts);
  132. setparts[numparts].range:=false;
  133. setparts[numparts].stop:=i;
  134. end
  135. else
  136. {Set element is part of a range.}
  137. if not setparts[numparts].range then
  138. begin
  139. {Transform an element into a range.}
  140. setparts[numparts].range:=true;
  141. setparts[numparts].start:=setparts[numparts].stop;
  142. setparts[numparts].stop:=i;
  143. ranges := true;
  144. { there's only one compare per range anymore. Only a }
  145. { sub is added, but that's much faster than a }
  146. { cmp/jcc combo so neglect its effect }
  147. { inc(compares);
  148. if compares>maxcompares then
  149. exit; }
  150. end
  151. else
  152. begin
  153. {Extend a range.}
  154. setparts[numparts].stop:=i;
  155. end;
  156. end;
  157. analizeset:=true;
  158. end;
  159. begin
  160. { We check first if we can generate jumps, this can be done
  161. because the resulttype.def is already set in firstpass }
  162. { check if we can use smallset operation using btl which is limited
  163. to 32 bits, the left side may also not contain higher values !! }
  164. use_small:=(tsetdef(right.resulttype.def).settype=smallset) and
  165. ((left.resulttype.def.deftype=orddef) and (torddef(left.resulttype.def).high<=32) or
  166. (left.resulttype.def.deftype=enumdef) and (tenumdef(left.resulttype.def).max<=32));
  167. { Can we generate jumps? Possible for all types of sets }
  168. genjumps:=(right.nodetype=setconstn) and
  169. analizeset(tsetconstnode(right).value_set,use_small);
  170. { calculate both operators }
  171. { the complex one first }
  172. firstcomplex(self);
  173. secondpass(left);
  174. { Only process the right if we are not generating jumps }
  175. if not genjumps then
  176. begin
  177. {$ifndef newra}
  178. maybe_save(exprasmlist,right.registers32,left.location,pushedregs);
  179. {$endif}
  180. secondpass(right);
  181. {$ifndef newra}
  182. maybe_restore(exprasmlist,left.location,pushedregs);
  183. {$endif newra}
  184. end;
  185. if codegenerror then
  186. exit;
  187. { ofcourse not commutative }
  188. if nf_swaped in flags then
  189. swapleftright;
  190. if genjumps then
  191. begin
  192. { It gives us advantage to check for the set elements
  193. separately instead of using the SET_IN_BYTE procedure.
  194. To do: Build in support for LOC_JUMP }
  195. opsize := def_opsize(left.resulttype.def);
  196. { If register is used, use only lower 8 bits }
  197. if left.location.loc in [LOC_REGISTER,LOC_CREGISTER] then
  198. begin
  199. { for ranges we always need a 32bit register, because then we }
  200. { use the register as base in a reference (JM) }
  201. pleftreg.enum:=R_INTREGISTER;
  202. if ranges then
  203. begin
  204. pleftreg.number:=(left.location.register.number and not $ff) or R_SUBWHOLE;
  205. cg.a_load_reg_reg(exprasmlist,left.location.size,OS_INT,left.location.register,pleftreg);
  206. if opsize <> S_L then
  207. emit_const_reg(A_AND,S_L,255,pleftreg);
  208. opsize := S_L;
  209. end
  210. else
  211. { otherwise simply use the lower 8 bits (no "and" }
  212. { necessary this way) (JM) }
  213. begin
  214. pleftreg.number:=(left.location.register.number and not $ff) or R_SUBL;
  215. opsize := S_B;
  216. end;
  217. end
  218. else
  219. begin
  220. { load the value in a register }
  221. {$ifdef newra}
  222. pleftreg:=rg.getregisterint(exprasmlist,OS_INT);
  223. {$else}
  224. pleftreg := rg.getexplicitregisterint(exprasmlist,NR_EDI);
  225. {$endif}
  226. opsize := S_L;
  227. emit_ref_reg(A_MOVZX,S_BL,left.location.reference,pleftreg);
  228. location_release(exprasmlist,left.location);
  229. end;
  230. { Get a label to jump to the end }
  231. location_reset(location,LOC_FLAGS,OS_NO);
  232. { It's better to use the zero flag when there are
  233. no ranges }
  234. if ranges then
  235. location.resflags:=F_C
  236. else
  237. location.resflags:=F_E;
  238. objectlibrary.getlabel(l);
  239. { how much have we already substracted from the x in the }
  240. { "x in [y..z]" expression }
  241. adjustment := 0;
  242. r.enum:=R_NO;
  243. for i:=1 to numparts do
  244. if setparts[i].range then
  245. { use fact that a <= x <= b <=> cardinal(x-a) <= cardinal(b-a) }
  246. begin
  247. { is the range different from all legal values? }
  248. if (setparts[i].stop-setparts[i].start <> 255) then
  249. begin
  250. { yes, is the lower bound <> 0? }
  251. if (setparts[i].start <> 0) then
  252. { we're going to substract from the left register, }
  253. { so in case of a LOC_CREGISTER first move the value }
  254. { to edi (not done before because now we can do the }
  255. { move and substract in one instruction with LEA) }
  256. if {$ifndef newra}(pleftreg.number <> NR_EDI) and{$endif}
  257. (left.location.loc = LOC_CREGISTER) then
  258. begin
  259. rg.ungetregister(exprasmlist,pleftreg);
  260. {$ifdef newra}
  261. r:=rg.getregisterint(exprasmlist,OS_INT);
  262. {$else}
  263. r.enum:=R_INTREGISTER;
  264. r.number:=NR_EDI;
  265. rg.getexplicitregisterint(exprasmlist,NR_EDI);
  266. {$endif}
  267. reference_reset_base(href,pleftreg,-setparts[i].start);
  268. emit_ref_reg(A_LEA,S_L,href,r);
  269. { only now change pleftreg since previous value is }
  270. { still used in previous instruction }
  271. pleftreg := r;
  272. opsize := S_L;
  273. end
  274. else
  275. begin
  276. { otherwise, the value is already in a register }
  277. { that can be modified }
  278. if setparts[i].start-adjustment <> 1 then
  279. emit_const_reg(A_SUB,opsize,
  280. setparts[i].start-adjustment,pleftreg)
  281. else emit_reg(A_DEC,opsize,pleftreg);
  282. end;
  283. { new total value substracted from x: }
  284. { adjustment + (setparts[i].start - adjustment) }
  285. adjustment := setparts[i].start;
  286. { check if result < b-a+1 (not "result <= b-a", since }
  287. { we need a carry in case the element is in the range }
  288. { (this will never overflow since we check at the }
  289. { beginning whether stop-start <> 255) }
  290. emit_const_reg(A_CMP,opsize,
  291. setparts[i].stop-setparts[i].start+1,pleftreg);
  292. { use C_C instead of C_B: the meaning is the same, but }
  293. { then the optimizer can easier trace the jump to its }
  294. { final destination since the resultflag of this node }
  295. { is set to the carryflag }
  296. emitjmp(C_C,l);
  297. end
  298. else
  299. { if setparts[i].start = 0 and setparts[i].stop = 255, }
  300. { it's always true since "in" is only allowed for bytes }
  301. begin
  302. emit_none(A_STC,S_NO);
  303. cg.a_jmp_always(exprasmlist,l);
  304. end;
  305. end
  306. else
  307. begin
  308. { Emit code to check if left is an element }
  309. emit_const_reg(A_CMP,opsize,setparts[i].stop-adjustment,
  310. pleftreg);
  311. { Result should be in carry flag when ranges are used }
  312. if ranges then
  313. emit_none(A_STC,S_NO);
  314. { If found, jump to end }
  315. emitjmp(C_E,l);
  316. end;
  317. if ranges and
  318. { if the last one was a range, the carry flag is already }
  319. { set appropriately }
  320. not(setparts[numparts].range) then
  321. emit_none(A_CLC,S_NO);
  322. { To compensate for not doing a second pass }
  323. right.location.reference.symbol:=nil;
  324. { Now place the end label }
  325. cg.a_label(exprasmlist,l);
  326. {$ifdef newra}
  327. rg.ungetregisterint(exprasmlist,pleftreg);
  328. if r.enum=R_INTREGISTER then
  329. rg.ungetregisterint(exprasmlist,r);
  330. {$else}
  331. case left.location.loc of
  332. LOC_REGISTER,
  333. LOC_CREGISTER :
  334. rg.ungetregisterint(exprasmlist,pleftreg);
  335. else
  336. begin
  337. reference_release(exprasmlist,left.location.reference);
  338. r.enum:=R_INTREGISTER;
  339. r.number:=NR_EDI;
  340. rg.ungetregisterint(exprasmlist,r);
  341. end;
  342. end;
  343. {$endif}
  344. end
  345. else
  346. begin
  347. location_reset(location,LOC_FLAGS,OS_NO);
  348. { We will now generated code to check the set itself, no jmps,
  349. handle smallsets separate, because it allows faster checks }
  350. if use_small then
  351. begin
  352. if left.nodetype=ordconstn then
  353. begin
  354. location.resflags:=F_NE;
  355. case right.location.loc of
  356. LOC_REGISTER,
  357. LOC_CREGISTER:
  358. begin
  359. emit_const_reg(A_TEST,S_L,
  360. 1 shl (tordconstnode(left).value and 31),right.location.register);
  361. end;
  362. LOC_REFERENCE,
  363. LOC_CREFERENCE :
  364. begin
  365. emit_const_ref(A_TEST,S_L,1 shl (tordconstnode(left).value and 31),
  366. right.location.reference);
  367. end;
  368. else
  369. internalerror(200203312);
  370. end;
  371. location_release(exprasmlist,right.location);
  372. end
  373. else
  374. begin
  375. case left.location.loc of
  376. LOC_REGISTER,
  377. LOC_CREGISTER:
  378. begin
  379. hr.enum:=R_INTREGISTER;
  380. hr.number:=(left.location.register.number and not $ff) or R_SUBWHOLE;
  381. cg.a_load_reg_reg(exprasmlist,left.location.size,OS_INT,left.location.register,hr);
  382. end;
  383. else
  384. begin
  385. { the set element isn't never samller than a byte }
  386. { and because it's a small set we need only 5 bits }
  387. { but 8 bits are easier to load }
  388. r.enum:=R_INTREGISTER;
  389. r.number:=NR_EDI;
  390. rg.getexplicitregisterint(exprasmlist,NR_EDI);
  391. emit_ref_reg(A_MOVZX,S_BL,left.location.reference,r);
  392. hr:=r;
  393. location_release(exprasmlist,left.location);
  394. end;
  395. end;
  396. case right.location.loc of
  397. LOC_REGISTER,
  398. LOC_CREGISTER :
  399. begin
  400. emit_reg_reg(A_BT,S_L,hr,
  401. right.location.register);
  402. rg.ungetregisterint(exprasmlist,right.location.register);
  403. end;
  404. LOC_CONSTANT :
  405. begin
  406. { We have to load the value into a register because
  407. btl does not accept values only refs or regs (PFV) }
  408. hr2:=rg.getregisterint(exprasmlist,OS_INT);
  409. emit_const_reg(A_MOV,S_L,
  410. right.location.value,hr2);
  411. emit_reg_reg(A_BT,S_L,hr,hr2);
  412. rg.ungetregisterint(exprasmlist,hr2);
  413. end;
  414. LOC_CREFERENCE,
  415. LOC_REFERENCE :
  416. begin
  417. location_release(exprasmlist,right.location);
  418. emit_reg_ref(A_BT,S_L,hr,right.location.reference);
  419. end;
  420. else
  421. internalerror(2002032210);
  422. end;
  423. { simply to indicate EDI is deallocated here too (JM) }
  424. rg.ungetregisterint(exprasmlist,hr);
  425. location.resflags:=F_C;
  426. end;
  427. end
  428. else
  429. begin
  430. if right.location.loc=LOC_CONSTANT then
  431. begin
  432. location.resflags:=F_C;
  433. objectlibrary.getlabel(l);
  434. objectlibrary.getlabel(l2);
  435. { load constants to a register }
  436. if left.nodetype=ordconstn then
  437. location_force_reg(exprasmlist,left.location,OS_INT,true);
  438. case left.location.loc of
  439. LOC_REGISTER,
  440. LOC_CREGISTER:
  441. begin
  442. hr:=rg.makeregsize(left.location.register,OS_INT);
  443. cg.a_load_reg_reg(exprasmlist,left.location.size,OS_INT,left.location.register,hr);
  444. emit_const_reg(A_CMP,S_L,31,hr);
  445. emitjmp(C_NA,l);
  446. { reset carry flag }
  447. emit_none(A_CLC,S_NO);
  448. cg.a_jmp_always(exprasmlist,l2);
  449. cg.a_label(exprasmlist,l);
  450. { We have to load the value into a register because
  451. btl does not accept values only refs or regs (PFV) }
  452. hr2:=rg.getregisterint(exprasmlist,OS_INT);
  453. emit_const_reg(A_MOV,S_L,right.location.value,hr2);
  454. emit_reg_reg(A_BT,S_L,hr,hr2);
  455. rg.ungetregisterint(exprasmlist,hr2);
  456. end;
  457. else
  458. begin
  459. {$ifdef CORRECT_SET_IN_FPC}
  460. if m_tp in aktmodeswitches then
  461. begin
  462. {***WARNING only correct if
  463. reference is 32 bits (PM) *****}
  464. emit_const_ref(A_CMP,S_L,31,reference_copy(left.location.reference));
  465. end
  466. else
  467. {$endif CORRECT_SET_IN_FPC}
  468. begin
  469. emit_const_ref(A_CMP,S_B,31,left.location.reference);
  470. end;
  471. emitjmp(C_NA,l);
  472. { reset carry flag }
  473. emit_none(A_CLC,S_NO);
  474. cg.a_jmp_always(exprasmlist,l2);
  475. cg.a_label(exprasmlist,l);
  476. location_release(exprasmlist,left.location);
  477. hr:=rg.getregisterint(exprasmlist,OS_INT);
  478. emit_ref_reg(A_MOV,S_L,left.location.reference,hr);
  479. { We have to load the value into a register because
  480. btl does not accept values only refs or regs (PFV) }
  481. hr2:=rg.getregisterint(exprasmlist,OS_INT);
  482. emit_const_reg(A_MOV,S_L,
  483. right.location.value,hr2);
  484. emit_reg_reg(A_BT,S_L,hr,hr2);
  485. rg.ungetregisterint(exprasmlist,hr2);
  486. end;
  487. end;
  488. cg.a_label(exprasmlist,l2);
  489. end { of right.location.loc=LOC_CONSTANT }
  490. { do search in a normal set which could have >32 elementsm
  491. but also used if the left side contains higher values > 32 }
  492. else if left.nodetype=ordconstn then
  493. begin
  494. location.resflags:=F_NE;
  495. inc(right.location.reference.offset,tordconstnode(left).value shr 3);
  496. emit_const_ref(A_TEST,S_B,1 shl (tordconstnode(left).value and 7),right.location.reference);
  497. location_release(exprasmlist,right.location);
  498. end
  499. else
  500. begin
  501. if (left.location.loc in [LOC_REGISTER,LOC_CREGISTER]) then
  502. begin
  503. pleftreg.enum:=R_INTREGISTER;
  504. pleftreg.number:=(left.location.register.number and not $ff) or R_SUBWHOLE;
  505. end
  506. else
  507. {$ifdef newra}
  508. pleftreg:=rg.getregisterint(exprasmlist,OS_INT);
  509. {$else}
  510. pleftreg:=rg.getexplicitregisterint(exprasmlist,NR_EDI);
  511. {$endif}
  512. cg.a_load_loc_reg(exprasmlist,left.location,pleftreg);
  513. location_freetemp(exprasmlist,left.location);
  514. location_release(exprasmlist,left.location);
  515. emit_reg_ref(A_BT,S_L,pleftreg,right.location.reference);
  516. rg.ungetregisterint(exprasmlist,pleftreg);
  517. location_release(exprasmlist,right.location);
  518. { tg.ungetiftemp(exprasmlist,right.location.reference) happens below }
  519. location.resflags:=F_C;
  520. end;
  521. end;
  522. end;
  523. if not genjumps then
  524. location_freetemp(exprasmlist,right.location);
  525. end;
  526. {*****************************************************************************
  527. TI386CASENODE
  528. *****************************************************************************}
  529. procedure ti386casenode.optimizevalues(var max_linear_list:longint;var max_dist:cardinal);
  530. begin
  531. { a jump table crashes the pipeline! }
  532. if aktoptprocessor=Class386 then
  533. inc(max_linear_list,3)
  534. else if aktoptprocessor=ClassP5 then
  535. inc(max_linear_list,6)
  536. else if aktoptprocessor>=ClassP6 then
  537. inc(max_linear_list,9);
  538. end;
  539. function ti386casenode.has_jumptable : boolean;
  540. begin
  541. has_jumptable:=true;
  542. end;
  543. procedure ti386casenode.genjumptable(hp : pcaserecord;min_,max_ : longint);
  544. var
  545. table : tasmlabel;
  546. last : TConstExprInt;
  547. indexreg : tregister;
  548. href : treference;
  549. jumpsegment : TAAsmOutput;
  550. procedure genitem(t : pcaserecord);
  551. var
  552. i : longint;
  553. begin
  554. if assigned(t^.less) then
  555. genitem(t^.less);
  556. { fill possible hole }
  557. for i:=last+1 to t^._low-1 do
  558. jumpSegment.concat(Tai_const_symbol.Create(elselabel));
  559. for i:=t^._low to t^._high do
  560. jumpSegment.concat(Tai_const_symbol.Create(t^.statement));
  561. last:=t^._high;
  562. if assigned(t^.greater) then
  563. genitem(t^.greater);
  564. end;
  565. begin
  566. if (cs_create_smart in aktmoduleswitches) then
  567. jumpsegment:=current_procinfo.aktlocaldata
  568. else
  569. jumpsegment:=datasegment;
  570. if not(jumptable_no_range) then
  571. begin
  572. { case expr less than min_ => goto elselabel }
  573. cg.a_cmp_const_reg_label(exprasmlist,OS_INT,jmp_lt,aword(min_),hregister,elselabel);
  574. { case expr greater than max_ => goto elselabel }
  575. cg.a_cmp_const_reg_label(exprasmlist,OS_INT,jmp_gt,aword(max_),hregister,elselabel);
  576. end;
  577. objectlibrary.getlabel(table);
  578. { make it a 32bit register }
  579. indexreg.enum:=R_INTREGISTER;
  580. indexreg.number:=(hregister.number and not $ff) or R_SUBWHOLE;
  581. cg.a_load_reg_reg(exprasmlist,opsize,OS_INT,hregister,indexreg);
  582. { create reference }
  583. reference_reset_symbol(href,table,0);
  584. href.offset:=(-longint(min_))*4;
  585. href.index:=indexreg;
  586. href.scalefactor:=4;
  587. emit_ref(A_JMP,S_NO,href);
  588. { generate jump table }
  589. if not(cs_littlesize in aktglobalswitches) then
  590. jumpSegment.concat(Tai_Align.Create_Op(4,0));
  591. jumpSegment.concat(Tai_label.Create(table));
  592. last:=min_;
  593. genitem(hp);
  594. end;
  595. procedure ti386casenode.genlinearlist(hp : pcaserecord);
  596. var
  597. first : boolean;
  598. lastrange : boolean;
  599. last : TConstExprInt;
  600. cond_lt,cond_le : tasmcond;
  601. procedure genitem(t : pcaserecord);
  602. begin
  603. if assigned(t^.less) then
  604. genitem(t^.less);
  605. { need we to test the first value }
  606. if first and (t^._low>get_min_value(left.resulttype.def)) then
  607. begin
  608. cg.a_cmp_const_reg_label(exprasmlist,OS_INT,jmp_lt,aword(t^._low),hregister,elselabel);
  609. end;
  610. if t^._low=t^._high then
  611. begin
  612. if t^._low-last=0 then
  613. cg.a_cmp_const_reg_label(exprasmlist, OS_INT, OC_EQ,0,hregister,t^.statement)
  614. else
  615. begin
  616. cg.a_op_const_reg(exprasmlist, OP_SUB, aword(t^._low-last), hregister);
  617. emitjmp(C_Z,t^.statement);
  618. end;
  619. last:=t^._low;
  620. lastrange:=false;
  621. end
  622. else
  623. begin
  624. { it begins with the smallest label, if the value }
  625. { is even smaller then jump immediately to the }
  626. { ELSE-label }
  627. if first then
  628. begin
  629. { have we to ajust the first value ? }
  630. if (t^._low>get_min_value(left.resulttype.def)) then
  631. cg.a_op_const_reg(exprasmlist, OP_SUB, longint(t^._low), hregister);
  632. end
  633. else
  634. begin
  635. { if there is no unused label between the last and the }
  636. { present label then the lower limit can be checked }
  637. { immediately. else check the range in between: }
  638. cg.a_op_const_reg(exprasmlist, OP_SUB, longint(t^._low-last), hregister);
  639. { no jump necessary here if the new range starts at }
  640. { at the value following the previous one }
  641. if ((t^._low-last) <> 1) or
  642. (not lastrange) then
  643. emitjmp(cond_lt,elselabel);
  644. end;
  645. {we need to use A_SUB, because A_DEC does not set the correct flags, therefor
  646. using a_op_const_reg(OP_SUB) is not possible }
  647. emit_const_reg(A_SUB,TCGSize2OpSize[opsize],longint(t^._high-t^._low),hregister);
  648. emitjmp(cond_le,t^.statement);
  649. last:=t^._high;
  650. lastrange:=true;
  651. end;
  652. first:=false;
  653. if assigned(t^.greater) then
  654. genitem(t^.greater);
  655. end;
  656. begin
  657. if with_sign then
  658. begin
  659. cond_lt:=C_L;
  660. cond_le:=C_LE;
  661. end
  662. else
  663. begin
  664. cond_lt:=C_B;
  665. cond_le:=C_BE;
  666. end;
  667. { do we need to generate cmps? }
  668. if (with_sign and (min_label<0)) then
  669. genlinearcmplist(hp)
  670. else
  671. begin
  672. last:=0;
  673. lastrange:=false;
  674. first:=true;
  675. genitem(hp);
  676. cg.a_jmp_always(exprasmlist,elselabel);
  677. end;
  678. end;
  679. begin
  680. {$ifndef TEST_GENERIC}
  681. cinnode:=ti386innode;
  682. {$endif}
  683. ccasenode:=ti386casenode;
  684. end.
  685. {
  686. $Log$
  687. Revision 1.57 2003-04-27 11:21:35 peter
  688. * aktprocdef renamed to current_procdef
  689. * procinfo renamed to current_procinfo
  690. * procinfo will now be stored in current_module so it can be
  691. cleaned up properly
  692. * gen_main_procsym changed to create_main_proc and release_main_proc
  693. to also generate a tprocinfo structure
  694. * fixed unit implicit initfinal
  695. Revision 1.56 2003/04/25 08:25:26 daniel
  696. * Ifdefs around a lot of calls to cleartempgen
  697. * Fixed registers that are allocated but not freed in several nodes
  698. * Tweak to register allocator to cause less spills
  699. * 8-bit registers now interfere with esi,edi and ebp
  700. Compiler can now compile rtl successfully when using new register
  701. allocator
  702. Revision 1.55 2003/04/23 09:51:16 daniel
  703. * Removed usage of edi in a lot of places when new register allocator used
  704. + Added newra versions of g_concatcopy and secondadd_float
  705. Revision 1.54 2003/04/22 23:50:23 peter
  706. * firstpass uses expectloc
  707. * checks if there are differences between the expectloc and
  708. location.loc from secondpass in EXTDEBUG
  709. Revision 1.53 2003/04/22 14:33:38 peter
  710. * removed some notes/hints
  711. Revision 1.52 2003/04/22 10:09:35 daniel
  712. + Implemented the actual register allocator
  713. + Scratch registers unavailable when new register allocator used
  714. + maybe_save/maybe_restore unavailable when new register allocator used
  715. Revision 1.51 2003/03/13 19:52:23 jonas
  716. * and more new register allocator fixes (in the i386 code generator this
  717. time). At least now the ppc cross compiler can compile the linux
  718. system unit again, but I haven't tested it.
  719. Revision 1.50 2003/02/26 23:06:13 daniel
  720. * Fixed an illegal use of makeregsize
  721. Revision 1.49 2003/02/19 22:39:56 daniel
  722. * Fixed a few issues
  723. Revision 1.48 2003/02/19 22:00:15 daniel
  724. * Code generator converted to new register notation
  725. - Horribily outdated todo.txt removed
  726. Revision 1.47 2003/01/13 14:54:34 daniel
  727. * Further work to convert codegenerator register convention;
  728. internalerror bug fixed.
  729. Revision 1.46 2003/01/08 18:43:57 daniel
  730. * Tregister changed into a record
  731. Revision 1.45 2002/11/25 17:43:27 peter
  732. * splitted defbase in defutil,symutil,defcmp
  733. * merged isconvertable and is_equal into compare_defs(_ext)
  734. * made operator search faster by walking the list only once
  735. Revision 1.44 2002/10/03 21:34:45 carl
  736. * range check error fixes
  737. Revision 1.43 2002/09/17 18:54:05 jonas
  738. * a_load_reg_reg() now has two size parameters: source and dest. This
  739. allows some optimizations on architectures that don't encode the
  740. register size in the register name.
  741. Revision 1.42 2002/09/16 18:08:26 peter
  742. * fix last optimization in genlinearlist, detected by bug tw1066
  743. * use generic casenode.pass2 routine and override genlinearlist
  744. * add jumptable support to generic casenode, by default there is
  745. no jumptable support
  746. Revision 1.41 2002/09/09 13:57:45 jonas
  747. * small optimization to case genlist() case statements
  748. Revision 1.40 2002/08/17 09:23:46 florian
  749. * first part of procinfo rewrite
  750. Revision 1.39 2002/08/12 15:08:42 carl
  751. + stab register indexes for powerpc (moved from gdb to cpubase)
  752. + tprocessor enumeration moved to cpuinfo
  753. + linker in target_info is now a class
  754. * many many updates for m68k (will soon start to compile)
  755. - removed some ifdef or correct them for correct cpu
  756. Revision 1.38 2002/08/11 14:32:30 peter
  757. * renamed current_library to objectlibrary
  758. Revision 1.37 2002/08/11 13:24:17 peter
  759. * saving of asmsymbols in ppu supported
  760. * asmsymbollist global is removed and moved into a new class
  761. tasmlibrarydata that will hold the info of a .a file which
  762. corresponds with a single module. Added librarydata to tmodule
  763. to keep the library info stored for the module. In the future the
  764. objectfiles will also be stored to the tasmlibrarydata class
  765. * all getlabel/newasmsymbol and friends are moved to the new class
  766. Revision 1.36 2002/07/23 14:31:00 daniel
  767. * Added internal error when asked to generate code for 'if expr in []'
  768. Revision 1.35 2002/07/20 11:58:04 florian
  769. * types.pas renamed to defbase.pas because D6 contains a types
  770. unit so this would conflicts if D6 programms are compiled
  771. + Willamette/SSE2 instructions to assembler added
  772. Revision 1.34 2002/07/11 14:41:34 florian
  773. * start of the new generic parameter handling
  774. Revision 1.33 2002/07/06 20:27:26 carl
  775. + generic set handling
  776. Revision 1.32 2002/07/01 18:46:33 peter
  777. * internal linker
  778. * reorganized aasm layer
  779. Revision 1.31 2002/05/18 13:34:25 peter
  780. * readded missing revisions
  781. Revision 1.30 2002/05/16 19:46:52 carl
  782. + defines.inc -> fpcdefs.inc to avoid conflicts if compiling by hand
  783. + try to fix temp allocation (still in ifdef)
  784. + generic constructor calls
  785. + start of tassembler / tmodulebase class cleanup
  786. Revision 1.28 2002/05/13 19:54:38 peter
  787. * removed n386ld and n386util units
  788. * maybe_save/maybe_restore added instead of the old maybe_push
  789. Revision 1.27 2002/05/12 16:53:17 peter
  790. * moved entry and exitcode to ncgutil and cgobj
  791. * foreach gets extra argument for passing local data to the
  792. iterator function
  793. * -CR checks also class typecasts at runtime by changing them
  794. into as
  795. * fixed compiler to cycle with the -CR option
  796. * fixed stabs with elf writer, finally the global variables can
  797. be watched
  798. * removed a lot of routines from cga unit and replaced them by
  799. calls to cgobj
  800. * u32bit-s32bit updates for and,or,xor nodes. When one element is
  801. u32bit then the other is typecasted also to u32bit without giving
  802. a rangecheck warning/error.
  803. * fixed pascal calling method with reversing also the high tree in
  804. the parast, detected by tcalcst3 test
  805. Revision 1.26 2002/04/25 20:16:40 peter
  806. * moved more routines from cga/n386util
  807. Revision 1.25 2002/04/21 19:02:07 peter
  808. * removed newn and disposen nodes, the code is now directly
  809. inlined from pexpr
  810. * -an option that will write the secondpass nodes to the .s file, this
  811. requires EXTDEBUG define to actually write the info
  812. * fixed various internal errors and crashes due recent code changes
  813. Revision 1.24 2002/04/21 15:37:26 carl
  814. * changeregsize -> rg.makeregsize
  815. Revision 1.23 2002/04/19 15:39:35 peter
  816. * removed some more routines from cga
  817. * moved location_force_reg/mem to ncgutil
  818. * moved arrayconstructnode secondpass to ncgld
  819. Revision 1.22 2002/04/15 19:44:21 peter
  820. * fixed stackcheck that would be called recursively when a stack
  821. error was found
  822. * generic changeregsize(reg,size) for i386 register resizing
  823. * removed some more routines from cga unit
  824. * fixed returnvalue handling
  825. * fixed default stacksize of linux and go32v2, 8kb was a bit small :-)
  826. Revision 1.21 2002/04/02 17:11:36 peter
  827. * tlocation,treference update
  828. * LOC_CONSTANT added for better constant handling
  829. * secondadd splitted in multiple routines
  830. * location_force_reg added for loading a location to a register
  831. of a specified size
  832. * secondassignment parses now first the right and then the left node
  833. (this is compatible with Kylix). This saves a lot of push/pop especially
  834. with string operations
  835. * adapted some routines to use the new cg methods
  836. Revision 1.20 2002/03/31 20:26:39 jonas
  837. + a_loadfpu_* and a_loadmm_* methods in tcg
  838. * register allocation is now handled by a class and is mostly processor
  839. independent (+rgobj.pas and i386/rgcpu.pas)
  840. * temp allocation is now handled by a class (+tgobj.pas, -i386\tgcpu.pas)
  841. * some small improvements and fixes to the optimizer
  842. * some register allocation fixes
  843. * some fpuvaroffset fixes in the unary minus node
  844. * push/popusedregisters is now called rg.save/restoreusedregisters and
  845. (for i386) uses temps instead of push/pop's when using -Op3 (that code is
  846. also better optimizable)
  847. * fixed and optimized register saving/restoring for new/dispose nodes
  848. * LOC_FPU locations now also require their "register" field to be set to
  849. R_ST, not R_ST0 (the latter is used for LOC_CFPUREGISTER locations only)
  850. - list field removed of the tnode class because it's not used currently
  851. and can cause hard-to-find bugs
  852. }