aoptcpu.pas 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492
  1. {
  2. Copyright (c) 1998-2002 by Jonas Maebe, member of the Free Pascal
  3. Development Team
  4. This unit implements the Z80 optimizer object
  5. This program is free software; you can redistribute it and/or modify
  6. it under the terms of the GNU General Public License as published by
  7. the Free Software Foundation; either version 2 of the License, or
  8. (at your option) any later version.
  9. This program is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU General Public License for more details.
  13. You should have received a copy of the GNU General Public License
  14. along with this program; if not, write to the Free Software
  15. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  16. ****************************************************************************
  17. }
  18. Unit aoptcpu;
  19. {$i fpcdefs.inc}
  20. {$ifdef EXTDEBUG}
  21. {$define DEBUG_AOPTCPU}
  22. {$endif EXTDEBUG}
  23. Interface
  24. uses cpubase, cgbase, aasmtai, aopt,AoptObj, aoptcpub;
  25. Type
  26. TCpuAsmOptimizer = class(TAsmOptimizer)
  27. { outputs a debug message into the assembler file }
  28. procedure DebugMsg(const s: string; p: tai);
  29. { checks whether loading a new value in reg1 overwrites the entirety of reg2 }
  30. function Reg1WriteOverwritesReg2Entirely(reg1, reg2: tregister): boolean;
  31. Function GetNextInstructionUsingReg(Current: tai; Var Next: tai;reg : TRegister): Boolean;
  32. function RegLoadedWithNewValue(reg : tregister; hp : tai) : boolean; override;
  33. function InstructionLoadsFromReg(const reg : TRegister; const hp : tai) : boolean; override;
  34. { uses the same constructor as TAopObj }
  35. function PeepHoleOptPass1Cpu(var p: tai): boolean; override;
  36. procedure PeepHoleOptPass2;override;
  37. End;
  38. Implementation
  39. uses
  40. cutils,
  41. verbose,
  42. cpuinfo,
  43. aasmbase,aasmcpu,aasmdata,
  44. globals,globtype,
  45. cgutils;
  46. type
  47. TAsmOpSet = set of TAsmOp;
  48. function CanBeCond(p : tai) : boolean;
  49. begin
  50. result:=(p.typ=ait_instruction) and (taicpu(p).condition=C_None);
  51. end;
  52. function RefsEqual(const r1, r2: treference): boolean;
  53. begin
  54. refsequal :=
  55. (r1.offset = r2.offset) and
  56. (r1.base = r2.base) and
  57. (r1.index = r2.index) and (r1.scalefactor = r2.scalefactor) and
  58. (r1.symbol=r2.symbol) and (r1.refaddr = r2.refaddr) and
  59. (r1.relsymbol = r2.relsymbol);
  60. end;
  61. function MatchOperand(const oper1: TOper; const oper2: TOper): boolean; inline;
  62. begin
  63. result:=oper1.typ=oper2.typ;
  64. if result then
  65. case oper1.typ of
  66. top_const:
  67. Result:=oper1.val = oper2.val;
  68. top_reg:
  69. Result:=oper1.reg = oper2.reg;
  70. top_ref:
  71. Result:=RefsEqual(oper1.ref^, oper2.ref^);
  72. else Result:=false;
  73. end
  74. end;
  75. function MatchOperand(const oper: TOper; const reg: TRegister): boolean; inline;
  76. begin
  77. result := (oper.typ = top_reg) and (oper.reg = reg);
  78. end;
  79. function MatchInstruction(const instr: tai; const op: TAsmOp): boolean;
  80. begin
  81. result :=
  82. (instr.typ = ait_instruction) and
  83. (taicpu(instr).opcode = op);
  84. end;
  85. function MatchInstruction(const instr: tai; const ops: TAsmOpSet): boolean;
  86. begin
  87. result :=
  88. (instr.typ = ait_instruction) and
  89. (taicpu(instr).opcode in ops);
  90. end;
  91. function MatchInstruction(const instr: tai; const ops: TAsmOpSet;opcount : byte): boolean;
  92. begin
  93. result :=
  94. (instr.typ = ait_instruction) and
  95. (taicpu(instr).opcode in ops) and
  96. (taicpu(instr).ops=opcount);
  97. end;
  98. function MatchOpType(const instr : tai;ot0,ot1 : toptype) : Boolean;
  99. begin
  100. Result:=(taicpu(instr).ops=2) and
  101. (taicpu(instr).oper[0]^.typ=ot0) and
  102. (taicpu(instr).oper[1]^.typ=ot1);
  103. end;
  104. {$ifdef DEBUG_AOPTCPU}
  105. procedure TCpuAsmOptimizer.DebugMsg(const s: string;p : tai);
  106. begin
  107. asml.insertbefore(tai_comment.Create(strpnew(s)), p);
  108. end;
  109. {$else DEBUG_AOPTCPU}
  110. procedure TCpuAsmOptimizer.DebugMsg(const s: string;p : tai);inline;
  111. begin
  112. end;
  113. {$endif DEBUG_AOPTCPU}
  114. function TCpuAsmOptimizer.Reg1WriteOverwritesReg2Entirely(reg1, reg2: tregister): boolean;
  115. begin
  116. case reg1 of
  117. NR_F:
  118. result:=SuperRegistersEqual(reg2,NR_DEFAULTFLAGS);
  119. NR_AF:
  120. result:=(reg2=NR_A) or (reg2=NR_AF) or SuperRegistersEqual(reg2,NR_DEFAULTFLAGS);
  121. NR_BC:
  122. result:=(reg2=NR_B) or (reg2=NR_C) or (reg2=NR_BC);
  123. NR_DE:
  124. result:=(reg2=NR_D) or (reg2=NR_E) or (reg2=NR_DE);
  125. NR_HL:
  126. result:=(reg2=NR_H) or (reg2=NR_L) or (reg2=NR_HL);
  127. NR_F_:
  128. result:=SuperRegistersEqual(reg2,NR_F_);
  129. NR_AF_:
  130. result:=(reg2=NR_A_) or (reg2=NR_AF_) or SuperRegistersEqual(reg2,NR_F_);
  131. NR_BC_:
  132. result:=(reg2=NR_B_) or (reg2=NR_C_) or (reg2=NR_BC_);
  133. NR_DE_:
  134. result:=(reg2=NR_D_) or (reg2=NR_E_) or (reg2=NR_DE_);
  135. NR_HL_:
  136. result:=(reg2=NR_H_) or (reg2=NR_L_) or (reg2=NR_HL_);
  137. else
  138. result:=reg1=reg2;
  139. end;
  140. end;
  141. function TCpuAsmOptimizer.GetNextInstructionUsingReg(Current: tai;
  142. var Next: tai; reg: TRegister): Boolean;
  143. begin
  144. Next:=Current;
  145. repeat
  146. Result:=GetNextInstruction(Next,Next);
  147. until not(cs_opt_level3 in current_settings.optimizerswitches) or not(Result) or (Next.typ<>ait_instruction) or (RegInInstruction(reg,Next)) or
  148. (is_calljmp(taicpu(Next).opcode));
  149. end;
  150. function TCpuAsmOptimizer.RegLoadedWithNewValue(reg: tregister; hp: tai): boolean;
  151. var
  152. p: taicpu;
  153. begin
  154. if not assigned(hp) or
  155. (hp.typ <> ait_instruction) then
  156. begin
  157. Result := false;
  158. exit;
  159. end;
  160. p := taicpu(hp);
  161. if SuperRegistersEqual(reg,NR_DEFAULTFLAGS) and (reg<>NR_AF) then
  162. begin
  163. case p.opcode of
  164. A_PUSH,A_POP,A_EX,A_EXX,A_NOP,A_HALT,A_DI,A_EI,A_IM,A_SET,A_RES,A_JP,A_JR,A_JRJP,A_DJNZ,A_CALL,A_RET,A_RETI,A_RETN,A_RST,A_OUT:
  165. result:=false;
  166. A_LD:
  167. begin
  168. if p.ops<>2 then
  169. internalerror(2020051112);
  170. { LD A,I or LD A,R ? }
  171. if (p.oper[0]^.typ=top_reg) and (p.oper[0]^.reg=NR_A) and
  172. (p.oper[1]^.typ=top_reg) and ((p.oper[1]^.reg=NR_I) or (p.oper[1]^.reg=NR_R)) then
  173. result:=(reg=NR_ADDSUBTRACTFLAG) or
  174. (reg=NR_PARITYOVERFLOWFLAG) or
  175. (reg=NR_HALFCARRYFLAG) or
  176. (reg=NR_ZEROFLAG) or
  177. (reg=NR_SIGNFLAG)
  178. else
  179. result:=false;
  180. end;
  181. A_LDI,A_LDIR,A_LDD,A_LDDR:
  182. result:=(reg=NR_ADDSUBTRACTFLAG) or
  183. (reg=NR_PARITYOVERFLOWFLAG) or
  184. (reg=NR_HALFCARRYFLAG);
  185. A_INC,A_DEC:
  186. begin
  187. if p.ops<>1 then
  188. internalerror(2020051602);
  189. if (p.oper[0]^.typ=top_reg) and ((p.oper[0]^.reg=NR_BC) or
  190. (p.oper[0]^.reg=NR_DE) or
  191. (p.oper[0]^.reg=NR_HL) or
  192. (p.oper[0]^.reg=NR_SP) or
  193. (p.oper[0]^.reg=NR_IX) or
  194. (p.oper[0]^.reg=NR_IY)) then
  195. result:=false
  196. else
  197. result:=(reg=NR_ADDSUBTRACTFLAG) or
  198. (reg=NR_PARITYOVERFLOWFLAG) or
  199. (reg=NR_HALFCARRYFLAG) or
  200. (reg=NR_ZEROFLAG) or
  201. (reg=NR_SIGNFLAG);
  202. end;
  203. A_CPI,A_CPIR,A_CPD,A_CPDR,A_RLD,A_RRD,A_BIT,A_INI,A_INIR,A_IND,A_INDR,A_OUTI,A_OTIR,A_OUTD,A_OTDR:
  204. result:=(reg=NR_ADDSUBTRACTFLAG) or
  205. (reg=NR_PARITYOVERFLOWFLAG) or
  206. (reg=NR_HALFCARRYFLAG) or
  207. (reg=NR_ZEROFLAG) or
  208. (reg=NR_SIGNFLAG);
  209. A_ADD:
  210. begin
  211. if p.ops<>2 then
  212. internalerror(2020051601);
  213. if (p.oper[0]^.typ=top_reg) and ((p.oper[0]^.reg=NR_HL) or (p.oper[0]^.reg=NR_IX) or (p.oper[0]^.reg=NR_IY)) then
  214. result:=(reg=NR_HALFCARRYFLAG) or
  215. (reg=NR_ADDSUBTRACTFLAG) or
  216. (reg=NR_CARRYFLAG)
  217. else
  218. result:=true;
  219. end;
  220. A_ADC,A_SUB,A_SBC,A_AND,A_OR,A_XOR,A_CP,A_NEG,A_RLC,A_RL,A_RRC,A_RR,A_SLA,A_SRA,A_SRL:
  221. result:=true;
  222. A_DAA:
  223. result:=(reg=NR_PARITYOVERFLOWFLAG) or
  224. (reg=NR_HALFCARRYFLAG) or
  225. (reg=NR_ZEROFLAG) or
  226. (reg=NR_SIGNFLAG) or
  227. (reg=NR_CARRYFLAG);
  228. A_CPL:
  229. result:=(reg=NR_HALFCARRYFLAG) or
  230. (reg=NR_ADDSUBTRACTFLAG);
  231. A_CCF,A_SCF,A_RLCA,A_RLA,A_RRCA,A_RRA:
  232. result:=(reg=NR_HALFCARRYFLAG) or
  233. (reg=NR_ADDSUBTRACTFLAG) or
  234. (reg=NR_CARRYFLAG);
  235. A_IN:
  236. begin
  237. if p.ops<>2 then
  238. internalerror(2020051612);
  239. if (p.oper[1]^.typ=top_ref) and ((p.oper[1]^.ref^.base=NR_C) or (p.oper[1]^.ref^.index=NR_C)) then
  240. result:=(reg=NR_ADDSUBTRACTFLAG) or
  241. (reg=NR_PARITYOVERFLOWFLAG) or
  242. (reg=NR_HALFCARRYFLAG) or
  243. (reg=NR_ZEROFLAG) or
  244. (reg=NR_SIGNFLAG)
  245. else
  246. result:=false;
  247. end;
  248. else
  249. internalerror(2020051111);
  250. end;
  251. end
  252. else
  253. case p.opcode of
  254. A_LD:
  255. begin
  256. if p.ops<>2 then
  257. internalerror(2020051114);
  258. result:=(p.oper[0]^.typ = top_reg) and
  259. (Reg1WriteOverwritesReg2Entirely(p.oper[0]^.reg,reg)) and
  260. ((p.oper[1]^.typ = top_const) or
  261. ((p.oper[1]^.typ = top_reg) and not(Reg1ReadDependsOnReg2(p.oper[1]^.reg,reg))) or
  262. ((p.oper[1]^.typ = top_ref) and not RegInRef(reg,p.oper[1]^.ref^)));
  263. end;
  264. A_PUSH,A_EX,A_EXX,A_LDI,A_LDIR,A_LDD,A_LDDR,A_CPI,A_CPIR,A_CPD,A_CPDR,
  265. A_ADD,A_ADC,A_SBC,A_CP,A_INC,A_DEC,A_DAA,A_CPL,A_NEG,A_CCF,A_SCF,
  266. A_NOP,A_HALT,A_DI,A_EI,A_IM,A_RLCA,A_RLA,A_RRCA,A_RRA,A_RLC,A_RL,
  267. A_RRC,A_RR,A_SLA,A_SRA,A_SRL,A_RLD,A_RRD,A_BIT,A_SET,A_RES,A_JP,A_JR,A_JRJP,
  268. A_DJNZ,A_CALL,A_RET,A_RETI,A_RETN,A_RST,A_INI,A_INIR,A_IND,A_INDR,
  269. A_OUT,A_OUTI,A_OTIR,A_OUTD,A_OTDR:
  270. result:=false;
  271. A_POP:
  272. begin
  273. if p.ops<>1 then
  274. internalerror(2020051603);
  275. if p.oper[0]^.typ<>top_reg then
  276. internalerror(2020051604);
  277. result:=Reg1WriteOverwritesReg2Entirely(p.oper[0]^.reg,reg);
  278. end;
  279. A_SUB,A_XOR:
  280. begin
  281. if p.ops<>2 then
  282. internalerror(2020051605);
  283. result:=(p.oper[0]^.typ=top_reg) and (p.oper[0]^.reg=NR_A) and
  284. (p.oper[1]^.typ=top_reg) and (p.oper[1]^.reg=NR_A) and
  285. Reg1WriteOverwritesReg2Entirely(NR_A,reg);
  286. end;
  287. A_AND:
  288. begin
  289. if p.ops<>2 then
  290. internalerror(2020051606);
  291. result:=(p.oper[0]^.typ=top_reg) and (p.oper[0]^.reg=NR_A) and
  292. (p.oper[1]^.typ=top_const) and (p.oper[1]^.val=0) and
  293. Reg1WriteOverwritesReg2Entirely(NR_A,reg);
  294. end;
  295. A_OR:
  296. begin
  297. if p.ops<>2 then
  298. internalerror(2020051607);
  299. result:=(p.oper[0]^.typ=top_reg) and (p.oper[0]^.reg=NR_A) and
  300. (p.oper[1]^.typ=top_const) and (byte(p.oper[1]^.val)=255) and
  301. Reg1WriteOverwritesReg2Entirely(NR_A,reg);
  302. end;
  303. A_IN:
  304. begin
  305. if p.ops<>2 then
  306. internalerror(2020051608);
  307. if p.oper[0]^.typ<>top_reg then
  308. internalerror(2020051609);
  309. if p.oper[1]^.typ<>top_ref then
  310. internalerror(2020051610);
  311. result:=Reg1WriteOverwritesReg2Entirely(p.oper[0]^.reg,reg) and
  312. (((p.oper[1]^.ref^.base<>NR_C) and (p.oper[1]^.ref^.index<>NR_C)) or
  313. not(Reg1ReadDependsOnReg2(NR_BC,reg)));
  314. end;
  315. else
  316. internalerror(2020051108);
  317. end;
  318. end;
  319. function TCpuAsmOptimizer.InstructionLoadsFromReg(const reg: TRegister; const hp: tai): boolean;
  320. var
  321. p: taicpu;
  322. begin
  323. Result := false;
  324. if not (assigned(hp) and (hp.typ = ait_instruction)) then
  325. exit;
  326. p:=taicpu(hp);
  327. case p.opcode of
  328. A_LD,A_BIT,A_SET,A_RES:
  329. begin
  330. if p.ops<>2 then
  331. internalerror(2020051102);
  332. result:=((p.oper[0]^.typ=top_ref) and RegInRef(reg,p.oper[0]^.ref^)) or
  333. RegInOp(reg,p.oper[1]^);
  334. end;
  335. A_PUSH,A_INC,A_DEC,A_RLC,A_RRC,A_SLA,A_SRA,A_SRL:
  336. begin
  337. if p.ops<>1 then
  338. internalerror(2020051103);
  339. result:=RegInOp(reg,p.oper[0]^);
  340. end;
  341. A_POP:
  342. result:=(reg=NR_SP);
  343. A_EX,A_ADD,A_SUB,A_AND,A_OR,A_XOR,A_CP:
  344. begin
  345. if p.ops<>2 then
  346. internalerror(2020051104);
  347. result:=RegInOp(reg,p.oper[0]^) or
  348. RegInOp(reg,p.oper[1]^);
  349. end;
  350. A_EXX:
  351. result:=SuperRegistersEqual(reg,NR_BC) or SuperRegistersEqual(reg,NR_DE) or SuperRegistersEqual(reg,NR_HL) or
  352. SuperRegistersEqual(reg,NR_BC_) or SuperRegistersEqual(reg,NR_DE_) or SuperRegistersEqual(reg,NR_HL_);
  353. A_LDI,A_LDIR,A_LDD,A_LDDR:
  354. result:=SuperRegistersEqual(reg,NR_BC) or SuperRegistersEqual(reg,NR_DE) or SuperRegistersEqual(reg,NR_HL);
  355. A_CPI,A_CPIR,A_CPD,A_CPDR:
  356. result:=SuperRegistersEqual(reg,NR_BC) or SuperRegistersEqual(reg,NR_HL) or RegistersInterfere(reg,NR_A);
  357. A_ADC,A_SBC:
  358. begin
  359. if p.ops<>2 then
  360. internalerror(2020051105);
  361. result:=RegInOp(reg,p.oper[0]^) or
  362. RegInOp(reg,p.oper[1]^) or (reg=NR_CARRYFLAG) or (reg=NR_DEFAULTFLAGS);
  363. end;
  364. A_DAA:
  365. result:=RegistersInterfere(reg,NR_A) or (reg=NR_CARRYFLAG) or (reg=NR_HALFCARRYFLAG) or (reg=NR_ADDSUBTRACTFLAG) or (reg=NR_DEFAULTFLAGS);
  366. A_CPL,A_NEG,A_RLCA,A_RRCA:
  367. result:=RegistersInterfere(reg,NR_A);
  368. A_CCF:
  369. result:=(reg=NR_CARRYFLAG) or (reg=NR_DEFAULTFLAGS);
  370. A_SCF,A_NOP,A_HALT,A_DI,A_EI,A_IM:
  371. result:=false;
  372. A_RLA,A_RRA:
  373. result:=RegistersInterfere(reg,NR_A) or (reg=NR_CARRYFLAG) or (reg=NR_DEFAULTFLAGS);
  374. A_RL,A_RR:
  375. begin
  376. if p.ops<>1 then
  377. internalerror(2020051106);
  378. result:=RegInOp(reg,p.oper[0]^) or (reg=NR_CARRYFLAG) or (reg=NR_DEFAULTFLAGS);
  379. end;
  380. A_RLD,A_RRD:
  381. result:=RegistersInterfere(reg,NR_A) or RegistersInterfere(reg,NR_HL);
  382. A_JP,A_JR,A_JRJP:
  383. begin
  384. if p.ops<>1 then
  385. internalerror(2020051107);
  386. if RegInOp(reg,p.oper[0]^) then
  387. result:=true
  388. else
  389. case p.condition of
  390. C_None:
  391. result:=false;
  392. C_NZ,C_Z:
  393. result:=(reg=NR_ZEROFLAG) or (reg=NR_DEFAULTFLAGS);
  394. C_NC,C_C:
  395. result:=(reg=NR_CARRYFLAG) or (reg=NR_DEFAULTFLAGS);
  396. C_PO,C_PE:
  397. result:=(reg=NR_PARITYOVERFLOWFLAG) or (reg=NR_DEFAULTFLAGS);
  398. C_P,C_M:
  399. result:=(reg=NR_SIGNFLAG) or (reg=NR_DEFAULTFLAGS);
  400. end;
  401. end;
  402. A_DJNZ:
  403. result:=RegistersInterfere(reg,NR_B);
  404. A_CALL,A_RET,A_RETI,A_RETN,A_RST:
  405. result:=true;
  406. A_IN:
  407. begin
  408. if p.ops<>2 then
  409. internalerror(2020051109);
  410. result:=(p.oper[1]^.typ=top_ref) and (p.oper[1]^.ref^.base=NR_C) and RegistersInterfere(reg,NR_BC);
  411. end;
  412. A_OUT:
  413. begin
  414. if p.ops<>2 then
  415. internalerror(2020051110);
  416. result:=RegInOp(reg,p.oper[1]^) or (p.oper[0]^.typ=top_ref) and (p.oper[0]^.ref^.base=NR_C) and RegistersInterfere(reg,NR_BC);
  417. end;
  418. A_INI,A_INIR,A_IND,A_INDR,A_OUTI,A_OTIR,A_OUTD,A_OTDR:
  419. result:=SuperRegistersEqual(reg,NR_BC) or SuperRegistersEqual(reg,NR_HL);
  420. else
  421. internalerror(2020051101);
  422. end;
  423. end;
  424. function TCpuAsmOptimizer.PeepHoleOptPass1Cpu(var p: tai): boolean;
  425. var
  426. hp1,hp2,hp3,hp4,hp5: tai;
  427. alloc, dealloc: tai_regalloc;
  428. i: integer;
  429. l: TAsmLabel;
  430. //TmpUsedRegs : TAllUsedRegs;
  431. begin
  432. result := false;
  433. //case p.typ of
  434. // ait_instruction:
  435. // begin
  436. // end;
  437. //end;
  438. end;
  439. procedure TCpuAsmOptimizer.PeepHoleOptPass2;
  440. begin
  441. end;
  442. begin
  443. casmoptimizer:=TCpuAsmOptimizer;
  444. End.