2
0

aoptcpu.pas 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490
  1. {
  2. Copyright (c) 1998-2002 by Jonas Maebe, member of the Free Pascal
  3. Development Team
  4. This unit implements the Z80 optimizer object
  5. This program is free software; you can redistribute it and/or modify
  6. it under the terms of the GNU General Public License as published by
  7. the Free Software Foundation; either version 2 of the License, or
  8. (at your option) any later version.
  9. This program is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU General Public License for more details.
  13. You should have received a copy of the GNU General Public License
  14. along with this program; if not, write to the Free Software
  15. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  16. ****************************************************************************
  17. }
  18. Unit aoptcpu;
  19. {$i fpcdefs.inc}
  20. {$define DEBUG_AOPTCPU}
  21. Interface
  22. uses cpubase, cgbase, aasmtai, aopt,AoptObj, aoptcpub;
  23. Type
  24. TCpuAsmOptimizer = class(TAsmOptimizer)
  25. { outputs a debug message into the assembler file }
  26. procedure DebugMsg(const s: string; p: tai);
  27. { checks whether loading a new value in reg1 overwrites the entirety of reg2 }
  28. function Reg1WriteOverwritesReg2Entirely(reg1, reg2: tregister): boolean;
  29. Function GetNextInstructionUsingReg(Current: tai; Var Next: tai;reg : TRegister): Boolean;
  30. function RegLoadedWithNewValue(reg : tregister; hp : tai) : boolean; override;
  31. function InstructionLoadsFromReg(const reg : TRegister; const hp : tai) : boolean; override;
  32. { uses the same constructor as TAopObj }
  33. function PeepHoleOptPass1Cpu(var p: tai): boolean; override;
  34. procedure PeepHoleOptPass2;override;
  35. End;
  36. Implementation
  37. uses
  38. cutils,
  39. verbose,
  40. cpuinfo,
  41. aasmbase,aasmcpu,aasmdata,
  42. globals,globtype,
  43. cgutils;
  44. type
  45. TAsmOpSet = set of TAsmOp;
  46. function CanBeCond(p : tai) : boolean;
  47. begin
  48. result:=(p.typ=ait_instruction) and (taicpu(p).condition=C_None);
  49. end;
  50. function RefsEqual(const r1, r2: treference): boolean;
  51. begin
  52. refsequal :=
  53. (r1.offset = r2.offset) and
  54. (r1.base = r2.base) and
  55. (r1.index = r2.index) and (r1.scalefactor = r2.scalefactor) and
  56. (r1.symbol=r2.symbol) and (r1.refaddr = r2.refaddr) and
  57. (r1.relsymbol = r2.relsymbol);
  58. end;
  59. function MatchOperand(const oper1: TOper; const oper2: TOper): boolean; inline;
  60. begin
  61. result:=oper1.typ=oper2.typ;
  62. if result then
  63. case oper1.typ of
  64. top_const:
  65. Result:=oper1.val = oper2.val;
  66. top_reg:
  67. Result:=oper1.reg = oper2.reg;
  68. top_ref:
  69. Result:=RefsEqual(oper1.ref^, oper2.ref^);
  70. else Result:=false;
  71. end
  72. end;
  73. function MatchOperand(const oper: TOper; const reg: TRegister): boolean; inline;
  74. begin
  75. result := (oper.typ = top_reg) and (oper.reg = reg);
  76. end;
  77. function MatchInstruction(const instr: tai; const op: TAsmOp): boolean;
  78. begin
  79. result :=
  80. (instr.typ = ait_instruction) and
  81. (taicpu(instr).opcode = op);
  82. end;
  83. function MatchInstruction(const instr: tai; const ops: TAsmOpSet): boolean;
  84. begin
  85. result :=
  86. (instr.typ = ait_instruction) and
  87. (taicpu(instr).opcode in ops);
  88. end;
  89. function MatchInstruction(const instr: tai; const ops: TAsmOpSet;opcount : byte): boolean;
  90. begin
  91. result :=
  92. (instr.typ = ait_instruction) and
  93. (taicpu(instr).opcode in ops) and
  94. (taicpu(instr).ops=opcount);
  95. end;
  96. function MatchOpType(const instr : tai;ot0,ot1 : toptype) : Boolean;
  97. begin
  98. Result:=(taicpu(instr).ops=2) and
  99. (taicpu(instr).oper[0]^.typ=ot0) and
  100. (taicpu(instr).oper[1]^.typ=ot1);
  101. end;
  102. {$ifdef DEBUG_AOPTCPU}
  103. procedure TCpuAsmOptimizer.DebugMsg(const s: string;p : tai);
  104. begin
  105. asml.insertbefore(tai_comment.Create(strpnew(s)), p);
  106. end;
  107. {$else DEBUG_AOPTCPU}
  108. procedure TCpuAsmOptimizer.DebugMsg(const s: string;p : tai);inline;
  109. begin
  110. end;
  111. {$endif DEBUG_AOPTCPU}
  112. function TCpuAsmOptimizer.Reg1WriteOverwritesReg2Entirely(reg1, reg2: tregister): boolean;
  113. begin
  114. case reg1 of
  115. NR_F:
  116. result:=SuperRegistersEqual(reg2,NR_DEFAULTFLAGS);
  117. NR_AF:
  118. result:=(reg2=NR_A) or (reg2=NR_AF) or SuperRegistersEqual(reg2,NR_DEFAULTFLAGS);
  119. NR_BC:
  120. result:=(reg2=NR_B) or (reg2=NR_C) or (reg2=NR_BC);
  121. NR_DE:
  122. result:=(reg2=NR_D) or (reg2=NR_E) or (reg2=NR_DE);
  123. NR_HL:
  124. result:=(reg2=NR_H) or (reg2=NR_L) or (reg2=NR_HL);
  125. NR_F_:
  126. result:=SuperRegistersEqual(reg2,NR_F_);
  127. NR_AF_:
  128. result:=(reg2=NR_A_) or (reg2=NR_AF_) or SuperRegistersEqual(reg2,NR_F_);
  129. NR_BC_:
  130. result:=(reg2=NR_B_) or (reg2=NR_C_) or (reg2=NR_BC_);
  131. NR_DE_:
  132. result:=(reg2=NR_D_) or (reg2=NR_E_) or (reg2=NR_DE_);
  133. NR_HL_:
  134. result:=(reg2=NR_H_) or (reg2=NR_L_) or (reg2=NR_HL_);
  135. else
  136. result:=reg1=reg2;
  137. end;
  138. end;
  139. function TCpuAsmOptimizer.GetNextInstructionUsingReg(Current: tai;
  140. var Next: tai; reg: TRegister): Boolean;
  141. begin
  142. Next:=Current;
  143. repeat
  144. Result:=GetNextInstruction(Next,Next);
  145. until not(cs_opt_level3 in current_settings.optimizerswitches) or not(Result) or (Next.typ<>ait_instruction) or (RegInInstruction(reg,Next)) or
  146. (is_calljmp(taicpu(Next).opcode));
  147. end;
  148. function TCpuAsmOptimizer.RegLoadedWithNewValue(reg: tregister; hp: tai): boolean;
  149. var
  150. p: taicpu;
  151. begin
  152. if not assigned(hp) or
  153. (hp.typ <> ait_instruction) then
  154. begin
  155. Result := false;
  156. exit;
  157. end;
  158. p := taicpu(hp);
  159. if SuperRegistersEqual(reg,NR_DEFAULTFLAGS) and (reg<>NR_AF) then
  160. begin
  161. case p.opcode of
  162. A_PUSH,A_POP,A_EX,A_EXX,A_NOP,A_HALT,A_DI,A_EI,A_IM,A_SET,A_RES,A_JP,A_JR,A_JRJP,A_DJNZ,A_CALL,A_RET,A_RETI,A_RETN,A_RST,A_OUT:
  163. result:=false;
  164. A_LD:
  165. begin
  166. if p.ops<>2 then
  167. internalerror(2020051112);
  168. { LD A,I or LD A,R ? }
  169. if (p.oper[0]^.typ=top_reg) and (p.oper[0]^.reg=NR_A) and
  170. (p.oper[1]^.typ=top_reg) and ((p.oper[1]^.reg=NR_I) or (p.oper[1]^.reg=NR_R)) then
  171. result:=(reg=NR_ADDSUBTRACTFLAG) or
  172. (reg=NR_PARITYOVERFLOWFLAG) or
  173. (reg=NR_HALFCARRYFLAG) or
  174. (reg=NR_ZEROFLAG) or
  175. (reg=NR_SIGNFLAG)
  176. else
  177. result:=false;
  178. end;
  179. A_LDI,A_LDIR,A_LDD,A_LDDR:
  180. result:=(reg=NR_ADDSUBTRACTFLAG) or
  181. (reg=NR_PARITYOVERFLOWFLAG) or
  182. (reg=NR_HALFCARRYFLAG);
  183. A_INC,A_DEC:
  184. begin
  185. if p.ops<>1 then
  186. internalerror(2020051602);
  187. if (p.oper[0]^.typ=top_reg) and ((p.oper[0]^.reg=NR_BC) or
  188. (p.oper[0]^.reg=NR_DE) or
  189. (p.oper[0]^.reg=NR_HL) or
  190. (p.oper[0]^.reg=NR_SP) or
  191. (p.oper[0]^.reg=NR_IX) or
  192. (p.oper[0]^.reg=NR_IY)) then
  193. result:=false
  194. else
  195. result:=(reg=NR_ADDSUBTRACTFLAG) or
  196. (reg=NR_PARITYOVERFLOWFLAG) or
  197. (reg=NR_HALFCARRYFLAG) or
  198. (reg=NR_ZEROFLAG) or
  199. (reg=NR_SIGNFLAG);
  200. end;
  201. A_CPI,A_CPIR,A_CPD,A_CPDR,A_RLD,A_RRD,A_BIT,A_INI,A_INIR,A_IND,A_INDR,A_OUTI,A_OTIR,A_OUTD,A_OTDR:
  202. result:=(reg=NR_ADDSUBTRACTFLAG) or
  203. (reg=NR_PARITYOVERFLOWFLAG) or
  204. (reg=NR_HALFCARRYFLAG) or
  205. (reg=NR_ZEROFLAG) or
  206. (reg=NR_SIGNFLAG);
  207. A_ADD:
  208. begin
  209. if p.ops<>2 then
  210. internalerror(2020051601);
  211. if (p.oper[0]^.typ=top_reg) and ((p.oper[0]^.reg=NR_HL) or (p.oper[0]^.reg=NR_IX) or (p.oper[0]^.reg=NR_IY)) then
  212. result:=(reg=NR_HALFCARRYFLAG) or
  213. (reg=NR_ADDSUBTRACTFLAG) or
  214. (reg=NR_CARRYFLAG)
  215. else
  216. result:=true;
  217. end;
  218. A_ADC,A_SUB,A_SBC,A_AND,A_OR,A_XOR,A_CP,A_NEG,A_RLC,A_RL,A_RRC,A_RR,A_SLA,A_SRA,A_SRL:
  219. result:=true;
  220. A_DAA:
  221. result:=(reg=NR_PARITYOVERFLOWFLAG) or
  222. (reg=NR_HALFCARRYFLAG) or
  223. (reg=NR_ZEROFLAG) or
  224. (reg=NR_SIGNFLAG) or
  225. (reg=NR_CARRYFLAG);
  226. A_CPL:
  227. result:=(reg=NR_HALFCARRYFLAG) or
  228. (reg=NR_ADDSUBTRACTFLAG);
  229. A_CCF,A_SCF,A_RLCA,A_RLA,A_RRCA,A_RRA:
  230. result:=(reg=NR_HALFCARRYFLAG) or
  231. (reg=NR_ADDSUBTRACTFLAG) or
  232. (reg=NR_CARRYFLAG);
  233. A_IN:
  234. begin
  235. if p.ops<>2 then
  236. internalerror(2020051612);
  237. if (p.oper[1]^.typ=top_ref) and ((p.oper[1]^.ref^.base=NR_C) or (p.oper[1]^.ref^.index=NR_C)) then
  238. result:=(reg=NR_ADDSUBTRACTFLAG) or
  239. (reg=NR_PARITYOVERFLOWFLAG) or
  240. (reg=NR_HALFCARRYFLAG) or
  241. (reg=NR_ZEROFLAG) or
  242. (reg=NR_SIGNFLAG)
  243. else
  244. result:=false;
  245. end;
  246. else
  247. internalerror(2020051111);
  248. end;
  249. end
  250. else
  251. case p.opcode of
  252. A_LD:
  253. begin
  254. if p.ops<>2 then
  255. internalerror(2020051114);
  256. result:=(p.oper[0]^.typ = top_reg) and
  257. (Reg1WriteOverwritesReg2Entirely(p.oper[0]^.reg,reg)) and
  258. ((p.oper[1]^.typ = top_const) or
  259. ((p.oper[1]^.typ = top_reg) and not(Reg1ReadDependsOnReg2(p.oper[1]^.reg,reg))) or
  260. ((p.oper[1]^.typ = top_ref) and not RegInRef(reg,p.oper[1]^.ref^)));
  261. end;
  262. A_PUSH,A_EX,A_EXX,A_LDI,A_LDIR,A_LDD,A_LDDR,A_CPI,A_CPIR,A_CPD,A_CPDR,
  263. A_ADD,A_ADC,A_SBC,A_CP,A_INC,A_DEC,A_DAA,A_CPL,A_NEG,A_CCF,A_SCF,
  264. A_NOP,A_HALT,A_DI,A_EI,A_IM,A_RLCA,A_RLA,A_RRCA,A_RRA,A_RLC,A_RL,
  265. A_RRC,A_RR,A_SLA,A_SRA,A_SRL,A_RLD,A_RRD,A_BIT,A_SET,A_RES,A_JP,A_JR,A_JRJP,
  266. A_DJNZ,A_CALL,A_RET,A_RETI,A_RETN,A_RST,A_INI,A_INIR,A_IND,A_INDR,
  267. A_OUT,A_OUTI,A_OTIR,A_OUTD,A_OTDR:
  268. result:=false;
  269. A_POP:
  270. begin
  271. if p.ops<>1 then
  272. internalerror(2020051603);
  273. if p.oper[0]^.typ<>top_reg then
  274. internalerror(2020051604);
  275. result:=Reg1WriteOverwritesReg2Entirely(p.oper[0]^.reg,reg);
  276. end;
  277. A_SUB,A_XOR:
  278. begin
  279. if p.ops<>2 then
  280. internalerror(2020051605);
  281. result:=(p.oper[0]^.typ=top_reg) and (p.oper[0]^.reg=NR_A) and
  282. (p.oper[1]^.typ=top_reg) and (p.oper[1]^.reg=NR_A) and
  283. Reg1WriteOverwritesReg2Entirely(NR_A,reg);
  284. end;
  285. A_AND:
  286. begin
  287. if p.ops<>2 then
  288. internalerror(2020051606);
  289. result:=(p.oper[0]^.typ=top_reg) and (p.oper[0]^.reg=NR_A) and
  290. (p.oper[1]^.typ=top_const) and (p.oper[1]^.val=0) and
  291. Reg1WriteOverwritesReg2Entirely(NR_A,reg);
  292. end;
  293. A_OR:
  294. begin
  295. if p.ops<>2 then
  296. internalerror(2020051607);
  297. result:=(p.oper[0]^.typ=top_reg) and (p.oper[0]^.reg=NR_A) and
  298. (p.oper[1]^.typ=top_const) and (byte(p.oper[1]^.val)=255) and
  299. Reg1WriteOverwritesReg2Entirely(NR_A,reg);
  300. end;
  301. A_IN:
  302. begin
  303. if p.ops<>2 then
  304. internalerror(2020051608);
  305. if p.oper[0]^.typ<>top_reg then
  306. internalerror(2020051609);
  307. if p.oper[1]^.typ<>top_ref then
  308. internalerror(2020051610);
  309. result:=Reg1WriteOverwritesReg2Entirely(p.oper[0]^.reg,reg) and
  310. (((p.oper[1]^.ref^.base<>NR_C) and (p.oper[1]^.ref^.index<>NR_C)) or
  311. not(Reg1ReadDependsOnReg2(NR_BC,reg)));
  312. end;
  313. else
  314. internalerror(2020051108);
  315. end;
  316. end;
  317. function TCpuAsmOptimizer.InstructionLoadsFromReg(const reg: TRegister; const hp: tai): boolean;
  318. var
  319. p: taicpu;
  320. begin
  321. Result := false;
  322. if not (assigned(hp) and (hp.typ = ait_instruction)) then
  323. exit;
  324. p:=taicpu(hp);
  325. case p.opcode of
  326. A_LD,A_BIT,A_SET,A_RES:
  327. begin
  328. if p.ops<>2 then
  329. internalerror(2020051102);
  330. result:=((p.oper[0]^.typ=top_ref) and RegInRef(reg,p.oper[0]^.ref^)) or
  331. RegInOp(reg,p.oper[1]^);
  332. end;
  333. A_PUSH,A_INC,A_DEC,A_RLC,A_RRC,A_SLA,A_SRA,A_SRL:
  334. begin
  335. if p.ops<>1 then
  336. internalerror(2020051103);
  337. result:=RegInOp(reg,p.oper[0]^);
  338. end;
  339. A_POP:
  340. result:=(reg=NR_SP);
  341. A_EX,A_ADD,A_SUB,A_AND,A_OR,A_XOR,A_CP:
  342. begin
  343. if p.ops<>2 then
  344. internalerror(2020051104);
  345. result:=RegInOp(reg,p.oper[0]^) or
  346. RegInOp(reg,p.oper[1]^);
  347. end;
  348. A_EXX:
  349. result:=SuperRegistersEqual(reg,NR_BC) or SuperRegistersEqual(reg,NR_DE) or SuperRegistersEqual(reg,NR_HL) or
  350. SuperRegistersEqual(reg,NR_BC_) or SuperRegistersEqual(reg,NR_DE_) or SuperRegistersEqual(reg,NR_HL_);
  351. A_LDI,A_LDIR,A_LDD,A_LDDR:
  352. result:=SuperRegistersEqual(reg,NR_BC) or SuperRegistersEqual(reg,NR_DE) or SuperRegistersEqual(reg,NR_HL);
  353. A_CPI,A_CPIR,A_CPD,A_CPDR:
  354. result:=SuperRegistersEqual(reg,NR_BC) or SuperRegistersEqual(reg,NR_HL) or RegistersInterfere(reg,NR_A);
  355. A_ADC,A_SBC:
  356. begin
  357. if p.ops<>2 then
  358. internalerror(2020051105);
  359. result:=RegInOp(reg,p.oper[0]^) or
  360. RegInOp(reg,p.oper[1]^) or (reg=NR_CARRYFLAG) or (reg=NR_DEFAULTFLAGS);
  361. end;
  362. A_DAA:
  363. result:=RegistersInterfere(reg,NR_A) or (reg=NR_CARRYFLAG) or (reg=NR_HALFCARRYFLAG) or (reg=NR_ADDSUBTRACTFLAG) or (reg=NR_DEFAULTFLAGS);
  364. A_CPL,A_NEG,A_RLCA,A_RRCA:
  365. result:=RegistersInterfere(reg,NR_A);
  366. A_CCF:
  367. result:=(reg=NR_CARRYFLAG) or (reg=NR_DEFAULTFLAGS);
  368. A_SCF,A_NOP,A_HALT,A_DI,A_EI,A_IM:
  369. result:=false;
  370. A_RLA,A_RRA:
  371. result:=RegistersInterfere(reg,NR_A) or (reg=NR_CARRYFLAG) or (reg=NR_DEFAULTFLAGS);
  372. A_RL,A_RR:
  373. begin
  374. if p.ops<>1 then
  375. internalerror(2020051106);
  376. result:=RegInOp(reg,p.oper[0]^) or (reg=NR_CARRYFLAG) or (reg=NR_DEFAULTFLAGS);
  377. end;
  378. A_RLD,A_RRD:
  379. result:=RegistersInterfere(reg,NR_A) or RegistersInterfere(reg,NR_HL);
  380. A_JP,A_JR,A_JRJP:
  381. begin
  382. if p.ops<>1 then
  383. internalerror(2020051107);
  384. if RegInOp(reg,p.oper[0]^) then
  385. result:=true
  386. else
  387. case p.condition of
  388. C_None:
  389. result:=false;
  390. C_NZ,C_Z:
  391. result:=(reg=NR_ZEROFLAG) or (reg=NR_DEFAULTFLAGS);
  392. C_NC,C_C:
  393. result:=(reg=NR_CARRYFLAG) or (reg=NR_DEFAULTFLAGS);
  394. C_PO,C_PE:
  395. result:=(reg=NR_PARITYOVERFLOWFLAG) or (reg=NR_DEFAULTFLAGS);
  396. C_P,C_M:
  397. result:=(reg=NR_SIGNFLAG) or (reg=NR_DEFAULTFLAGS);
  398. end;
  399. end;
  400. A_DJNZ:
  401. result:=RegistersInterfere(reg,NR_B);
  402. A_CALL,A_RET,A_RETI,A_RETN,A_RST:
  403. result:=true;
  404. A_IN:
  405. begin
  406. if p.ops<>2 then
  407. internalerror(2020051109);
  408. result:=(p.oper[1]^.typ=top_ref) and (p.oper[1]^.ref^.base=NR_C) and RegistersInterfere(reg,NR_BC);
  409. end;
  410. A_OUT:
  411. begin
  412. if p.ops<>2 then
  413. internalerror(2020051110);
  414. result:=RegInOp(reg,p.oper[1]^) or (p.oper[0]^.typ=top_ref) and (p.oper[0]^.ref^.base=NR_C) and RegistersInterfere(reg,NR_BC);
  415. end;
  416. A_INI,A_INIR,A_IND,A_INDR,A_OUTI,A_OTIR,A_OUTD,A_OTDR:
  417. result:=SuperRegistersEqual(reg,NR_BC) or SuperRegistersEqual(reg,NR_HL);
  418. else
  419. internalerror(2020051101);
  420. end;
  421. end;
  422. function TCpuAsmOptimizer.PeepHoleOptPass1Cpu(var p: tai): boolean;
  423. var
  424. hp1,hp2,hp3,hp4,hp5: tai;
  425. alloc, dealloc: tai_regalloc;
  426. i: integer;
  427. l: TAsmLabel;
  428. //TmpUsedRegs : TAllUsedRegs;
  429. begin
  430. result := false;
  431. //case p.typ of
  432. // ait_instruction:
  433. // begin
  434. // end;
  435. //end;
  436. end;
  437. procedure TCpuAsmOptimizer.PeepHoleOptPass2;
  438. begin
  439. end;
  440. begin
  441. casmoptimizer:=TCpuAsmOptimizer;
  442. End.