cpupara.pas 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533
  1. {
  2. Copyright (c) 2002 by Florian Klaempfl
  3. Generates the argument location information for x86-64 target
  4. This program is free software; you can redistribute it and/or modify
  5. it under the terms of the GNU General Public License as published by
  6. the Free Software Foundation; either version 2 of the License, or
  7. (at your option) any later version.
  8. This program is distributed in the hope that it will be useful,
  9. but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  11. GNU General Public License for more details.
  12. You should have received a copy of the GNU General Public License
  13. along with this program; if not, write to the Free Software
  14. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  15. ****************************************************************************
  16. }
  17. unit cpupara;
  18. {$i fpcdefs.inc}
  19. interface
  20. uses
  21. globtype,
  22. cpubase,cgbase,
  23. symconst,symtype,symsym,symdef,
  24. aasmtai,aasmdata,
  25. parabase,paramgr;
  type
    { Parameter manager for the x86-64 target: decides, per parameter and
      per function result, whether a value travels in an integer register,
      an MM register or on the stack. }
    tx86_64paramanager = class(tparamanager)
    private
      { fills in p.funcretloc[side] }
      procedure create_funcretloc_info(p : tabstractprocdef; side : tcallercallee);
      { assigns locations to every entry of paras; the three var arguments
        carry the allocation state from one call to the next }
      procedure create_paraloc_info_intern(p : tabstractprocdef; side : tcallercallee;
                                           paras : tparalist;
                                           var intparareg, mmparareg, parasize : longint);
    public
      function param_use_paraloc(const cgpara : tcgpara) : boolean; override;
      function push_addr_param(varspez : tvarspez; def : tdef;
                               calloption : tproccalloption) : boolean; override;
      procedure getintparaloc(calloption : tproccalloption; nr : longint;
                              var cgpara : TCGPara); override;
      function get_volatile_registers_int(calloption : tproccalloption) : tcpuregisterset; override;
      function get_volatile_registers_mm(calloption : tproccalloption) : tcpuregisterset; override;
      function get_volatile_registers_fpu(calloption : tproccalloption) : tcpuregisterset; override;
      function create_paraloc_info(p : tabstractprocdef; side : tcallercallee) : longint; override;
      function create_varargs_paraloc_info(p : tabstractprocdef;
                                           varargspara : tvarargsparalist) : longint; override;
    end;
  42. implementation
  43. uses
  44. cutils,verbose,
  45. systems,
  46. defutil,
  47. cgutils;
  const
    { integer parameter registers, in allocation order, for every target
      except win64 }
    paraintsupregs : array[0..5] of tsuperregister = (
      RS_RDI,RS_RSI,RS_RDX,
      RS_RCX,RS_R8,RS_R9
    );
    { MM parameter registers, in allocation order, for every target
      except win64 }
    parammsupregs : array[0..7] of tsuperregister = (
      RS_XMM0,RS_XMM1,RS_XMM2,RS_XMM3,
      RS_XMM4,RS_XMM5,RS_XMM6,RS_XMM7
    );

    { integer parameter registers used when targeting win64 }
    paraintsupregs_winx64 : array[0..3] of tsuperregister = (
      RS_RCX,RS_RDX,RS_R8,RS_R9
    );
    { MM parameter registers used when targeting win64 }
    parammsupregs_winx64 : array[0..3] of tsuperregister = (
      RS_XMM0,RS_XMM1,RS_XMM2,RS_XMM3
    );
  { Picks the location class(es) used to pass a value of type p.

    loc1 receives the class of the first (or only) part of the value.
    loc2 receives the class of the second part and stays LOC_INVALID when
    the value is passed in one piece. }
  procedure getvalueparaloc(p : tdef;var loc1,loc2:tcgloc);
    begin
      loc1:=LOC_INVALID;
      loc2:=LOC_INVALID;
      case p.deftype of
        orddef:
          begin
            loc1:=LOC_REGISTER;
            {$warning TODO 128bit also needs lochigh}
          end;
        floatdef:
          begin
            { float types not listed below leave loc1 at LOC_INVALID }
            case tfloatdef(p).typ of
              s32real,
              s64real :
                loc1:=LOC_MMREGISTER;
              s64comp,
              s64currency :
                loc1:=LOC_REGISTER;
              s80real:
                loc1:=LOC_REFERENCE;
              s128real:
                begin
                  { two parts, both in MM registers }
                  loc1:=LOC_MMREGISTER;
                  loc2:=LOC_MMREGISTER;
                  {$warning TODO float 128bit needs SSEUP lochigh}
                end;
            end;
          end;
        recorddef:
          begin
            { both size classes currently end up in memory }
            if p.size>16 then
              loc1:=LOC_REFERENCE
            else
              begin
                {$warning TODO location depends on the fields}
                loc1:=LOC_REFERENCE;
              end;
          end;
        objectdef:
          begin
            if not is_object(p) then
              loc1:=LOC_REGISTER
            else
              loc1:=LOC_REFERENCE;
          end;
        arraydef,
        variantdef:
          loc1:=LOC_REFERENCE;
        stringdef:
          begin
            if is_shortstring(p) or is_longstring(p) then
              loc1:=LOC_REFERENCE
            else
              loc1:=LOC_REGISTER;
          end;
        setdef:
          begin
            if not is_smallset(p) then
              loc1:=LOC_REFERENCE
            else
              loc1:=LOC_REGISTER;
          end;
        procvardef:
          begin
            loc1:=LOC_REGISTER;
            { a method pointer is a record < 16 bytes and needs a second
              register }
            if (po_methodpointer in tprocvardef(p).procoptions) then
              loc2:=LOC_REGISTER;
          end;
        else
          { default for pointers,enums,etc }
          loc1:=LOC_REGISTER;
      end;
    end;
  { Returns true only when every location of cgpara is LOC_REFERENCE.
    Raises internalerror 200410102 when cgpara has no location at all. }
  function tx86_64paramanager.param_use_paraloc(const cgpara:tcgpara):boolean;
    var
      cur : pcgparalocation;
    begin
      cur:=cgpara.location;
      if cur=nil then
        internalerror(200410102);
      result:=true;
      { stop at the first location that is not a memory reference }
      while result and (cur<>nil) do
        begin
          result:=(cur^.loc=LOC_REFERENCE);
          cur:=cur^.next;
        end;
    end;
  { Returns true if a parameter is too large to copy and only its address
    is pushed.

    varspez    - how the parameter was declared (var, out, const, value)
    def        - type of the parameter
    calloption - calling convention of the routine }
  function tx86_64paramanager.push_addr_param(varspez:tvarspez;def : tdef;calloption : tproccalloption) : boolean;
    begin
      { var,out always require address }
      if varspez in [vs_var,vs_out] then
        begin
          result:=true;
          exit;
        end;
      { Only vs_const, vs_value here }
      case def.deftype of
        formaldef,
        variantdef :
          result:=true;
        recorddef :
          result:=(def.size>sizeof(aint));
        arraydef :
          { cdecl array of const must be ignored and therefore be pushed
            as a value parameter with length 0 }
          result:=(not (calloption in [pocall_cdecl,pocall_cppdecl])) or
                  (not (is_array_of_const(def) or is_dynamic_array(def)));
        objectdef :
          result:=is_object(def);
        stringdef :
          result:=(tstringdef(def).string_typ in [st_shortstring,st_longstring]);
        procvardef :
          result:=(po_methodpointer in tprocvardef(def).procoptions);
        setdef :
          result:=(tsetdef(def).settype<>smallset);
        else
          { every other type is passed by value }
          result:=false;
      end;
    end;
  { Returns the set of integer registers reported as volatile.
    NOTE(review): calloption and the target system are not consulted, so
    win64 gets the same set as every other target - confirm this is
    intended. }
  function tx86_64paramanager.get_volatile_registers_int(calloption : tproccalloption):tcpuregisterset;
    begin
      result:=[RS_RAX,
               RS_RDI,RS_RSI,RS_RDX,RS_RCX,
               RS_R8,RS_R9,RS_R10,RS_R11];
    end;
  { Returns the set of MM registers reported as volatile: XMM0 up to and
    including XMM15, independent of calloption. }
  function tx86_64paramanager.get_volatile_registers_mm(calloption : tproccalloption):tcpuregisterset;
    begin
      result:=[RS_XMM0..RS_XMM15];
    end;
  { Returns the set of FPU registers reported as volatile: ST0 up to and
    including ST7, independent of calloption. }
  function tx86_64paramanager.get_volatile_registers_fpu(calloption : tproccalloption):tcpuregisterset;
    begin
      result:=[RS_ST0..RS_ST7];
    end;
  { Describes where the nr-th (1-based) OS_INT sized parameter is passed.

    calloption - calling convention, only used to look up the alignment
    nr         - 1-based parameter number; values below 1 raise
                 internalerror 200304303
    cgpara     - reset and filled with exactly one location: a parameter
                 register while registers last, otherwise a stack slot
                 addressed through the stack pointer }
  procedure tx86_64paramanager.getintparaloc(calloption : tproccalloption; nr : longint;var cgpara:TCGPara);
    var
      paraloc : pcgparalocation;
    begin
      cgpara.reset;
      cgpara.size:=OS_INT;
      cgpara.intsize:=tcgsize2size[OS_INT];
      cgpara.alignment:=get_para_align(calloption);
      paraloc:=cgpara.add_location;
      with paraloc^ do
        begin
          size:=OS_INT;
          if target_info.system=system_x86_64_win64 then
            begin
              if nr<1 then
                internalerror(200304303)
              else if nr<=high(paraintsupregs_winx64)+1 then
                begin
                  loc:=LOC_REGISTER;
                  register:=newreg(R_INTREGISTER,paraintsupregs_winx64[nr-1],R_SUBWHOLE);
                end
              else
                begin
                  loc:=LOC_REFERENCE;
                  reference.index:=NR_STACK_POINTER_REG;
                  { create_paraloc_info starts the win64 stack area at 4*8,
                    i.e. one slot per register parameter precedes the first
                    stack parameter, so parameter nr lives in slot nr-1.
                    The former (nr-6) was copied from the 6-register branch
                    and produced a negative offset for nr=5. }
                  reference.offset:=(nr-1)*sizeof(aint);
                end;
            end
          else
            begin
              if nr<1 then
                internalerror(200304303)
              else if nr<=high(paraintsupregs)+1 then
                begin
                  loc:=LOC_REGISTER;
                  register:=newreg(R_INTREGISTER,paraintsupregs[nr-1],R_SUBWHOLE);
                end
              else
                begin
                  loc:=LOC_REFERENCE;
                  reference.index:=NR_STACK_POINTER_REG;
                  { NOTE(review): the first stack parameter (nr=7) gets
                    offset sizeof(aint) here, while create_paraloc_info_intern
                    places the first stack parameter at offset 0 - confirm
                    which one is intended }
                  reference.offset:=(nr-6)*sizeof(aint);
                end;
            end;
        end;
    end;
  { Fills p.funcretloc[side] with the location of the function result:
    LOC_VOID for void, an MM or FPU register for floats, an integer
    register for results that are not returned through a parameter, and
    LOC_REFERENCE otherwise. }
  procedure tx86_64paramanager.create_funcretloc_info(p : tabstractprocdef; side: tcallercallee);
    var
      retcgsize : tcgsize;
    begin
      { Constructors return self instead of a boolean }
      if (p.proctypeoption<>potype_constructor) then
        retcgsize:=def_cgsize(p.rettype.def)
      else
        retcgsize:=OS_ADDR;

      location_reset(p.funcretloc[side],LOC_INVALID,OS_NO);

      { void has no location }
      if is_void(p.rettype.def) then
        begin
          location_reset(p.funcretloc[side],LOC_VOID,OS_NO);
          exit;
        end;

      { Return in FPU register? }
      if p.rettype.def.deftype=floatdef then
        begin
          case tfloatdef(p.rettype.def).typ of
            s32real,
            s64real:
              begin
                p.funcretloc[side].size:=retcgsize;
                p.funcretloc[side].loc:=LOC_MMREGISTER;
                p.funcretloc[side].register:=NR_MM_RESULT_REG;
              end;
            s80real,
            s64comp,
            s64currency:
              begin
                p.funcretloc[side].size:=retcgsize;
                p.funcretloc[side].loc:=LOC_FPUREGISTER;
                p.funcretloc[side].register:=NR_FPU_RESULT_REG;
              end;
            else
              internalerror(200405034);
          end;
          exit;
        end;

      p.funcretloc[side].size:=retcgsize;
      if ret_in_param(p.rettype.def,p.proccalloption) then
        { the result is returned through a parameter }
        p.funcretloc[side].loc:=LOC_REFERENCE
      else
        begin
          { Return in register; caller and callee side name the result
            register through different constants }
          p.funcretloc[side].loc:=LOC_REGISTER;
          if side<>callerside then
            p.funcretloc[side].register:=newreg(R_INTREGISTER,RS_FUNCTION_RETURN_REG,cgsize2subreg(retcgsize))
          else
            p.funcretloc[side].register:=newreg(R_INTREGISTER,RS_FUNCTION_RESULT_REG,cgsize2subreg(retcgsize));
        end;
    end;
  { Assigns a location (integer register, MM register or stack slot) to
    every parameter in paras and stores it in the parameter's paraloc[side].

    p          - procedure definition; supplies the calling convention
    side       - callerside or calleeside
    paras      - list of tparavarsym entries to process, in order
    intparareg - in/out: index of the next free integer parameter register
    mmparareg  - in/out: index of the next free MM parameter register
    parasize   - in/out: number of bytes of stack used so far

    The three var arguments let a second call (e.g. for varargs) continue
    where the first one stopped. }
  procedure tx86_64paramanager.create_paraloc_info_intern(p : tabstractprocdef; side: tcallercallee;paras:tparalist;
                                                          var intparareg,mmparareg,parasize:longint);
    var
      hp : tparavarsym;
      paraloc : pcgparalocation;
      subreg : tsubregister;
      pushaddr : boolean;
      paracgsize : tcgsize;
      loc : array[1..2] of tcgloc;
      paralen,
      locidx,
      i,
      varalign,
      paraalign : longint;
    begin
      paraalign:=get_para_align(p.proccalloption);
      { Register parameters are assigned from left to right }
      for i:=0 to paras.count-1 do
        begin
          hp:=tparavarsym(paras[i]);
          pushaddr:=push_addr_param(hp.varspez,hp.vartype.def,p.proccalloption);
          if pushaddr then
            begin
              { only the address is passed: one integer register's worth }
              loc[1]:=LOC_REGISTER;
              loc[2]:=LOC_INVALID;
              paracgsize:=OS_ADDR;
              paralen:=sizeof(aint);
            end
          else
            begin
              getvalueparaloc(hp.vartype.def,loc[1],loc[2]);
              paralen:=push_size(hp.varspez,hp.vartype.def,p.proccalloption);
              paracgsize:=def_cgsize(hp.vartype.def);
            end;
          hp.paraloc[side].reset;
          hp.paraloc[side].size:=paracgsize;
          hp.paraloc[side].intsize:=paralen;
          hp.paraloc[side].Alignment:=paraalign;
          if paralen>0 then
            begin
              locidx:=1;
              { one location is added per iteration until the whole
                parameter is covered }
              while (paralen>0) do
                begin
                  if locidx>2 then
                    internalerror(200501283);
                  { Enough registers free? If not, fall back to the stack }
                  case loc[locidx] of
                    LOC_REGISTER :
                      begin
                        { winx64 uses different registers }
                        if ((target_info.system=system_x86_64_win64) and
                            (intparareg>high(paraintsupregs_winx64))) or
                           ((target_info.system<>system_x86_64_win64) and
                            (intparareg>high(paraintsupregs))) then
                          loc[locidx]:=LOC_REFERENCE;
                      end;
                    LOC_MMREGISTER :
                      begin
                        { winx64 uses different registers }
                        if ((target_info.system=system_x86_64_win64) and
                            (mmparareg>high(parammsupregs_winx64))) or
                           ((target_info.system<>system_x86_64_win64) and
                            (mmparareg>high(parammsupregs))) then
                          loc[locidx]:=LOC_REFERENCE;
                      end;
                  end;
                  { Allocate }
                  case loc[locidx] of
                    LOC_REGISTER :
                      begin
                        paraloc:=hp.paraloc[side].add_location;
                        paraloc^.loc:=LOC_REGISTER;
                        { unsized or two-part values are passed in whole
                          registers }
                        if (paracgsize=OS_NO) or (loc[2]<>LOC_INVALID) then
                          begin
                            paraloc^.size:=OS_INT;
                            subreg:=R_SUBWHOLE;
                          end
                        else
                          begin
                            paraloc^.size:=paracgsize;
                            { s64comp is pushed in an int register }
                            if paraloc^.size=OS_C64 then
                              paraloc^.size:=OS_64;
                            subreg:=cgsize2subreg(paraloc^.size);
                          end;
                        { winx64 uses different registers }
                        if target_info.system=system_x86_64_win64 then
                          paraloc^.register:=newreg(R_INTREGISTER,paraintsupregs_winx64[intparareg],subreg)
                        else
                          paraloc^.register:=newreg(R_INTREGISTER,paraintsupregs[intparareg],subreg);
                        inc(intparareg);
                        dec(paralen,tcgsize2size[paraloc^.size]);
                      end;
                    LOC_MMREGISTER :
                      begin
                        paraloc:=hp.paraloc[side].add_location;
                        paraloc^.loc:=LOC_MMREGISTER;
                        { winx64 uses different registers }
                        if target_info.system=system_x86_64_win64 then
                          paraloc^.register:=newreg(R_MMREGISTER,parammsupregs_winx64[mmparareg],R_SUBNONE)
                        else
                          paraloc^.register:=newreg(R_MMREGISTER,parammsupregs[mmparareg],R_SUBNONE);
                        { a 128 bit float is split into OS_F64 sized parts }
                        if paracgsize=OS_F128 then
                          paraloc^.size:=OS_F64
                        else
                          paraloc^.size:=paracgsize;
                        inc(mmparareg);
                        dec(paralen,tcgsize2size[paraloc^.size]);
                      end;
                    LOC_REFERENCE :
                      begin
                        paraloc:=hp.paraloc[side].add_location;
                        paraloc^.loc:=LOC_REFERENCE;
                        if paracgsize in [OS_F32,OS_F64,OS_F80,OS_F128] then
                          paraloc^.size:=int_float_cgsize(paralen)
                        else
                          paraloc^.size:=int_cgsize(paralen);
                        if side=callerside then
                          paraloc^.reference.index:=NR_STACK_POINTER_REG
                        else
                          paraloc^.reference.index:=NR_FRAME_POINTER_REG;
                        varalign:=used_align(size_2_align(paralen),paraalign,paraalign);
                        paraloc^.reference.offset:=parasize;
                        parasize:=align(parasize+paralen,varalign);
                        { the stack slot takes everything that is left }
                        paralen:=0;
                      end;
                  end;
                  { move on to the second part if the value has one }
                  if (locidx<2) and
                     (loc[locidx+1]<>LOC_INVALID) then
                    inc(locidx);
                end;
            end
          else
            begin
              { zero-sized parameter }
              paraloc:=hp.paraloc[side].add_location;
              paraloc^.loc:=LOC_VOID;
            end;
        end;
      { Register parameters are assigned from left-to-right, but the
        offsets on the stack are right-to-left. There is no need
        to reverse the offset, only adapt the calleeside with the
        start offset of the first param on the stack }
      if side=calleeside then
        begin
          for i:=0 to paras.count-1 do
            begin
              hp:=tparavarsym(paras[i]);
              { adjust every location of the parameter, not only the first:
                a later part may have spilled to the stack after an earlier
                part was placed in a register }
              paraloc:=hp.paraloc[side].location;
              while assigned(paraloc) do
                begin
                  if paraloc^.loc=LOC_REFERENCE then
                    inc(paraloc^.reference.offset,target_info.first_parm_offset);
                  paraloc:=paraloc^.next;
                end;
            end;
        end;
    end;
  { Computes caller-side locations for the declared parameters of p
    followed by the variable arguments in varargspara, records the number
    of MM registers used in varargspara.mmregsused and returns the stack
    size needed for the parameters. }
  function tx86_64paramanager.create_varargs_paraloc_info(p : tabstractprocdef; varargspara:tvarargsparalist):longint;
    var
      intparareg,
      mmparareg,
      parasize : longint;
    begin
      intparareg:=0;
      mmparareg:=0;
      parasize:=0;
      { win64 starts with 4*8 bytes already accounted for - presumably the
        stack slots belonging to the four register parameters }
      if target_info.system=system_x86_64_win64 then
        parasize:=4*8;

      { calculate the registers for the normal parameters }
      create_paraloc_info_intern(p,callerside,p.paras,intparareg,mmparareg,parasize);
      { append the varargs, continuing with the same register/stack state }
      create_paraloc_info_intern(p,callerside,varargspara,intparareg,mmparareg,parasize);

      { store used no. of SSE registers, that needs to be passed in %AL }
      varargspara.mmregsused:=mmparareg;
      result:=parasize;
    end;
  { Computes the locations of all parameters of p and of its function
    result for the given side, and returns the size allocated on the
    stack for the parameters. }
  function tx86_64paramanager.create_paraloc_info(p : tabstractprocdef; side: tcallercallee):longint;
    var
      intparareg,
      mmparareg,
      parasize : longint;
    begin
      intparareg:=0;
      mmparareg:=0;
      parasize:=0;
      { win64 starts with 4*8 bytes already accounted for - presumably the
        stack slots belonging to the four register parameters }
      if target_info.system=system_x86_64_win64 then
        parasize:=4*8;

      create_paraloc_info_intern(p,side,p.paras,intparareg,mmparareg,parasize);
      { Create Function result paraloc }
      create_funcretloc_info(p,side);

      { We need to return the size allocated on the stack }
      result:=parasize;
    end;
  { unit initialization: install the x86-64 parameter manager as the
    global paramanager }
  initialization
    paramanager:=tx86_64paramanager.create;
  end.