cpupara.pas 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486
  1. {
  2. Copyright (c) 2002 by Florian Klaempfl
  3. Generates the argument location information for x86-64 target
  4. This program is free software; you can redistribute it and/or modify
  5. it under the terms of the GNU General Public License as published by
  6. the Free Software Foundation; either version 2 of the License, or
  7. (at your option) any later version.
  8. This program is distributed in the hope that it will be useful,
  9. but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  11. GNU General Public License for more details.
  12. You should have received a copy of the GNU General Public License
  13. along with this program; if not, write to the Free Software
  14. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  15. ****************************************************************************
  16. }
  17. unit cpupara;
  18. {$i fpcdefs.inc}
  19. interface
  20. uses
  21. globtype,
  22. cpubase,cgbase,
  23. symconst,symtype,symsym,symdef,
  24. aasmtai,aasmdata,
  25. parabase,paramgr;
  type
    { Parameter manager that generates the argument location information
      for the x86-64 target. }
    tx86_64paramanager = class(tparamanager)
    private
      { Fills in p.funcretloc[side] with the location of the function result. }
      procedure create_funcretloc_info(p : tabstractprocdef; side : tcallercallee);
      { Assigns a location to every entry of paras.  The three var
        parameters carry the next free integer register index, the next
        free SSE register index and the running stack size, so that
        several lists can be processed one after another. }
      procedure create_paraloc_info_intern(p : tabstractprocdef;
                                           side : tcallercallee;
                                           paras : tparalist;
                                           var intparareg,mmparareg,parasize : longint);
    public
      { True when every location of cgpara is a LOC_REFERENCE. }
      function param_use_paraloc(const cgpara : tcgpara) : boolean;override;
      { True when the parameter is passed by address instead of by value. }
      function push_addr_param(varspez : tvarspez;def : tdef;calloption : tproccalloption) : boolean;override;
      { Describes the location of the nr-th (1-based) integer parameter. }
      procedure getintparaloc(calloption : tproccalloption; nr : longint;var cgpara : TCGPara);override;
      { Register sets reported as volatile for each register class. }
      function get_volatile_registers_int(calloption : tproccalloption) : tcpuregisterset;override;
      function get_volatile_registers_mm(calloption : tproccalloption) : tcpuregisterset;override;
      function get_volatile_registers_fpu(calloption : tproccalloption) : tcpuregisterset;override;
      { Computes the parameter and result locations of p for the given
        side; returns the size allocated on the stack. }
      function create_paraloc_info(p : tabstractprocdef; side : tcallercallee) : longint;override;
      { Computes caller-side locations for the declared parameters of p
        followed by varargspara; returns the size allocated on the stack. }
      function create_varargs_paraloc_info(p : tabstractprocdef; varargspara : tvarargsparalist) : longint;override;
    end;
  42. implementation
  43. uses
  44. cutils,verbose,
  45. systems,
  46. defutil,
  47. cgutils;
  const
    { Integer super registers handed out to register parameters; the
      allocator indexes this table with its running integer register
      counter, so the order below is the allocation order. }
    paraintsupregs : array[0..5] of tsuperregister = (
      RS_RDI,RS_RSI,RS_RDX,RS_RCX,RS_R8,RS_R9
    );
    { SSE super registers handed out to register parameters, indexed by
      the running mm register counter. }
    parammsupregs : array[0..7] of tsuperregister = (
      RS_XMM0,RS_XMM1,RS_XMM2,RS_XMM3,
      RS_XMM4,RS_XMM5,RS_XMM6,RS_XMM7
    );
  { Selects the location class(es) used to pass a value of type p.
    loc1 receives the class of the first part and loc2 the class of an
    optional second part; whatever is not needed stays LOC_INVALID.
    Float types that are not listed below leave both at LOC_INVALID. }
  procedure getvalueparaloc(p : tdef;var loc1,loc2:tcgloc);
    begin
      loc1:=LOC_INVALID;
      loc2:=LOC_INVALID;
      case p.deftype of
        orddef:
          begin
            {$warning TODO 128bit also needs lochigh}
            loc1:=LOC_REGISTER;
          end;
        floatdef:
          begin
            case tfloatdef(p).typ of
              s32real,
              s64real :
                loc1:=LOC_MMREGISTER;
              s64currency,
              s64comp :
                loc1:=LOC_REGISTER;
              s80real:
                loc1:=LOC_REFERENCE;
              s128real:
                begin
                  {$warning TODO float 128bit needs SSEUP lochigh}
                  { two SSE parts }
                  loc1:=LOC_MMREGISTER;
                  loc2:=LOC_MMREGISTER;
                end;
            end;
          end;
        recorddef:
          begin
            { both size classes currently end up in memory; the split is
              kept because small records are meant to be classified by
              their fields later on }
            if p.size>16 then
              loc1:=LOC_REFERENCE
            else
              begin
                {$warning TODO location depends on the fields}
                loc1:=LOC_REFERENCE;
              end;
          end;
        objectdef:
          begin
            if not is_object(p) then
              loc1:=LOC_REGISTER
            else
              loc1:=LOC_REFERENCE;
          end;
        arraydef,
        variantdef:
          begin
            loc1:=LOC_REFERENCE;
          end;
        stringdef:
          begin
            if not (is_shortstring(p) or is_longstring(p)) then
              loc1:=LOC_REGISTER
            else
              loc1:=LOC_REFERENCE;
          end;
        setdef:
          begin
            if not is_smallset(p) then
              loc1:=LOC_REFERENCE
            else
              loc1:=LOC_REGISTER;
          end;
        procvardef:
          begin
            loc1:=LOC_REGISTER;
            { a method pointer needs a second integer part }
            if (po_methodpointer in tprocvardef(p).procoptions) then
              loc2:=LOC_REGISTER;
          end;
        else
          begin
            { pointers, enums and everything else not listed above }
            loc1:=LOC_REGISTER;
          end;
      end;
    end;
  { Returns true when every location in cgpara's location list is a
    LOC_REFERENCE.  A cgpara without any location raises internal error
    200410102. }
  function tx86_64paramanager.param_use_paraloc(const cgpara:tcgpara):boolean;
    var
      cur : pcgparalocation;
    begin
      cur:=cgpara.location;
      if not assigned(cur) then
        internalerror(200410102);
      { skip forward while the entries are memory references; relies on
        short-circuit evaluation so cur^ is never read when cur is nil }
      while assigned(cur) and (cur^.loc=LOC_REFERENCE) do
        cur:=cur^.next;
      { reaching the end of the list means no other kind was found }
      result:=not assigned(cur);
    end;
  { Returns true when only the address of the parameter is passed
    instead of a copy of its value.
      varspez    - how the parameter was declared (var, out, const, value)
      def        - type of the parameter
      calloption - calling convention of the routine }
  function tx86_64paramanager.push_addr_param(varspez:tvarspez;def : tdef;calloption : tproccalloption) : boolean;
    begin
      { var and out parameters are always passed by address }
      if varspez in [vs_var,vs_out] then
        begin
          result:=true;
          exit;
        end;
      { from here on only vs_const and vs_value remain }
      case def.deftype of
        variantdef,
        formaldef :
          result:=true;
        recorddef :
          result:=def.size>sizeof(aint);
        arraydef :
          { arrays go by address, except that an array of const or a
            dynamic array of a cdecl/cppdecl routine is treated as a
            value parameter }
          result:=not (calloption in [pocall_cdecl,pocall_cppdecl]) or
                  not (is_array_of_const(def) or is_dynamic_array(def));
        objectdef :
          result:=is_object(def);
        stringdef :
          result:=tstringdef(def).string_typ in [st_shortstring,st_longstring];
        procvardef :
          result:=po_methodpointer in tprocvardef(def).procoptions;
        setdef :
          result:=tsetdef(def).settype<>smallset;
        else
          result:=false;
      end;
    end;
  { Returns the set of integer super registers reported as volatile.
    The calloption argument is not consulted. }
  function tx86_64paramanager.get_volatile_registers_int(calloption : tproccalloption):tcpuregisterset;
    begin
      get_volatile_registers_int:=[
        { the six registers that also appear in paraintsupregs }
        RS_RDI,RS_RSI,RS_RDX,RS_RCX,RS_R8,RS_R9,
        { remaining members }
        RS_RAX,RS_R10,RS_R11
      ];
    end;
  { Returns the set of mm super registers reported as volatile: the whole
    range RS_XMM0..RS_XMM15.  The calloption argument is not consulted. }
  function tx86_64paramanager.get_volatile_registers_mm(calloption : tproccalloption):tcpuregisterset;
    begin
      get_volatile_registers_mm:=[RS_XMM0..RS_XMM15];
    end;
  { Returns the set of fpu super registers reported as volatile: the whole
    range RS_ST0..RS_ST7.  The calloption argument is not consulted. }
  function tx86_64paramanager.get_volatile_registers_fpu(calloption : tproccalloption):tcpuregisterset;
    begin
      get_volatile_registers_fpu:=[RS_ST0..RS_ST7];
    end;
  { Describes where the nr-th integer parameter lives.
      calloption - calling convention, only used to query the alignment
      nr         - 1-based parameter number; values below 1 raise
                   internal error 200304303
      cgpara     - reset and then filled with a single OS_INT location }
  procedure tx86_64paramanager.getintparaloc(calloption : tproccalloption; nr : longint;var cgpara:TCGPara);
    var
      entry : pcgparalocation;
    begin
      cgpara.reset;
      cgpara.size:=OS_INT;
      cgpara.intsize:=tcgsize2size[OS_INT];
      cgpara.alignment:=get_para_align(calloption);
      entry:=cgpara.add_location;
      entry^.size:=OS_INT;
      if nr<1 then
        internalerror(200304303)
      else if nr>high(paraintsupregs)+1 then
        begin
          { no parameter register left for this number: address it
            relative to the stack pointer }
          entry^.loc:=LOC_REFERENCE;
          entry^.reference.index:=NR_STACK_POINTER_REG;
          { NOTE(review): with this formula the first stack slot (nr=7)
            gets offset sizeof(aint), not 0 - confirm this is intended }
          entry^.reference.offset:=(nr-6)*sizeof(aint);
        end
      else
        begin
          { parameter nr uses entry nr-1 of the register table }
          entry^.loc:=LOC_REGISTER;
          entry^.register:=newreg(R_INTREGISTER,paraintsupregs[nr-1],R_SUBWHOLE);
        end;
    end;
  { Fills in p.funcretloc[side], the location of the function result.
      void result               -> LOC_VOID
      s32real, s64real          -> LOC_MMREGISTER (NR_MM_RESULT_REG)
      s64currency, s64comp,
      s80real                   -> LOC_FPUREGISTER (NR_FPU_RESULT_REG)
      other float types         -> internal error 200405034
      result passed as param    -> LOC_REFERENCE
      everything else           -> LOC_REGISTER }
  procedure tx86_64paramanager.create_funcretloc_info(p : tabstractprocdef; side: tcallercallee);
    var
      ressize : tcgsize;
      resreg : tsuperregister;
    begin
      { a constructor returns self, not a boolean }
      if (p.proctypeoption<>potype_constructor) then
        ressize:=def_cgsize(p.rettype.def)
      else
        ressize:=OS_ADDR;

      location_reset(p.funcretloc[side],LOC_INVALID,OS_NO);

      { nothing is returned at all }
      if is_void(p.rettype.def) then
        begin
          location_reset(p.funcretloc[side],LOC_VOID,OS_NO);
          exit;
        end;

      { floating point results }
      if p.rettype.def.deftype=floatdef then
        begin
          case tfloatdef(p.rettype.def).typ of
            s32real,
            s64real:
              begin
                p.funcretloc[side].size:=ressize;
                p.funcretloc[side].loc:=LOC_MMREGISTER;
                p.funcretloc[side].register:=NR_MM_RESULT_REG;
              end;
            s64currency,
            s64comp,
            s80real:
              begin
                p.funcretloc[side].size:=ressize;
                p.funcretloc[side].loc:=LOC_FPUREGISTER;
                p.funcretloc[side].register:=NR_FPU_RESULT_REG;
              end;
            else
              internalerror(200405034);
          end;
          exit;
        end;

      { results that are handed back through a hidden parameter }
      if ret_in_param(p.rettype.def,p.proccalloption) then
        begin
          p.funcretloc[side].loc:=LOC_REFERENCE;
          p.funcretloc[side].size:=ressize;
          exit;
        end;

      { everything else comes back in an integer register; the caller
        and the callee side name the register through different constants }
      if side=callerside then
        resreg:=RS_FUNCTION_RESULT_REG
      else
        resreg:=RS_FUNCTION_RETURN_REG;
      p.funcretloc[side].loc:=LOC_REGISTER;
      p.funcretloc[side].size:=ressize;
      p.funcretloc[side].register:=newreg(R_INTREGISTER,resreg,cgsize2subreg(ressize));
    end;
  { Assigns a location to every parameter in paras.
      p          - routine the parameters belong to (supplies the calling
                   convention)
      side       - callerside or calleeside; selects which paraloc entry of
                   each parameter is filled and which base register stack
                   references use
      paras      - parameters to process, handled from index 0 upwards
      intparareg - in/out: index of the next free entry in paraintsupregs
      mmparareg  - in/out: index of the next free entry in parammsupregs
      parasize   - in/out: number of stack bytes handed out so far

    A parameter is described by one or two locations.  When the register
    class wanted for a part has no free register left, that part is placed
    on the stack instead.  On the callee side target_info.first_parm_offset
    is finally added to every stack reference. }
  procedure tx86_64paramanager.create_paraloc_info_intern(p : tabstractprocdef; side: tcallercallee;paras:tparalist;
                                                          var intparareg,mmparareg,parasize:longint);
    var
      hp : tparavarsym;
      paraloc : pcgparalocation;
      subreg : tsubregister;
      pushaddr : boolean;
      paracgsize : tcgsize;
      loc : array[1..2] of tcgloc;
      paralen,
      locidx,
      i,
      varalign,
      paraalign : longint;
    begin
      paraalign:=get_para_align(p.proccalloption);
      { Register parameters are assigned from left to right }
      for i:=0 to paras.count-1 do
        begin
          hp:=tparavarsym(paras[i]);
          pushaddr:=push_addr_param(hp.varspez,hp.vartype.def,p.proccalloption);
          if pushaddr then
            begin
              { only the address is passed: one integer register wide }
              loc[1]:=LOC_REGISTER;
              loc[2]:=LOC_INVALID;
              paracgsize:=OS_ADDR;
              paralen:=sizeof(aint);
            end
          else
            begin
              getvalueparaloc(hp.vartype.def,loc[1],loc[2]);
              paralen:=push_size(hp.varspez,hp.vartype.def,p.proccalloption);
              paracgsize:=def_cgsize(hp.vartype.def);
            end;
          hp.paraloc[side].reset;
          hp.paraloc[side].size:=paracgsize;
          hp.paraloc[side].intsize:=paralen;
          hp.paraloc[side].Alignment:=paraalign;
          if paralen>0 then
            begin
              locidx:=1;
              { paralen counts the bytes that still need a location }
              while (paralen>0) do
                begin
                  if locidx>2 then
                    internalerror(200501283);
                  { Enough registers free?  If not, this part goes to the stack }
                  case loc[locidx] of
                    LOC_REGISTER :
                      begin
                        if (intparareg>high(paraintsupregs)) then
                          loc[locidx]:=LOC_REFERENCE;
                      end;
                    LOC_MMREGISTER :
                      begin
                        if (mmparareg>high(parammsupregs)) then
                          loc[locidx]:=LOC_REFERENCE;
                      end;
                  end;
                  { Allocate }
                  case loc[locidx] of
                    LOC_REGISTER :
                      begin
                        paraloc:=hp.paraloc[side].add_location;
                        paraloc^.loc:=LOC_REGISTER;
                        { parameters without a cgsize and two-part
                          parameters use whole OS_INT registers }
                        if (paracgsize=OS_NO) or (loc[2]<>LOC_INVALID) then
                          begin
                            paraloc^.size:=OS_INT;
                            subreg:=R_SUBWHOLE;
                          end
                        else
                          begin
                            paraloc^.size:=paracgsize;
                            { s64comp is pushed in an int register }
                            if paraloc^.size=OS_C64 then
                              paraloc^.size:=OS_64;
                            subreg:=cgsize2subreg(paraloc^.size);
                          end;
                        paraloc^.register:=newreg(R_INTREGISTER,paraintsupregs[intparareg],subreg);
                        inc(intparareg);
                        dec(paralen,tcgsize2size[paraloc^.size]);
                      end;
                    LOC_MMREGISTER :
                      begin
                        paraloc:=hp.paraloc[side].add_location;
                        paraloc^.loc:=LOC_MMREGISTER;
                        paraloc^.register:=newreg(R_MMREGISTER,parammsupregs[mmparareg],R_SUBNONE);
                        { a 128 bit float is described as two OS_F64 parts }
                        if paracgsize=OS_F128 then
                          paraloc^.size:=OS_F64
                        else
                          paraloc^.size:=paracgsize;
                        inc(mmparareg);
                        dec(paralen,tcgsize2size[paraloc^.size]);
                      end;
                    LOC_REFERENCE :
                      begin
                        paraloc:=hp.paraloc[side].add_location;
                        paraloc^.loc:=LOC_REFERENCE;
                        if paracgsize in [OS_F32,OS_F64,OS_F80,OS_F128] then
                          paraloc^.size:=int_float_cgsize(paralen)
                        else
                          paraloc^.size:=int_cgsize(paralen);
                        if side=callerside then
                          paraloc^.reference.index:=NR_STACK_POINTER_REG
                        else
                          paraloc^.reference.index:=NR_FRAME_POINTER_REG;
                        varalign:=used_align(size_2_align(paralen),paraalign,paraalign);
                        paraloc^.reference.offset:=parasize;
                        parasize:=align(parasize+paralen,varalign);
                        { the stack slot takes everything that was left }
                        paralen:=0;
                      end;
                  end;
                  { move on to the second part when there is one }
                  if (locidx<2) and
                     (loc[locidx+1]<>LOC_INVALID) then
                    inc(locidx);
                end;
            end
          else
            begin
              { empty parameter: record a single LOC_VOID location }
              paraloc:=hp.paraloc[side].add_location;
              paraloc^.loc:=LOC_VOID;
            end;
        end;
      { Register parameters are assigned from left-to-right, but the
        offsets on the stack are right-to-left. There is no need
        to reverse the offset, only adapt the calleeside with the
        start offset of the first param on the stack }
      if side=calleeside then
        begin
          for i:=0 to paras.count-1 do
            begin
              hp:=tparavarsym(paras[i]);
              { Walk the complete location list: a two-part parameter can
                have its first part in a register and its second part on
                the stack, and that second part needs the offset too }
              paraloc:=hp.paraloc[side].location;
              while assigned(paraloc) do
                begin
                  if (paraloc^.loc=LOC_REFERENCE) then
                    inc(paraloc^.reference.offset,target_info.first_parm_offset);
                  paraloc:=paraloc^.next;
                end;
            end;
        end;
    end;
  { Computes the caller-side locations for a call that passes varargs.
    The declared parameters of p are placed first and the entries of
    varargspara continue with the same register and stack counters.
    Stores the number of SSE registers used in varargspara.mmregsused and
    returns the stack size that was allocated. }
  function tx86_64paramanager.create_varargs_paraloc_info(p : tabstractprocdef; varargspara:tvarargsparalist):longint;
    var
      usedintregs,
      usedmmregs,
      stackbytes : longint;
    begin
      stackbytes:=0;
      usedmmregs:=0;
      usedintregs:=0;
      { the normal parameters come first ... }
      create_paraloc_info_intern(p,callerside,p.paras,usedintregs,usedmmregs,stackbytes);
      { ... and the varargs are appended behind them }
      create_paraloc_info_intern(p,callerside,varargspara,usedintregs,usedmmregs,stackbytes);
      { the used no. of SSE registers needs to be passed in %AL }
      varargspara.mmregsused:=usedmmregs;
      create_varargs_paraloc_info:=stackbytes;
    end;
  { Computes the locations of all parameters of p and of its function
    result for the requested side.  Returns the size allocated on the
    stack for the parameters. }
  function tx86_64paramanager.create_paraloc_info(p : tabstractprocdef; side: tcallercallee):longint;
    var
      usedintregs,
      usedmmregs,
      stackbytes : longint;
    begin
      stackbytes:=0;
      usedmmregs:=0;
      usedintregs:=0;
      create_paraloc_info_intern(p,side,p.paras,usedintregs,usedmmregs,stackbytes);
      { the function result gets its location as well }
      create_funcretloc_info(p,side);
      create_paraloc_info:=stackbytes;
    end;
  { Unit start-up code: installs an instance of the x86-64 parameter
    manager in the paramanager variable. }
  initialization
    paramanager:=tx86_64paramanager.create;
  end.