llvmdef.pas 36 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919
  1. {
  2. Copyright (c) 2013 by Jonas Maebe
  3. This unit implements some LLVM type helper routines.
  4. This program is free software; you can redistribute it and/or modify
  5. it under the terms of the GNU General Public License as published by
  6. the Free Software Foundation; either version 2 of the License, or
  7. (at your option) any later version.
  8. This program is distributed in the hope that it will be useful,
  9. but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  11. GNU General Public License for more details.
  12. You should have received a copy of the GNU General Public License
  13. along with this program; if not, write to the Free Software
  14. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  15. ****************************************************************************
  16. }
  17. {$i fpcdefs.inc}
  18. unit llvmdef;
  19. interface
  20. uses
  21. cclasses,globtype,
  22. aasmbase,
  23. parabase,
  24. symbase,symtype,symdef,
  25. llvmbase;
  26. type
  27. { there are four different circumstances in which procdefs are used:
  28. a) definition of a procdef that's implemented in the current module
  29. b) declaration of an external routine that's called in the current one
  30. c) alias declaration of a procdef implemented in the current module
  31. d) defining a procvar type
  32. The main differences between the contexts are:
  33. a) information about sign extension of result type, proc name, parameter names & sign-extension info & types
  34. b) information about sign extension of result type, proc name, no parameter names, with parameter sign-extension info & types
  35. c) no information about sign extension of result type, proc name, no parameter names, no information about sign extension of parameters, parameter types
  36. d) no information about sign extension of result type, no proc name, no parameter names, no information about sign extension of parameters, parameter types
  37. }
  38. tllvmprocdefdecltype = (lpd_def,lpd_decl,lpd_alias,lpd_procvar);
  39. { returns the identifier to use as typename for a def in llvm (llvm only
  40. allows naming struct types) -- only supported for defs with a typesym, and
  41. only for tabstractrecorddef descendants and complex procvars }
  42. function llvmtypeidentifier(def: tdef): TSymStr;
  43. { encode a type into the internal format used by LLVM (for a type
  44. declaration) }
  45. function llvmencodetypedecl(def: tdef): TSymStr;
  46. { same as above, but use a type name if possible (for any use) }
  47. function llvmencodetypename(def: tdef): TSymStr;
  48. { encode a procdef/procvardef into the internal format used by LLVM }
  49. function llvmencodeproctype(def: tabstractprocdef; const customname: TSymStr; pddecltype: tllvmprocdefdecltype): TSymStr;
  50. { incremental version of the above }
  51. procedure llvmaddencodedproctype(def: tabstractprocdef; const customname: TSymStr; pddecltype: tllvmprocdefdecltype; var encodedstr: TSymStr);
  52. { function result types may have to be represented differently, e.g. a
  53. record consisting of 4 longints must be returned as a record consisting of
  54. two int64's on x86-64. This function is used to create (and reuse)
  55. temporary recorddefs for such purposes.}
  56. function llvmgettemprecorddef(fieldtypes: tfplist; packrecords, recordalignmin, maxcrecordalign: shortint): trecorddef;
  57. { get the llvm type corresponding to a parameter, e.g. a record containing
  58. two integer int64 for an arbitrary record split over two individual int64
  59. parameters, or an int32 for an int16 parameter on a platform that requires
  60. such parameters to be zero/sign extended. The second parameter can be used
  61. to get the type before zero/sign extension, as e.g. required to generate
  62. function declarations. }
  63. function llvmgetcgparadef(const cgpara: tcgpara; beforevalueext: boolean): tdef;
  64. { can be used to extract the value extension info from a cgpara. Pass in
  65. the def of the cgpara as first parameter and a local variable holding
  66. a copy of the def of the location (value extension only makes sense for
  67. ordinal parameters that are smaller than a single location). The routine
  68. will return the def of the location without sign extension (if applicable)
  69. and the kind of sign extension that was originally performed in the
  70. signext parameter }
  71. procedure llvmextractvalueextinfo(paradef: tdef; var paralocdef: tdef; out signext: tllvmvalueextension);
  72. { returns whether a paraloc should be translated into an llvm "byval"
  73. parameter. These are declared as pointers to a particular type, but
  74. usually turned into copies onto the stack. The exact behaviour for
  75. parameters that should be passed in registers is undefined and depends on
  76. the platform, and furthermore this modifier sometimes inhibits
  77. optimizations. As a result, we only use it for aggregate parameters of
  78. which we know that they should be passed on the stack }
  79. function llvmbyvalparaloc(paraloc: pcgparalocation): boolean;
  80. { returns whether a def is represented by an aggregate type in llvm
  81. (struct, array) }
  82. function llvmaggregatetype(def: tdef): boolean;
  83. function llvmconvop(var fromsize, tosize: tdef; inregs: boolean): tllvmop;
  84. { mangle a global identifier so that it's recognised by LLVM as a global
  85. (in the sense of module-global) label and so that it won't mangle the
  86. name further according to platform conventions (we already did that) }
  87. function llvmmangledname(const s: TSymStr): TSymStr;
  88. function llvmasmsymname(const sym: TAsmSymbol): TSymStr;
  89. implementation
  90. uses
  91. globals,cutils,constexp,
  92. verbose,systems,
  93. fmodule,
  94. symtable,symconst,symsym,
  95. llvmsym,hlcgobj,
  96. defutil,blockutl,cgbase,paramgr;
  97. {******************************************************************
  98. Type encoding
  99. *******************************************************************}
  { Builds the llvm type identifier for a named def: the quoted string
    %"typ.<owner hierarchy><real name of the typesym>".
    Triggers internalerror 2015041901 when def has no typesym. }
  function llvmtypeidentifier(def: tdef): TSymStr;
    begin
      { defs without a typesym cannot be referred to by name }
      if def.typesym=nil then
        internalerror(2015041901);
      result:='%"typ.'+def.fullownerhierarchyname(false)+def.typesym.realname+'"';
    end;
  { Returns true when def is encoded as an aggregate: record, file and
    variant defs, arrays that are not dynamic arrays, sets that are not small
    sets, defs for which is_shortstring or is_object holds, and procvars
    that are not address-only. The checks are performed in that order and
    stop at the first one that succeeds. }
  function llvmaggregatetype(def: tdef): boolean;
    begin
      result:=true;
      if def.typ in [recorddef,filedef,variantdef] then
        exit;
      if (def.typ=arraydef) and
         not is_dynamic_array(def) then
        exit;
      if (def.typ=setdef) and
         not is_smallset(def) then
        exit;
      if is_shortstring(def) or
         is_object(def) then
        exit;
      { last candidate: a procvar that carries more than a code address }
      result:=(def.typ=procvardef) and
        not tprocvardef(def).is_addressonly;
    end;
  { Helper for llvmconvop: returns the byte size of def that is used to
    decide between truncation, extension and bitcast.
    If inregs is set and def is a floatdef:
      - comp and currency are replaced by sc80floattype (def is updated)
      - s80real is measured with the size of sc80floattype
    In all other cases the plain size of def is returned. }
  function llvmconvop_valuesize(var def: tdef; inregs: boolean): asizeint;
    begin
      if inregs and
         (def.typ=floatdef) then
        begin
          { treat comp and currency as extended in registers (see comment at
            start of thlcgobj.a_loadfpu_ref_reg) }
          if tfloatdef(def).floattype in [s64comp,s64currency] then
            def:=sc80floattype;
          { at the value level, s80real and sc80real are the same }
          if tfloatdef(def).floattype<>s80real then
            result:=def.size
          else
            result:=sc80floattype.size;
        end
      else
        result:=def.size;
    end;

  { Selects the llvm operation needed to convert a value of type fromsize
    into a value of type tosize.
      fromsize, tosize: source and destination defs; when inregs is set and
        neither side lives in an address register, comp/currency defs are
        replaced by sc80floattype in these var parameters
      inregs: the value is held in a register
    Returns one of the la_* conversion opcodes. Triggers internalerror
    2014062203 for a size-changing conversion from an fpu/mm register type
    to a non fpu/mm register type, and internalerror 2016052001 for a
    same-size conversion from a cbool to llvmbool1type. }
  function llvmconvop(var fromsize, tosize: tdef; inregs: boolean): tllvmop;
    var
      fromregtyp,
      toregtyp: tregistertype;
      frombytesize,
      tobytesize: asizeint;
    begin
      fromregtyp:=chlcgobj.def2regtyp(fromsize);
      toregtyp:=chlcgobj.def2regtyp(tosize);
      { int to pointer or vice versa }
      if fromregtyp=R_ADDRESSREGISTER then
        begin
          case toregtyp of
            R_INTREGISTER:
              result:=la_ptrtoint;
            R_ADDRESSREGISTER:
              result:=la_bitcast;
            else
              result:=la_ptrtoint_to_x;
          end;
        end
      else if toregtyp=R_ADDRESSREGISTER then
        begin
          { fromregtyp cannot be R_ADDRESSREGISTER here (handled above), so
            only the integer and the "anything else" cases remain }
          if fromregtyp=R_INTREGISTER then
            result:=la_inttoptr
          else
            result:=la_x_to_inttoptr;
        end
      else
        begin
          frombytesize:=llvmconvop_valuesize(fromsize,inregs);
          tobytesize:=llvmconvop_valuesize(tosize,inregs);
          { need zero/sign extension, float truncation or plain bitcast? }
          if tobytesize<>frombytesize then
            begin
              case fromregtyp of
                R_FPUREGISTER,
                R_MMREGISTER:
                  begin
                    { todo: update once we support vectors }
                    if not(toregtyp in [R_FPUREGISTER,R_MMREGISTER]) then
                      internalerror(2014062203);
                    if tobytesize<frombytesize then
                      result:=la_fptrunc
                    else
                      result:=la_fpext
                  end;
                else
                  begin
                    if tobytesize<frombytesize then
                      result:=la_trunc
                    else if is_signed(fromsize) then
                      { fromsize is signed -> sign extension }
                      result:=la_sext
                    else
                      result:=la_zext;
                  end;
              end;
            end
          else if (fromsize=llvmbool1type) and
                  (tosize<>llvmbool1type) then
            begin
              { i1 -> same-sized boolean: cbools are sign extended, all
                others zero extended }
              if is_cbool(tosize) then
                result:=la_sext
              else
                result:=la_zext
            end
          else if (tosize=llvmbool1type) and
                  (fromsize<>llvmbool1type) then
            begin
              { would have to compare with 0, can't just take the lowest bit }
              if is_cbool(fromsize) then
                internalerror(2016052001)
              else
                result:=la_trunc
            end
          else
            result:=la_bitcast;
        end;
    end;
  { Turns a symbol name into an llvm global identifier.
      - names starting with "llvm." only get an "@" prefix
      - names that already start with a double quote get "@" prepended and
        \01 inserted right after the opening quote
      - all other names are wrapped as @"\01<name>" }
  function llvmmangledname(const s: TSymStr): TSymStr;
    const
      intrinsicprefix = 'llvm.';
    begin
      if copy(s,1,length(intrinsicprefix))=intrinsicprefix then
        result:='@'+s
      else if s[1]='"' then
        begin
          { already quoted -> prepend @ and insert \01 behind the quote,
            i.e. at position 3 of the result }
          result:='@'+s;
          insert('\01',result,3);
        end
      else
        result:='@"\01'+s+'"';
    end;
  { Returns the llvm spelling of an assembler symbol:
      - AB_TEMP symbols become %<name>
      - AT_LABEL and AT_ADDR symbols (labels in the code, which have a
        different type in llvm than (global) data labels) become
        "label %<name>"
      - everything else goes through llvmmangledname }
  function llvmasmsymname(const sym: TAsmSymbol): TSymStr;
    begin
      if sym.bind=AB_TEMP then
        result:='%'+sym.name
      else if sym.typ in [AT_LABEL,AT_ADDR] then
        result:='label %'+sym.name
      else
        result:=llvmmangledname(sym.name);
    end;
  { Decides whether a parameter location is declared as an llvm "byval"
    parameter.

    "byval" is broken for register paras on several platforms in llvm
    (search for "byval" in llvm's bug tracker). Additionally, it should only
    be used to pass aggregate parameters on the stack, because it reportedly
    inhibits llvm's midlevel optimizers.

    Exception (for now?): parameters that have special shifting
    requirements, because modelling those in llvm is not easy (and neither
    clang nor llvm-gcc seem to do so either) }
  function llvmbyvalparaloc(paraloc: pcgparalocation): boolean;
    begin
      case paraloc^.loc of
        LOC_REFERENCE:
          { in memory: only aggregates }
          result:=llvmaggregatetype(paraloc^.def);
        LOC_REGISTER,
        LOC_CREGISTER:
          { in a register: only when the value has to be shifted }
          result:=paraloc^.shiftval<>0;
        else
          result:=false;
      end;
    end;
  268. procedure llvmaddencodedabstractrecordtype(def: tabstractrecorddef; var encodedstr: TSymStr); forward;
  269. type
  270. tllvmencodeflag = (lef_inaggregate, lef_noimplicitderef, lef_typedecl);
  271. tllvmencodeflags = set of tllvmencodeflag;
  { Appends the llvm encoding of def to encodedstr.
      flags:
        lef_inaggregate     - def is encoded as an element of an aggregate
        lef_noimplicitderef - do not add the implicit pointer level of
                              implicit-pointer object types/interfaces
        lef_typedecl        - the encoding is for the declaration of the type
                              itself, so the type is expanded instead of
                              being referred to by name
    Triggers an internalerror for defs that cannot be encoded. }
  procedure llvmaddencodedtype_intern(def: tdef; const flags: tllvmencodeflags; var encodedstr: TSymStr);
    var
      { flags used when a system helper type is encoded in place of def:
        always "in aggregate", lef_typedecl taken over from the caller }
      substflags: tllvmencodeflags;
      { a def with a typesym may be referred to by name (this avoids
        endlessly recursive definitions) }
      bynameok,
      { typed file that carries an ISO-like get/put buffer }
      hasisobuffer: boolean;

    { appends s to the string that is being built }
    procedure emit(const s: TSymStr);
      begin
        encodedstr:=encodedstr+s;
      end;

    begin
      substflags:=[lef_inaggregate]+[lef_typedecl]*flags;
      bynameok:=
        (lef_inaggregate in flags) or
        not(lef_typedecl in flags);
      case def.typ of
        stringdef:
          case tstringdef(def).stringtype of
            st_widestring,
            st_unicodestring:
              { the variable does not point to the header, but to a
                null-terminated string/array with undefined bounds }
              emit('i16*');
            st_ansistring:
              emit('i8*');
            st_shortstring:
              { length byte followed by string bytes }
              if tstringdef(def).len>0 then
                emit('['+tostr(tstringdef(def).len+1)+' x i8]')
              else
                emit('[0 x i8]');
            else
              internalerror(2013100201);
          end;
        enumdef:
          emit('i'+tostr(def.size*8));
        orddef:
          if is_void(def) then
            emit('void')
          { mainly required because comparison operations return i1, and
            we need a way to represent the i1 type in Pascal. We don't
            reuse pasbool8type, because putting an i1 in a record or
            passing it as a parameter may result in unexpected behaviour }
          else if def=llvmbool1type then
            emit('i1')
          else
            emit('i'+tostr(def.size*8));
        pointerdef:
          if is_voidpointer(def) then
            emit('i8*')
          else
            begin
              llvmaddencodedtype_intern(tpointerdef(def).pointeddef,[],encodedstr);
              emit('*');
            end;
        floatdef:
          case tfloatdef(def).floattype of
            s32real:
              emit('float');
            s64real:
              emit('double');
            { necessary to be able to force our own size/alignment }
            s80real:
              { prevent llvm from allocating the standard ABI size for
                extended }
              if lef_inaggregate in flags then
                emit('[10 x i8]')
              else
                emit('x86_fp80');
            sc80real:
              emit('x86_fp80');
            s64comp,
            s64currency:
              emit('i64');
            s128real:
{$if defined(powerpc) or defined(powerpc128)}
              emit('ppc_fp128');
{$else}
              emit('fp128');
{$endif}
            else
              internalerror(2013100202);
          end;
        filedef:
          case tfiledef(def).filetyp of
            ft_text:
              llvmaddencodedtype_intern(search_system_type('TEXTREC').typedef,substflags,encodedstr);
            ft_typed:
              begin
                { in case of ISO-like I/O, the typed file def includes a
                  get/put buffer of the size of the file's elements }
                hasisobuffer:=
                  (m_isolike_io in current_settings.modeswitches) and
                  not is_void(tfiledef(def).typedfiledef);
                if hasisobuffer then
                  emit('<{');
                llvmaddencodedtype_intern(search_system_type('FILEREC').typedef,substflags,encodedstr);
                if hasisobuffer then
                  emit(',['+tostr(tfiledef(def).typedfiledef.size)+' x i8]}>');
              end;
            ft_untyped:
              llvmaddencodedtype_intern(search_system_type('FILEREC').typedef,substflags,encodedstr);
            else
              internalerror(2013100203);
          end;
        recorddef:
          { avoid endlessly recursive definitions }
          if assigned(def.typesym) and
             bynameok then
            emit(llvmtypeidentifier(def))
          else
            llvmaddencodedabstractrecordtype(trecorddef(def),encodedstr);
        variantdef:
          llvmaddencodedtype_intern(search_system_type('TVARDATA').typedef,substflags,encodedstr);
        classrefdef:
          if is_class(tclassrefdef(def).pointeddef) then
            begin
              { pointer to the vmt of the class }
              llvmaddencodedtype_intern(tobjectdef(tclassrefdef(def).pointeddef).vmt_def,flags,encodedstr);
              emit('*');
            end
          else if is_objcclass(tclassrefdef(def).pointeddef) then
            llvmaddencodedtype_intern(objc_idtype,flags,encodedstr)
          else
            emit('i8*');
        setdef:
          { just an array as far as llvm is concerned; don't use a "packed
            array of i1" or so, this requires special support in backends
            and guarantees nothing about the internal format }
          if is_smallset(def) then
            llvmaddencodedtype_intern(cgsize_orddef(def_cgsize(def)),[lef_inaggregate],encodedstr)
          else
            emit('['+tostr(tsetdef(def).size)+' x i8]');
        formaldef:
          { var/const/out x (always treated as "pass by reference" -> don't
            add extra "*" here) }
          emit('i8');
        arraydef:
          if is_array_of_const(def) then
            begin
              emit('[0 x ');
              llvmaddencodedtype_intern(search_system_type('TVARREC').typedef,[lef_inaggregate],encodedstr);
              emit(']');
            end
          else if is_open_array(def) then
            begin
              emit('[0 x ');
              llvmaddencodedtype_intern(tarraydef(def).elementdef,[lef_inaggregate],encodedstr);
              emit(']');
            end
          else if is_dynamic_array(def) then
            begin
              llvmaddencodedtype_intern(tarraydef(def).elementdef,[lef_inaggregate],encodedstr);
              emit('*');
            end
          else if is_packed_array(def) and
                  (tarraydef(def).elementdef.typ in [enumdef,orddef]) then
            begin
              { encode as an array of bytes rather than as an array of
                packedbitsloadsize(elesize), because even if the load size
                is e.g. 2 bytes, the array may only be 1 or 3 bytes long
                (and if this array is inside a record, it must not be
                encoded as a type that is too long) }
              emit('['+tostr(tarraydef(def).size)+' x ');
              llvmaddencodedtype_intern(u8inttype,[lef_inaggregate],encodedstr);
              emit(']');
            end
          else
            begin
              emit('['+tostr(tarraydef(def).elecount)+' x ');
              llvmaddencodedtype_intern(tarraydef(def).elementdef,[lef_inaggregate],encodedstr);
              emit(']');
            end;
        procdef,
        procvardef:
          if (def.typ=procdef) or
             tprocvardef(def).is_addressonly then
            begin
              llvmaddencodedproctype(tabstractprocdef(def),'',lpd_procvar,encodedstr);
              { a procvar is a pointer to the routine type }
              if def.typ=procvardef then
                emit('*');
            end
          else if bynameok and
                  assigned(tprocvardef(def).typesym) then
            begin
              { in case the procvardef recursively references itself, e.g.
                via a pointer }
              emit(llvmtypeidentifier(def));
              { blocks are implicit pointers }
              if is_block(def) then
                emit('*');
            end
          else if is_block(def) then
            llvmaddencodedtype_intern(get_block_literal_type_for_proc(tabstractprocdef(def)),flags,encodedstr)
          else
            begin
              emit('<{');
              { code pointer }
              llvmaddencodedproctype(tabstractprocdef(def),'',lpd_procvar,encodedstr);
              { data pointer (maybe todo: generate actual layout if
                available) }
              emit('*, i8*}>');
            end;
        objectdef:
          case tobjectdef(def).objecttype of
            odt_class,
            odt_objcclass,
            odt_object,
            odt_cppclass:
              begin
                if not(lef_typedecl in flags) and
                   assigned(def.typesym) then
                  emit(llvmtypeidentifier(def))
                else
                  llvmaddencodedabstractrecordtype(tabstractrecorddef(def),encodedstr);
                if ([lef_typedecl,lef_noimplicitderef]*flags=[]) and
                   is_implicit_pointer_object_type(def) then
                  emit('*');
              end;
            odt_interfacecom,
            odt_interfacecorba,
            odt_dispinterface:
              begin
                { type is a pointer to a pointer to the vmt }
                llvmaddencodedtype_intern(tobjectdef(def).vmt_def,flags,encodedstr);
                if ([lef_typedecl,lef_noimplicitderef]*flags=[]) then
                  emit('**');
              end;
            odt_interfacecom_function,
            odt_interfacecom_property,
            odt_objcprotocol:
              { opaque for now }
              emit('i8*');
            else
              internalerror(2013100601);
          end;
        undefineddef,
        errordef:
          internalerror(2013100604);
        else
          internalerror(2013100603);
      end;
    end;
  { Returns the llvm encoding of def for use sites: encoded without any
    flags, so a type name is used wherever llvmaddencodedtype_intern allows
    it. }
  function llvmencodetypename(def: tdef): TSymStr;
    var
      encoded: TSymStr;
    begin
      encoded:='';
      llvmaddencodedtype_intern(def,[],encoded);
      result:=encoded;
    end;
  { Appends the llvm encoding of def to encodedstr; inaggregate selects the
    lef_inaggregate flag, no other encode flags are passed on. }
  procedure llvmaddencodedtype(def: tdef; inaggregate: boolean; var encodedstr: TSymStr);
    var
      encodeflags: tllvmencodeflags;
    begin
      encodeflags:=[];
      if inaggregate then
        include(encodeflags,lef_inaggregate);
      llvmaddencodedtype_intern(def,encodeflags,encodedstr);
    end;
  { Appends the llvm struct encoding of a record/object to encodedstr, based
    on the entries of the llvm shadow symtable of def. The struct is emitted
    as a packed struct unless df_llvm_no_struct_packing is set in the
    defoptions of def. All entries are encoded with lef_inaggregate. }
  procedure llvmaddencodedabstractrecordtype(def: tabstractrecorddef; var encodedstr: TSymStr);
    var
      fields: tfpobjectlist;
      fieldnr,
      firstplain: longint;
      unpacked: boolean;
    begin
      fields:=tabstractrecordsymtable(def.symtable).llvmst.symdeflist;
      unpacked:=df_llvm_no_struct_packing in def.defoptions;
      if unpacked then
        encodedstr:=encodedstr+'{ '
      else
        encodedstr:=encodedstr+'<{ ';
      { index of the first entry that is encoded the regular way }
      firstplain:=0;
      if (fields.count>0) and
         (def.typ=objectdef) and
         assigned(tobjectdef(def).childof) and
         is_class_or_interface_or_dispinterface(tllvmshadowsymtableentry(fields[0]).def) then
        begin
          { insert the struct for the class rather than a pointer to the
            struct }
          if tllvmshadowsymtableentry(fields[0]).def.typ<>objectdef then
            internalerror(2008070601);
          llvmaddencodedtype_intern(tllvmshadowsymtableentry(fields[0]).def,[lef_inaggregate,lef_noimplicitderef],encodedstr);
          firstplain:=1;
        end;
      for fieldnr:=firstplain to fields.count-1 do
        begin
          { separator in front of every entry but the very first one }
          if fieldnr<>0 then
            encodedstr:=encodedstr+', ';
          llvmaddencodedtype_intern(tllvmshadowsymtableentry(fields[fieldnr]).def,[lef_inaggregate],encodedstr);
        end;
      if unpacked then
        encodedstr:=encodedstr+' }'
      else
        encodedstr:=encodedstr+' }>';
    end;
  { Detects implicit zero/sign extension of a parameter location.
      paradef:    def of the entire parameter
      paralocdef: def of the location; replaced by paradef when an extension
                  is detected
      signext:    lve_signext or lve_zeroext (depending on the signedness of
                  paradef) when both defs are ordinal and the parameter is
                  smaller than its location, lve_none otherwise }
  procedure llvmextractvalueextinfo(paradef: tdef; var paralocdef: tdef; out signext: tllvmvalueextension);
    begin
      signext:=lve_none;
      { implicit zero/sign extension for ABI compliance? (yes, if the size
        of a paraloc is larger than the size of the entire parameter) }
      if not(is_ordinal(paradef) and
             is_ordinal(paralocdef) and
             (paradef.size<paralocdef.size)) then
        exit;
      paralocdef:=paradef;
      if is_signed(paradef) then
        signext:=lve_signext
      else
        signext:=lve_zeroext;
    end;
  { Appends the llvm encoding of all locations of one parameter to
    encodedstr.
      hp:             the parameter
      proccalloption: calling convention of the routine the parameter
                      belongs to
      withparaname:   also emit the llvm name of every location; selects the
                      callee side locations (caller side otherwise)
      withattributes: also emit value extension, sret/noalias/nocapture and
                      byval attributes
      first:          true as long as nothing has been emitted for the
                      parameter list yet; cleared as soon as an entry is
                      added, and used to decide whether a ", " separator is
                      required
    A cdecl-style array of const parameter is emitted as "...".
    Triggers internalerror 2014010803 if a name is requested for a location
    whose llvmloc is not a LOC_REFERENCE. }
  procedure llvmaddencodedparaloctype(hp: tparavarsym; proccalloption: tproccalloption; withparaname, withattributes: boolean; var first: boolean; var encodedstr: TSymStr);
    var
      paraloc: PCGParaLocation;
      signext: tllvmvalueextension;
      usedef: tdef;
      isfirstpara: boolean;
    begin
      if (proccalloption in cdecl_pocalls) and
         is_array_of_const(hp.vardef) then
        begin
          if not first then
            encodedstr:=encodedstr+', '
          else
            first:=false;
          encodedstr:=encodedstr+'...';
          exit
        end;
      if withparaname then
        paraloc:=hp.paraloc[calleeside].location
      else
        paraloc:=hp.paraloc[callerside].location;
      repeat
        { remember whether this entry is the first one of the parameter
          list: "first" itself is cleared by the separator handling below,
          before the sret logic gets to look at it }
        isfirstpara:=first;
        usedef:=paraloc^.def;
        { implicit zero/sign extension for ABI compliance? }
        llvmextractvalueextinfo(hp.vardef,usedef,signext);
        if not first then
          encodedstr:=encodedstr+', '
        else
          first:=false;
        llvmaddencodedtype_intern(usedef,[],encodedstr);
        { in case signext<>lve_none, there should be only one paraloc -> no
          need to clear (reason: it means that the paraloc is larger than the
          original parameter) }
        if withattributes then
          encodedstr:=encodedstr+llvmvalueextension2str[signext];
        { sret: hidden pointer for structured function result }
        if vo_is_funcret in hp.varoptions then
          begin
            { "sret" is only valid for the first parameter, while in FPC this
              can sometimes be the second one (self comes before). In
              general, this is not a problem: we can just leave out sret
              (which means the result will be a bit less well optimised), but
              it is for AArch64: there, the sret parameter must be passed in
              a different register (-> paranr_result is smaller than
              paranr_self for that platform in symconst) }
{$ifdef aarch64}
            if not isfirstpara then
              internalerror(2015101404);
{$endif aarch64}
            if withattributes then
              if isfirstpara then
                encodedstr:=encodedstr+' sret'
              else { we can add some other attributes to optimise things }
                encodedstr:=encodedstr+' noalias nocapture';
          end
        else if not paramanager.push_addr_param(hp.varspez,hp.vardef,proccalloption) and
                llvmbyvalparaloc(paraloc) then
          begin
            { byval parameters are declared as pointers to their type }
            if withattributes then
              encodedstr:=encodedstr+'* byval'
            else
              encodedstr:=encodedstr+'*';
          end;
        if withparaname then
          begin
            if paraloc^.llvmloc.loc<>LOC_REFERENCE then
              internalerror(2014010803);
            encodedstr:=encodedstr+' '+llvmasmsymname(paraloc^.llvmloc.sym);
          end;
        paraloc:=paraloc^.next;
      until not assigned(paraloc);
    end;
  { Returns the llvm encoding of a procdef/procvardef as a fresh string; see
    llvmaddencodedproctype for the meaning of the parameters. }
  function llvmencodeproctype(def: tabstractprocdef; const customname: TSymStr; pddecltype: tllvmprocdefdecltype): TSymStr;
    var
      encoded: TSymStr;
    begin
      encoded:='';
      llvmaddencodedproctype(def,customname,pddecltype,encoded);
      result:=encoded;
    end;
  { Appends the llvm encoding of a routine type/header to encodedstr:
    result type, optionally the routine name, and the parameter list.
      def:        the procdef or procvardef to encode
      customname: name to use instead of the mangled name of the procdef
                  (only looked at when a name is emitted)
      pddecltype: context of the encoding; a name and result value extension
                  info are only emitted for lpd_decl and lpd_def (the name
                  only for procdefs), parameter names only for lpd_def, and
                  parameter attributes for everything except lpd_procvar and
                  lpd_alias }
  procedure llvmaddencodedproctype(def: tabstractprocdef; const customname: TSymStr; pddecltype: tllvmprocdefdecltype; var encodedstr: TSymStr);
    var
      resultdef: tdef;
      paraidx: longint;
      resultext: tllvmvalueextension;
      side: tcallercallee;
      isdeclordef,
      withparanames,
      withparaattrs,
      noparasyet: boolean;
    begin
      { when writing a definition, we have to write the parameter names, and
        those are only available on the callee side. In all other cases,
        we are at the callerside }
      if pddecltype=lpd_def then
        side:=calleeside
      else
        side:=callerside;
      def.init_paraloc_info(side);
      isdeclordef:=pddecltype in [lpd_decl,lpd_def];
      { function result (return-by-ref is handled explicitly) }
      if paramanager.ret_in_param(def.returndef,def) then
        begin
          encodedstr:=encodedstr+' ';
          llvmaddencodedtype(voidtype,false,encodedstr);
        end
      else
        begin
          resultdef:=llvmgetcgparadef(def.funcretloc[side],false);
          llvmextractvalueextinfo(def.returndef,resultdef,resultext);
          { specifying result sign extension information for an alias causes
            an error for some reason }
          if isdeclordef then
            encodedstr:=encodedstr+llvmvalueextension2str[resultext];
          encodedstr:=encodedstr+' ';
          llvmaddencodedtype_intern(resultdef,[],encodedstr);
        end;
      encodedstr:=encodedstr+' ';
      { add procname? }
      if isdeclordef and
         (def.typ=procdef) then
        begin
          if customname='' then
            encodedstr:=encodedstr+llvmmangledname(tprocdef(def).mangledname)
          else
            encodedstr:=encodedstr+llvmmangledname(customname);
        end;
      encodedstr:=encodedstr+'(';
      { parameters }
      withparanames:=pddecltype=lpd_def;
      withparaattrs:=not(pddecltype in [lpd_procvar,lpd_alias]);
      noparasyet:=true;
      for paraidx:=0 to def.paras.count-1 do
        llvmaddencodedparaloctype(tparavarsym(def.paras[paraidx]),def.proccalloption,withparanames,withparaattrs,noparasyet,encodedstr);
      if po_varargs in def.procoptions then
        begin
          if not noparasyet then
            encodedstr:=encodedstr+', ';
          encodedstr:=encodedstr+'...';
        end;
      encodedstr:=encodedstr+')';
    end;
  { Returns an internal recorddef with one field per entry of fieldtypes
    (named F0, F1, ...), creating it on first use and reusing it afterwards.
    The records are cached in current_module.llvmdefs under a type name that
    is built from the internal llvm struct prefix followed by a tag per
    field: i8/i16/i32/i64 for 8/16/32/64 bit ordinals, f32/f64 for
    single/double, and "d" plus the unique id of the def for every def that
    is neither an orddef nor a floatdef.
      fieldtypes: list of tdefs; only read by this routine
      packrecords, recordalignmin, maxcrecordalign: passed on to the
        recorddef constructor when the record has to be created
    Triggers internalerror 2014012001/2014012008 for unsupported ordinal/
    float types and 2014012002 when there is no current module. }
  function llvmgettemprecorddef(fieldtypes: tfplist; packrecords, recordalignmin, maxcrecordalign: shortint): trecorddef;
    var
      i: longint;
      res: PHashSetItem;
      hdef: tdef;
      typename: string;
    begin
      typename:=internaltypeprefixName[itp_llvmstruct];
      for i:=0 to fieldtypes.count-1 do
        begin
          hdef:=tdef(fieldtypes[i]);
          case hdef.typ of
            orddef:
              case torddef(hdef).ordtype of
                s8bit,
                u8bit:
                  typename:=typename+'i8';
                s16bit,
                u16bit:
                  typename:=typename+'i16';
                s32bit,
                u32bit:
                  typename:=typename+'i32';
                s64bit,
                u64bit:
                  typename:=typename+'i64';
                else
                  { other types should not appear currently, add as needed }
                  internalerror(2014012001);
              end;
            floatdef:
              case tfloatdef(hdef).floattype of
                s32real:
                  typename:=typename+'f32';
                s64real:
                  typename:=typename+'f64';
                else
                  { other types should not appear currently, add as needed }
                  internalerror(2014012008);
              end;
            else
              typename:=typename+'d'+hdef.unique_id_str;
          end;
        end;
      if not assigned(current_module) then
        internalerror(2014012002);
      { look up the record by its generated name; a fresh entry has no Data }
      res:=current_module.llvmdefs.FindOrAdd(@typename[1],length(typename));
      if not assigned(res^.Data) then
        begin
          res^.Data:=crecorddef.create_global_internal(typename,packrecords,
            recordalignmin,maxcrecordalign);
          for i:=0 to fieldtypes.count-1 do
            trecorddef(res^.Data).add_field_by_def('F'+tostr(i),tdef(fieldtypes[i]));
        end;
      { NOTE(review): executed for reused records as well, exactly as before;
        presumably harmless when repeated -- confirm against
        trecordsymtable.addalignmentpadding }
      trecordsymtable(trecorddef(res^.Data).symtable).addalignmentpadding;
      result:=trecorddef(res^.Data);
    end;
  { Returns the llvm-level def for a parameter or function result described
    by cgpara.
      - single location: the def of that location (or the def of the whole
        parameter if that one has size 0 and is not a special array). If
        beforevalueext is set, the def before zero/sign extension is used.
        comp and currency are replaced by s80floattype.
      - multiple locations: a temporary recorddef with one field per
        location, marked df_llvm_no_struct_packing }
  function llvmgetcgparadef(const cgpara: tcgpara; beforevalueext: boolean): tdef;
    var
      retdeflist: tfplist;
      retloc: pcgparalocation;
      usedef: tdef;
      valueext: tllvmvalueextension;
    begin
      { single location }
      if not assigned(cgpara.location^.next) then
        begin
          { def of the location, except in case of zero/sign-extension and
            zero-sized records }
          if not is_special_array(cgpara.def) and
             (cgpara.def.size=0) then
            usedef:=cgpara.def
          else
            usedef:=cgpara.location^.def;
          if beforevalueext then
            llvmextractvalueextinfo(cgpara.def,usedef,valueext);
          { comp and currency are handled by the x87 in this case. They cannot
            be represented directly in llvm, and llvmdef translates them into
            i64 (since that's their storage size and internally they also are
            int64). Solve this by changing the type to s80real in the
            returndef/parameter declaration. }
          if (usedef.typ=floatdef) and
             (tfloatdef(usedef).floattype in [s64comp,s64currency]) then
            usedef:=s80floattype;
          result:=usedef;
          exit
        end;
      { multiple locations -> create temp record }
      retdeflist:=tfplist.create;
      retloc:=cgpara.location;
      repeat
        retdeflist.add(retloc^.def);
        retloc:=retloc^.next;
      until not assigned(retloc);
      result:=llvmgettemprecorddef(retdeflist,C_alignment,
        targetinfos[target_info.system]^.alignment.recordalignmin,
        targetinfos[target_info.system]^.alignment.maxCrecordalign);
      { llvmgettemprecorddef only reads the list, so release it here instead
        of leaking one list per call }
      retdeflist.free;
      include(result.defoptions,df_llvm_no_struct_packing);
    end;
  { Returns the llvm encoding of def for its own type declaration: encoded
    with lef_typedecl, so that the type is expanded rather than referred to
    by name. }
  function llvmencodetypedecl(def: tdef): TSymStr;
    var
      encoded: TSymStr;
    begin
      encoded:='';
      llvmaddencodedtype_intern(def,[lef_typedecl],encoded);
      result:=encoded;
    end;
  851. end.