llvmdef.pas 40 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026
  1. {
  2. Copyright (c) 2013 by Jonas Maebe
  3. This unit implements some LLVM type helper routines.
  4. This program is free software; you can redistribute it and/or modify
  5. it under the terms of the GNU General Public License as published by
  6. the Free Software Foundation; either version 2 of the License, or
  7. (at your option) any later version.
  8. This program is distributed in the hope that it will be useful,
  9. but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  11. GNU General Public License for more details.
  12. You should have received a copy of the GNU General Public License
  13. along with this program; if not, write to the Free Software
  14. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  15. ****************************************************************************
  16. }
  17. {$i fpcdefs.inc}
  18. unit llvmdef;
  19. interface
  20. uses
  21. cclasses,globtype,
  22. aasmbase,
  23. parabase,
  24. symbase,symtype,symdef,
  25. llvmbase;
  26. type
  27. { there are four different circumstances in which procdefs are used:
  28. a) definition of a procdef that's implemented in the current module
  29. b) declaration of an external routine that's called in the current one
  30. c) alias declaration of a procdef implemented in the current module
  31. d) defining a procvar type
  32. The main differences between the contexts are:
  33. a) information about sign extension of result type, proc name, parameter names & sign-extension info & types
  34. b) information about sign extension of result type, proc name, no parameter names, with parameter sign-extension info & types
  35. c) no information about sign extension of result type, proc name, no parameter names, no information about sign extension of parameters, parameter types
  36. d) no information about sign extension of result type, no proc name, no parameter names, no information about sign extension of parameters, parameter types
  37. }
  38. tllvmprocdefdecltype = (lpd_def,lpd_decl,lpd_alias,lpd_procvar);
  39. { returns the identifier to use as typename for a def in llvm (llvm only
  40. allows naming struct types) -- only supported for defs with a typesym, and
  41. only for tabstractrecorddef descendants and complex procvars }
  42. function llvmtypeidentifier(def: tdef): TSymStr;
  43. { encode a type into the internal format used by LLVM (for a type
  44. declaration) }
  45. function llvmencodetypedecl(def: tdef): TSymStr;
  46. { same as above, but use a type name if possible (for any use) }
  47. function llvmencodetypename(def: tdef): TSymStr;
  48. { encode a procdef/procvardef into the internal format used by LLVM }
  49. function llvmencodeproctype(def: tabstractprocdef; const customname: TSymStr; pddecltype: tllvmprocdefdecltype): TSymStr;
  50. { incremental version of the above }
  51. procedure llvmaddencodedproctype(def: tabstractprocdef; const customname: TSymStr; pddecltype: tllvmprocdefdecltype; var encodedstr: TSymStr);
  52. { function result types may have to be represented differently, e.g. a
  53. record consisting of 4 longints must be returned as a record consisting of
  54. two int64's on x86-64. This function is used to create (and reuse)
  55. temporary recorddefs for such purposes.}
  56. function llvmgettemprecorddef(fieldtypes: array of tdef; packrecords, recordalignmin, maxcrecordalign: shortint): trecorddef;
  57. { get the llvm type corresponding to a parameter, e.g. a record containing
  58. two int64 fields for an arbitrary record split over two individual int64
  59. parameters, or an int32 for an int16 parameter on a platform that requires
  60. such parameters to be zero/sign extended. The second parameter can be used
  61. to get the type before zero/sign extension, as e.g. required to generate
  62. function declarations. }
  63. function llvmgetcgparadef(const cgpara: tcgpara; beforevalueext: boolean): tdef;
  64. { can be used to extract the value extension info from a cgpara. Pass in
  65. the def of the cgpara as first parameter and a local variable holding
  66. a copy of the def of the location (value extension only makes sense for
  67. ordinal parameters that are smaller than a single location). The routine
  68. will return the def of the location without sign extension (if applicable)
  69. and the kind of sign extension that was originally performed in the
  70. signext parameter }
  71. procedure llvmextractvalueextinfo(paradef: tdef; var paralocdef: tdef; out signext: tllvmvalueextension);
  72. { returns whether a paraloc should be translated into an llvm "byval"
  73. parameter. These are declared as pointers to a particular type, but
  74. usually turned into copies onto the stack. The exact behaviour for
  75. parameters that should be passed in registers is undefined and depends on
  76. the platform, and furthermore this modifier sometimes inhibits
  77. optimizations. As a result, we only use it for aggregate parameters of
  78. which we know that they should be passed on the stack }
  79. function llvmbyvalparaloc(paraloc: pcgparalocation): boolean;
  80. { returns whether a def is represented by an aggregate type in llvm
  81. (struct, array) }
  82. function llvmaggregatetype(def: tdef): boolean;
  83. function llvmconvop(var fromsize, tosize: tdef; inregs: boolean): tllvmop;
  84. { mangle a global identifier so that it's recognised by LLVM as a global
  85. (in the sense of module-global) label and so that it won't mangle the
  86. name further according to platform conventions (we already did that) }
  87. function llvmmangledname(const s: TSymStr): TSymStr;
  88. function llvmasmsymname(const sym: TAsmSymbol): TSymStr;
  89. implementation
  90. uses
  91. globals,cutils,constexp,
  92. verbose,systems,
  93. fmodule,
  94. symtable,symconst,symsym,
  95. llvmsym,hlcgobj,
  96. defutil,blockutl,cgbase,paramgr,
  97. cpubase;
  98. {******************************************************************
  99. Type encoding
  100. *******************************************************************}
  { Returns the quoted LLVM type identifier of a def: the literal prefix
    %"typ. followed by the def's full owner hierarchy name, the real name of
    its type symbol and a closing double quote.
    Triggers internal error 2015041901 if the def has no type symbol. }
  function llvmtypeidentifier(def: tdef): TSymStr;
    begin
      if assigned(def.typesym) then
        result:='%"typ.'+def.fullownerhierarchyname(false)+def.typesym.realname+'"'
      else
        internalerror(2015041901);
    end;
  { Returns true if the def is treated as an llvm aggregate: records, files,
    variants, non-dynamic arrays, sets that are not small sets, shortstrings,
    objects, and procvars that are more than a bare address. }
  function llvmaggregatetype(def: tdef): boolean;
    begin
      { every test below that succeeds yields "true"; the tests are tried in
        the same order as a short-circuit "or" chain }
      result:=true;
      if def.typ in [recorddef,filedef,variantdef] then
        exit;
      if (def.typ=arraydef) and
         not is_dynamic_array(def) then
        exit;
      if (def.typ=setdef) and
         not is_smallset(def) then
        exit;
      if is_shortstring(def) then
        exit;
      if is_object(def) then
        exit;
      { last candidate: procvars that are not address-only }
      result:=
        (def.typ=procvardef) and
        not tprocvardef(def).is_addressonly;
    end;
  { Selects the llvm conversion opcode needed to convert a value of type
    fromsize into a value of type tosize.

    fromsize/tosize are var parameters: when inregs is set and one of them is
    a comp/currency float type, it is replaced by sc80floattype (such values
    are treated as extended while in registers; see the comment at the start
    of thlcgobj.a_loadfpu_ref_reg).

    Triggers internal error 2014062203 for a size-changing conversion from an
    fpu/mm register type to a non fpu/mm register type, and 2016052001 for a
    same-size conversion from a cbool type to llvmbool1type. }
  function llvmconvop(var fromsize, tosize: tdef; inregs: boolean): tllvmop;

    { byte size used for the size comparison; may replace d as described in
      the header comment of llvmconvop }
    function valuebytesize(var d: tdef): asizeint;
      begin
        if not inregs or
           (d.typ<>floatdef) then
          begin
            result:=d.size;
            exit;
          end;
        if tfloatdef(d).floattype in [s64comp,s64currency] then
          d:=sc80floattype;
        { at the value level, s80real and sc80real are the same }
        if tfloatdef(d).floattype=s80real then
          result:=sc80floattype.size
        else
          result:=d.size;
      end;

    var
      srcregtyp,
      dstregtyp: tregistertype;
      srcbytes,
      dstbytes: asizeint;
    begin
      srcregtyp:=chlcgobj.def2regtyp(fromsize);
      dstregtyp:=chlcgobj.def2regtyp(tosize);

      { pointer to something }
      if srcregtyp=R_ADDRESSREGISTER then
        begin
          if dstregtyp=R_INTREGISTER then
            result:=la_ptrtoint
          else if dstregtyp=R_ADDRESSREGISTER then
            result:=la_bitcast
          else
            result:=la_ptrtoint_to_x;
          exit;
        end;

      { something (not a pointer, that was handled above) to pointer }
      if dstregtyp=R_ADDRESSREGISTER then
        begin
          if srcregtyp=R_INTREGISTER then
            result:=la_inttoptr
          else
            result:=la_x_to_inttoptr;
          exit;
        end;

      { source first, then destination }
      srcbytes:=valuebytesize(fromsize);
      dstbytes:=valuebytesize(tosize);

      { need zero/sign extension, float truncation or plain bitcast? }
      if dstbytes<>srcbytes then
        begin
          if srcregtyp in [R_FPUREGISTER,R_MMREGISTER] then
            begin
              { todo: update once we support vectors }
              if not(dstregtyp in [R_FPUREGISTER,R_MMREGISTER]) then
                internalerror(2014062203);
              if dstbytes<srcbytes then
                result:=la_fptrunc
              else
                result:=la_fpext;
            end
          else if dstbytes<srcbytes then
            result:=la_trunc
          else if is_signed(fromsize) then
            { fromsize is signed -> sign extension }
            result:=la_sext
          else
            result:=la_zext;
        end
      else if (fromsize=llvmbool1type) and
              (tosize<>llvmbool1type) then
        begin
          if is_cbool(tosize) then
            result:=la_sext
          else
            result:=la_zext;
        end
      else if (tosize=llvmbool1type) and
              (fromsize<>llvmbool1type) then
        begin
          { would have to compare with 0, can't just take the lowest bit }
          if is_cbool(fromsize) then
            internalerror(2016052001)
          else
            result:=la_trunc;
        end
      else
        result:=la_bitcast;
    end;
  { Turns a symbol name into an llvm global identifier.

    - names starting with 'llvm.' only get an '@' prepended
    - names that already start with a double quote get '@' prepended and
      '\01' inserted right after the opening quote
    - all other names (including the empty name) are wrapped as @"\01name"

    The '\01' prefix is there so that llvm does not mangle the name further
    according to platform conventions. }
  function llvmmangledname(const s: TSymStr): TSymStr;
    begin
      if copy(s,1,length('llvm.'))='llvm.' then
        result:='@'+s
      { check for an empty name first so that s[1] is never read out of range }
      else if (s<>'') and
              (s[1]='"') then
        begin
          { already quoted -> insert \01 and prepend @ }
          result:='@'+s;
          insert('\01',result,3);
        end
      else
        result:='@"\01'+s+'"';
    end;
  { Returns the llvm spelling of an assembler symbol:
      - AB_TEMP symbols:               %name
      - AT_LABEL/AT_ADDR symbols:      label %name
      - everything else:               llvmmangledname(name)
    AT_ADDR and AT_LABEL represent labels in the code, which have a different
    type in llvm compared to (global) data labels. }
  function llvmasmsymname(const sym: TAsmSymbol): TSymStr;
    begin
      if sym.bind=AB_TEMP then
        result:='%'+sym.name
      else if sym.typ in [AT_LABEL,AT_ADDR] then
        result:='label %'+sym.name
      else
        result:=llvmmangledname(sym.name);
    end;
  { Decides whether a parameter location is emitted as an llvm "byval"
    parameter.

    "byval" is broken for register paras on several platforms in llvm
    (search for "byval" in llvm's bug tracker). Additionally, it should only
    be used to pass aggregate parameters on the stack, because it reportedly
    inhibits llvm's midlevel optimizers.
    Exception (for now?): parameters that have special shifting
    requirements, because modelling those in llvm is not easy (and neither
    clang nor llvm-gcc seem to do so either). }
  function llvmbyvalparaloc(paraloc: pcgparalocation): boolean;
    begin
      case paraloc^.loc of
        LOC_REFERENCE:
          { in memory: only for aggregates }
          result:=llvmaggregatetype(paraloc^.def);
        LOC_REGISTER,
        LOC_CREGISTER:
          { in a register: only when the value has to be shifted }
          result:=paraloc^.shiftval<>0;
        else
          result:=false;
      end;
    end;
  procedure llvmaddencodedabstractrecordtype(def: tabstractrecorddef; var encodedstr: TSymStr); forward;

  type
    tllvmencodeflag = (lef_inaggregate, lef_noimplicitderef, lef_typedecl);
    tllvmencodeflags = set of tllvmencodeflag;

  { Appends the llvm type encoding of def to encodedstr.

    flags:
      lef_inaggregate     - the type is encoded as an element of an
                            aggregate (affects e.g. s80real, and makes named
                            records/procvars be referred to by name)
      lef_noimplicitderef - do not add the pointer suffix for implicit
                            pointer object types/interfaces
      lef_typedecl        - the encoding is for a type declaration, so the
                            body is written rather than the type name

    Triggers an internal error for def kinds or sub-kinds that have no
    encoding here. }
  procedure llvmaddencodedtype_intern(def: tdef; const flags: tllvmencodeflags; var encodedstr: TSymStr);

    { append a piece of text to the result }
    procedure emit(const s: TSymStr);
      begin
        encodedstr:=encodedstr+s;
      end;

    var
      { flags used when encoding a system helper record in place of def:
        always "in aggregate", lef_typedecl inherited from the caller }
      memberflags: tllvmencodeflags;
      { refer to a named type by its identifier rather than writing it out? }
      usetypename,
      { may an implicit pointer suffix be added? }
      implicitderef,
      { typed file with an ISO-like get/put buffer? }
      isobuffer: boolean;
    begin
      memberflags:=[lef_inaggregate]+[lef_typedecl]*flags;
      usetypename:=
        (lef_inaggregate in flags) or
        not(lef_typedecl in flags);
      implicitderef:=[lef_typedecl,lef_noimplicitderef]*flags=[];

      case def.typ of
        stringdef :
          begin
            case tstringdef(def).stringtype of
              st_widestring,
              st_unicodestring:
                { the variable does not point to the header, but to a
                  null-terminated string/array with undefined bounds }
                emit('i16*');
              st_ansistring:
                emit('i8*');
              st_shortstring:
                { length byte followed by string bytes }
                if tstringdef(def).len>0 then
                  emit('['+tostr(tstringdef(def).len+1)+' x i8]')
                else
                  emit('[0 x i8]');
              else
                internalerror(2013100201);
            end;
          end;
        enumdef:
          emit('i'+tostr(def.size*8));
        orddef :
          begin
            if is_void(def) then
              emit('void')
            { mainly required because comparison operations return i1, and
              we need a way to represent the i1 type in Pascal. We don't
              reuse pasbool1type, because putting an i1 in a record or
              passing it as a parameter may result in unexpected behaviour }
            else if def=llvmbool1type then
              emit('i1')
            else if torddef(def).ordtype=customint then
              emit('i'+tostr(def.packedbitsize))
            else
              emit('i'+tostr(def.size*8));
          end;
        pointerdef :
          begin
            if is_voidpointer(def) then
              emit('i8*')
            else
              begin
                llvmaddencodedtype_intern(tpointerdef(def).pointeddef,[],encodedstr);
                emit('*');
              end;
          end;
        floatdef :
          begin
            case tfloatdef(def).floattype of
              s32real:
                emit('float');
              s64real:
                emit('double');
              { necessary to be able to force our own size/alignment }
              s80real:
                { prevent llvm from allocating the standard ABI size for
                  extended }
                if lef_inaggregate in flags then
                  emit('[10 x i8]')
                else
                  emit('x86_fp80');
              sc80real:
                emit('x86_fp80');
              s64comp,
              s64currency:
                emit('i64');
              s128real:
{$if defined(powerpc) or defined(powerpc128)}
                emit('ppc_fp128');
{$else}
                emit('fp128');
{$endif}
              else
                internalerror(2013100202);
            end;
          end;
        filedef :
          begin
            case tfiledef(def).filetyp of
              ft_text :
                llvmaddencodedtype_intern(search_system_type('TEXTREC').typedef,memberflags,encodedstr);
              ft_typed :
                begin
                  { in case of ISO-like I/O, the typed file def includes a
                    get/put buffer of the size of the file's elements; the
                    file record and the buffer are then wrapped in a packed
                    struct }
                  isobuffer:=
                    (m_isolike_io in current_settings.modeswitches) and
                    not is_void(tfiledef(def).typedfiledef);
                  if isobuffer then
                    emit('<{');
                  llvmaddencodedtype_intern(search_system_type('FILEREC').typedef,memberflags,encodedstr);
                  if isobuffer then
                    emit(',['+tostr(tfiledef(def).typedfiledef.size)+' x i8]}>');
                end;
              ft_untyped :
                llvmaddencodedtype_intern(search_system_type('FILEREC').typedef,memberflags,encodedstr);
              else
                internalerror(2013100203);
            end;
          end;
        recorddef :
          begin
            { avoid endlessly recursive definitions }
            if assigned(def.typesym) and
               usetypename then
              emit(llvmtypeidentifier(def))
            else
              llvmaddencodedabstractrecordtype(trecorddef(def),encodedstr);
          end;
        variantdef :
          llvmaddencodedtype_intern(search_system_type('TVARDATA').typedef,memberflags,encodedstr);
        classrefdef :
          begin
            if is_class(tclassrefdef(def).pointeddef) then
              begin
                llvmaddencodedtype_intern(tobjectdef(tclassrefdef(def).pointeddef).vmt_def,flags,encodedstr);
                emit('*');
              end
            else if is_objcclass(tclassrefdef(def).pointeddef) then
              llvmaddencodedtype_intern(objc_idtype,flags,encodedstr)
            else
              emit('i8*');
          end;
        setdef :
          begin
            { just an array as far as llvm is concerned; don't use a "packed
              array of i1" or so, this requires special support in backends
              and guarantees nothing about the internal format }
            if is_smallset(def) then
              llvmaddencodedtype_intern(cgsize_orddef(def_cgsize(def)),[lef_inaggregate],encodedstr)
            else
              emit('['+tostr(tsetdef(def).size)+' x i8]');
          end;
        formaldef :
          { var/const/out x (always treated as "pass by reference" -> don't
            add extra "*" here) }
          emit('i8');
        arraydef :
          begin
            if is_array_of_const(def) then
              begin
                emit('[0 x ');
                llvmaddencodedtype_intern(search_system_type('TVARREC').typedef,[lef_inaggregate],encodedstr);
                emit(']');
              end
            else if is_open_array(def) then
              begin
                emit('[0 x ');
                llvmaddencodedtype_intern(tarraydef(def).elementdef,[lef_inaggregate],encodedstr);
                emit(']');
              end
            else if is_dynamic_array(def) then
              begin
                llvmaddencodedtype_intern(tarraydef(def).elementdef,[lef_inaggregate],encodedstr);
                emit('*');
              end
            else if is_packed_array(def) and
                    (tarraydef(def).elementdef.typ in [enumdef,orddef]) then
              begin
                { encode as an array of bytes rather than as an array of
                  packedbitsloadsize(elesize), because even if the load size
                  is e.g. 2 bytes, the array may only be 1 or 3 bytes long
                  (and if this array is inside a record, it must not be
                  encoded as a type that is too long) }
                emit('['+tostr(tarraydef(def).size)+' x ');
                llvmaddencodedtype_intern(u8inttype,[lef_inaggregate],encodedstr);
                emit(']');
              end
            else
              begin
                emit('['+tostr(tarraydef(def).elecount)+' x ');
                llvmaddencodedtype_intern(tarraydef(def).elementdef,[lef_inaggregate],encodedstr);
                emit(']');
              end;
          end;
        procdef,
        procvardef :
          begin
            if (def.typ=procdef) or
               tprocvardef(def).is_addressonly then
              begin
                llvmaddencodedproctype(tabstractprocdef(def),'',lpd_procvar,encodedstr);
                if def.typ=procvardef then
                  emit('*');
              end
            else if usetypename and
                    assigned(tprocvardef(def).typesym) then
              begin
                { in case the procvardef recursively references itself, e.g.
                  via a pointer }
                emit(llvmtypeidentifier(def));
                { blocks are implicit pointers }
                if is_block(def) then
                  emit('*');
              end
            else if is_block(def) then
              llvmaddencodedtype_intern(get_block_literal_type_for_proc(tabstractprocdef(def)),flags,encodedstr)
            else
              begin
                { packed struct of a code pointer and a data pointer }
                emit('<{');
                { code pointer }
                llvmaddencodedproctype(tabstractprocdef(def),'',lpd_procvar,encodedstr);
                { data pointer (maybe todo: generate actual layout if
                  available) }
                emit('*, i8*}>');
              end;
          end;
        objectdef :
          case tobjectdef(def).objecttype of
            odt_class,
            odt_objcclass,
            odt_object,
            odt_cppclass:
              begin
                if not(lef_typedecl in flags) and
                   assigned(def.typesym) then
                  emit(llvmtypeidentifier(def))
                else
                  llvmaddencodedabstractrecordtype(tabstractrecorddef(def),encodedstr);
                if implicitderef and
                   is_implicit_pointer_object_type(def) then
                  emit('*');
              end;
            odt_interfacecom,
            odt_interfacecorba,
            odt_dispinterface:
              begin
                { type is a pointer to a pointer to the vmt }
                llvmaddencodedtype_intern(tobjectdef(def).vmt_def,flags,encodedstr);
                if implicitderef then
                  emit('**');
              end;
            odt_interfacecom_function,
            odt_interfacecom_property,
            odt_objcprotocol:
              { opaque for now }
              emit('i8*');
            odt_helper:
              llvmaddencodedtype_intern(tobjectdef(def).extendeddef,flags,encodedstr);
            else
              internalerror(2013100601);
          end;
        undefineddef,
        errordef :
          internalerror(2013100604);
        else
          internalerror(2013100603);
      end;
    end;
  { Returns the llvm encoding of def as used when referring to the type:
    the encoder is run with an empty flag set on an empty string. }
  function llvmencodetypename(def: tdef): TSymStr;
    var
      encoded: TSymStr;
    begin
      encoded:='';
      llvmaddencodedtype_intern(def,[],encoded);
      result:=encoded;
    end;
  { Appends the llvm encoding of def to encodedstr; inaggregate selects
    whether the lef_inaggregate flag is passed on to the encoder. }
  procedure llvmaddencodedtype(def: tdef; inaggregate: boolean; var encodedstr: TSymStr);
    begin
      if inaggregate then
        llvmaddencodedtype_intern(def,[lef_inaggregate],encodedstr)
      else
        llvmaddencodedtype_intern(def,[],encodedstr);
    end;
  { Appends the llvm struct encoding of a record/object to encodedstr, using
    the entries of the llvm shadow symtable of the def as fields.

    The struct is written as a packed struct unless the def has the
    df_llvm_no_struct_packing option. For an object type with a parent whose
    first shadow entry is a class/interface/dispinterface, that first entry
    is written as the struct itself rather than as a pointer to it. }
  procedure llvmaddencodedabstractrecordtype(def: tabstractrecorddef; var encodedstr: TSymStr);
    const
      { indexed by "struct packing disabled" }
      opener: array[boolean] of string[3] = ('<{ ','{ ');
      closer: array[boolean] of string[3] = (' }>',' }');
    var
      fields: tfpobjectlist;
      idx: longint;
      unpacked: boolean;
    begin
      fields:=tabstractrecordsymtable(def.symtable).llvmst.symdeflist;
      unpacked:=df_llvm_no_struct_packing in def.defoptions;
      encodedstr:=encodedstr+opener[unpacked];
      idx:=0;
      if (fields.count>0) and
         (def.typ=objectdef) and
         assigned(tobjectdef(def).childof) and
         is_class_or_interface_or_dispinterface(tllvmshadowsymtableentry(fields[0]).def) then
        begin
          { insert the struct for the class rather than a pointer to the struct }
          if tllvmshadowsymtableentry(fields[0]).def.typ<>objectdef then
            internalerror(2008070601);
          llvmaddencodedtype_intern(tllvmshadowsymtableentry(fields[0]).def,[lef_inaggregate,lef_noimplicitderef],encodedstr);
          idx:=1;
        end;
      { remaining fields, comma separated }
      while idx<fields.count do
        begin
          if idx<>0 then
            encodedstr:=encodedstr+', ';
          llvmaddencodedtype_intern(tllvmshadowsymtableentry(fields[idx]).def,[lef_inaggregate],encodedstr);
          inc(idx);
        end;
      encodedstr:=encodedstr+closer[unpacked];
    end;
  { Determines whether a parameter location implies a zero/sign extension.

    If both paradef and paralocdef are ordinal and paradef is smaller than
    paralocdef, paralocdef is replaced by paradef and signext is set to
    lve_signext (signed paradef) or lve_zeroext. In all other cases
    paralocdef is left alone and signext is lve_none. }
  procedure llvmextractvalueextinfo(paradef: tdef; var paralocdef: tdef; out signext: tllvmvalueextension);
    begin
      signext:=lve_none;
      { implicit zero/sign extension for ABI compliance? (yes, if the size
        of a paraloc is larger than the size of the entire parameter) }
      if not is_ordinal(paradef) or
         not is_ordinal(paralocdef) or
         (paradef.size>=paralocdef.size) then
        exit;
      paralocdef:=paradef;
      if is_signed(paradef) then
        signext:=lve_signext
      else
        signext:=lve_zeroext;
    end;
  { Appends the llvm encoding of one parameter to encodedstr: one entry per
    parameter location, separated by ', '.

    hp             - the parameter
    proccalloption - calling convention of the routine the parameter is for
    withparaname   - also write the llvm name of each location; selects the
                     callee side parameter locations (caller side otherwise)
    withattributes - also write parameter attributes (value extension, sret,
                     byval, nocapture, dereferenceable...)
    first          - true as long as nothing has been written to the
                     parameter list yet; cleared once something is written
    encodedstr     - string to append to

    An array of const parameter of a cdecl-style routine is written as '...'.
    Parameters whose location is empty are skipped. }
  procedure llvmaddencodedparaloctype(hp: tparavarsym; proccalloption: tproccalloption; withparaname, withattributes: boolean; var first: boolean; var encodedstr: TSymStr);
    var
      para: PCGPara;
      paraloc: PCGParaLocation;
      side: tcallercallee;
      signext: tllvmvalueextension;
      usedef: tdef;
      firstloc: boolean;
    begin
      if (proccalloption in cdecl_pocalls) and
         is_array_of_const(hp.vardef) then
        begin
          if not first then
            encodedstr:=encodedstr+', '
          else
            first:=false;
          encodedstr:=encodedstr+'...';
          exit
        end;
      if not withparaname then
        side:=callerside
      else
        side:=calleeside;
      { don't add parameters that don't take up registers or stack space;
        clang doesn't either and some LLVM backends don't support them }
      if hp.paraloc[side].isempty then
        exit;
      para:=@hp.paraloc[side];
      paraloc:=para^.location;
      firstloc:=true;
      repeat
        { implicit zero/sign extension for ABI compliance? }
        usedef:=paraloc^.def;
        llvmextractvalueextinfo(hp.vardef,usedef,signext);
        if not first then
          encodedstr:=encodedstr+', ';
        llvmaddencodedtype_intern(usedef,[],encodedstr);
        { in case signext<>lve_none, there should be only one paraloc -> no
          need to clear (reason: it means that the paraloc is larger than the
          original parameter) }
        if withattributes then
          encodedstr:=encodedstr+llvmvalueextension2str[signext];
        { sret: hidden pointer for structured function result }
        if vo_is_funcret in hp.varoptions then
          begin
            { "sret" is only valid for the first parameter, while in FPC this
              can sometimes be the second one (self comes before). In
              general, this is not a problem: we can just leave out sret
              (which means the result will be a bit less well optimised),
              but it is for AArch64: there, the sret parameter must be passed
              in a different register (-> paranr_result is smaller than
              paranr_self for that platform in symconst) }
{$ifdef aarch64}
            if not first then
              internalerror(2015101404);
{$endif aarch64}
            if withattributes then
              if first then
                encodedstr:=encodedstr+' sret noalias nocapture'
              else
                encodedstr:=encodedstr+' noalias nocapture';
          end
        else if not paramanager.push_addr_param(hp.varspez,hp.vardef,proccalloption) and
           llvmbyvalparaloc(paraloc) then
          begin
            { byval parameters are declared as a pointer to their type }
            if withattributes then
              begin
                encodedstr:=encodedstr+'* byval';
                { the alignment is only written for the first location, and
                  only if it differs from the standard parameter alignment }
                if firstloc and
                   (para^.alignment<>std_param_align) then
                  begin
                    encodedstr:=encodedstr+' align '+tostr(para^.alignment);
                  end;
              end
            else
              encodedstr:=encodedstr+'*';
          end
        else if withattributes and
           paramanager.push_addr_param(hp.varspez,hp.vardef,proccalloption) then
          begin
            { it's not valid to take the address of a parameter and store it for
              use past the end of the function call (since the address can always
              be on the stack and become invalid later) }
            encodedstr:=encodedstr+' nocapture';
            { open array/array of const/variant array may be a valid pointer but empty }
            if not is_special_array(hp.vardef) and
               { e.g. empty records }
               (hp.vardef.size<>0) then
              begin
                case hp.varspez of
                  vs_value,
                  vs_const:
                    begin
                      encodedstr:=encodedstr+' dereferenceable('
                    end;
                  vs_var,
                  vs_out,
                  vs_constref:
                    begin
                      { while normally these are not nil, it is technically possible
                        to pass nil via ptrtype(nil)^ }
                      encodedstr:=encodedstr+' dereferenceable_or_null('
                    end;
                  else
                    internalerror(2018120801);
                end;
                { formal parameters are declared with 1 dereferenceable
                  byte, everything else with the size of its type }
                if hp.vardef.typ<>formaldef then
                  encodedstr:=encodedstr+tostr(hp.vardef.size)+')'
                else
                  encodedstr:=encodedstr+'1)';
              end;
          end;
        if withparaname then
          begin
            if paraloc^.llvmloc.loc<>LOC_REFERENCE then
              internalerror(2014010803);
            encodedstr:=encodedstr+' '+llvmasmsymname(paraloc^.llvmloc.sym);
          end;
        paraloc:=paraloc^.next;
        firstloc:=false;
        first:=false;
      until not assigned(paraloc);
    end;
  { Returns the llvm encoding of a procdef/procvardef; the non-incremental
    counterpart of llvmaddencodedproctype, started from an empty string. }
  function llvmencodeproctype(def: tabstractprocdef; const customname: TSymStr; pddecltype: tllvmprocdefdecltype): TSymStr;
    var
      encoded: TSymStr;
    begin
      encoded:='';
      llvmaddencodedproctype(def,customname,pddecltype,encoded);
      result:=encoded;
    end;
  { Appends the llvm encoding of a procdef/procvardef to encodedstr:
    result type (with value extension info for lpd_decl/lpd_def), routine
    name (only for procdefs with lpd_decl/lpd_def; customname overrides the
    mangled name when it is not empty) and the parenthesised parameter list.

    Parameter names are only written for lpd_def; parameter attributes are
    written for everything except lpd_procvar and lpd_alias. }
  procedure llvmaddencodedproctype(def: tabstractprocdef; const customname: TSymStr; pddecltype: tllvmprocdefdecltype; var encodedstr: TSymStr);
    var
      retdef: tdef;
      idx: longint;
      retext: tllvmvalueextension;
      side: tcallercallee;
      nothingwritten,
      fulldecl,
      withnames,
      withattrs: boolean;
    begin
      fulldecl:=pddecltype in [lpd_decl,lpd_def];
      withnames:=pddecltype=lpd_def;
      withattrs:=not(pddecltype in [lpd_procvar,lpd_alias]);

      { when writing a definition, we have to write the parameter names, and
        those are only available on the callee side. In all other cases,
        we are at the callerside }
      if withnames then
        side:=calleeside
      else
        side:=callerside;
      def.init_paraloc_info(side);

      { function result (return-by-ref is handled explicitly) }
      if paramanager.ret_in_param(def.returndef,def) then
        begin
          { result is returned via a parameter -> the llvm result is void }
          encodedstr:=encodedstr+' ';
          llvmaddencodedtype_intern(voidtype,[],encodedstr);
        end
      else
        begin
          retdef:=llvmgetcgparadef(def.funcretloc[side],false);
          llvmextractvalueextinfo(def.returndef,retdef,retext);
          { specifying result sign extension information for an alias causes
            an error for some reason }
          if fulldecl then
            encodedstr:=encodedstr+llvmvalueextension2str[retext];
          encodedstr:=encodedstr+' ';
          llvmaddencodedtype_intern(retdef,[],encodedstr);
        end;
      encodedstr:=encodedstr+' ';

      { add procname? }
      if fulldecl and
         (def.typ=procdef) then
        begin
          if customname<>'' then
            encodedstr:=encodedstr+llvmmangledname(customname)
          else
            encodedstr:=encodedstr+llvmmangledname(tprocdef(def).mangledname);
        end;

      { parameters }
      encodedstr:=encodedstr+'(';
      nothingwritten:=true;
      for idx:=0 to def.paras.count-1 do
        llvmaddencodedparaloctype(tparavarsym(def.paras[idx]),def.proccalloption,withnames,withattrs,nothingwritten,encodedstr);
      if po_varargs in def.procoptions then
        begin
          if not nothingwritten then
            encodedstr:=encodedstr+', ';
          encodedstr:=encodedstr+'...';
        end;
      encodedstr:=encodedstr+')';
    end;
  { Returns a record definition whose fields have the types listed in
    fieldtypes, creating it on first use.

    A type name is derived from the field types (internaltypeprefixName
    [itp_llvmstruct] followed by one tag per field) and used as the key in
    current_module.llvmdefs. If the entry has no record attached yet, a new
    global internal record is created with the given packrecords,
    recordalignmin and maxcrecordalign, and one field "F<index>" is added per
    entry of fieldtypes. addalignmentpadding is invoked on the record's
    symtable on every call, whether the record was just created or found.

    Raises internalerror 2014012001/2014012008 for ordinal/float field types
    that have no tag, and 2014012002 when there is no current module.

    NOTE(review): the lookup key only encodes the field types, not
    packrecords/recordalignmin/maxcrecordalign, so a later call with the same
    field types but different alignment settings gets the previously created
    record - presumably callers always use consistent settings; confirm. }
  function llvmgettemprecorddef(fieldtypes: array of tdef; packrecords, recordalignmin, maxcrecordalign: shortint): trecorddef;
    var
      i: longint;
      res: PHashSetItem;
      hdef: tdef;
      typename: string;
    begin
      { build the lookup name: prefix + one tag per field type }
      typename:=internaltypeprefixName[itp_llvmstruct];
      for i:=low(fieldtypes) to high(fieldtypes) do
        begin
          hdef:=fieldtypes[i];
          case hdef.typ of
            orddef:
              case torddef(hdef).ordtype of
                s8bit,
                u8bit,
                pasbool1,
                pasbool8:
                  typename:=typename+'i8';
                s16bit,
                u16bit:
                  typename:=typename+'i16';
                s32bit,
                u32bit:
                  typename:=typename+'i32';
                s64bit,
                u64bit:
                  typename:=typename+'i64';
                customint:
                  typename:=typename+'i'+tostr(torddef(hdef).packedbitsize);
                else
                  { other types should not appear currently, add as needed }
                  internalerror(2014012001);
              end;
            floatdef:
              case tfloatdef(hdef).floattype of
                s32real:
                  typename:=typename+'f32';
                s64real:
                  typename:=typename+'f64';
                else
                  { other types should not appear currently, add as needed }
                  internalerror(2014012008);
              end;
            else
              { every other kind of def is identified by its unique id }
              typename:=typename+'d'+hdef.unique_id_str;
          end;
        end;
      if not assigned(current_module) then
        internalerror(2014012002);
      { look the name up in the module's table, adding an empty entry if it
        is not there yet }
      res:=current_module.llvmdefs.FindOrAdd(@typename[1],length(typename));
      if not assigned(res^.Data) then
        begin
          { first request for this combination of field types: create it }
          res^.Data:=crecorddef.create_global_internal(typename,packrecords,
            recordalignmin,maxcrecordalign);
          for i:=low(fieldtypes) to high(fieldtypes) do
            trecorddef(res^.Data).add_field_by_def('F'+tostr(i),fieldtypes[i]);
        end;
      trecordsymtable(trecorddef(res^.Data).symtable).addalignmentpadding;
      result:=trecorddef(res^.Data);
    end;
  { Returns the def used to represent the parameter/result location
    "cgpara" on the LLVM side.

    Single location: the location's def is used, except that cgpara.def
    itself is used when it is not a special array and has size 0. When
    beforevalueext is true, llvmextractvalueextinfo is additionally applied
    to that def (the extension kind it reports is discarded here). A float
    def of type s64comp or s64currency is replaced by s80floattype.

    Multiple locations (at most 10, otherwise internalerror 2016121801): a
    temporary record is built with one field per location, and the result is
    flagged with df_llvm_no_struct_packing. }
  function llvmgetcgparadef(const cgpara: tcgpara; beforevalueext: boolean): tdef;
    var
      locdefs: array[0..9] of tdef;
      curloc: pcgparalocation;
      singledef,
      fielddef: tdef;
      ignoredext: tllvmvalueextension;
      slotcount,
      count: longint;
      remaining: asizeint;
    begin
      { single location }
      if not assigned(cgpara.location^.next) then
        begin
          { def of the location, except in case of zero/sign-extension and
            zero-sized records }
          if is_special_array(cgpara.def) or
             (cgpara.def.size<>0) then
            singledef:=cgpara.location^.def
          else
            singledef:=cgpara.def;
          if beforevalueext then
            llvmextractvalueextinfo(cgpara.def,singledef,ignoredext);
          { comp and currency are handled by the x87 in this case. LLVM has
            no direct representation for them and llvmdef maps them to i64
            (their storage size; internally they are int64 as well), so the
            returndef/parameter declaration is switched to s80real instead. }
          if (singledef.typ=floatdef) and
             (tfloatdef(singledef).floattype in [s64comp,s64currency]) then
            singledef:=s80floattype;
          result:=singledef;
          exit;
        end;

      { multiple locations -> create temp record }
      curloc:=cgpara.location;
      count:=0;
      remaining:=cgpara.Def.size;
      while assigned(curloc) do
        begin
          if count>high(locdefs) then
            internalerror(2016121801);
          { start from the location's own def and only replace it for the
            final location when one of the special cases below applies }
          fielddef:=curloc^.def;
          if assigned(curloc^.next) then
            { not the last location: account for the bytes it covers }
            dec(remaining,fielddef.size)
          else if fielddef.size<>remaining then
            begin
              { last location whose def does not match the number of bytes
                still to be covered: for 1..7 remaining bytes use the
                integer type of that byte count }
              case remaining of
                1:
                  fielddef:=u8inttype;
                2:
                  fielddef:=u16inttype;
                3:
                  fielddef:=u24inttype;
                4:
                  fielddef:=u32inttype;
                5:
                  fielddef:=u40inttype;
                6:
                  fielddef:=u48inttype;
                7:
                  fielddef:=u56inttype;
                else
                  fielddef:=curloc^.def;
              end;
            end
          else if fielddef.typ<>floatdef then
            begin
              { last, exactly fitting non-float location: when the remaining
                size is a whole multiple (more than one) of the parameter
                alignment, describe it as an array of alignment-sized
                ordinals }
              slotcount:=remaining div cgpara.Alignment;
              if (slotcount>1) and
                 ((slotcount*cgpara.Alignment)=remaining) then
                fielddef:=carraydef.getreusable(cgsize_orddef(int_cgsize(cgpara.Alignment)),slotcount);
            end;
          locdefs[count]:=fielddef;
          inc(count);
          curloc:=curloc^.next;
        end;
      result:=llvmgettemprecorddef(slice(locdefs,count),C_alignment,
        targetinfos[target_info.system]^.alignment.recordalignmin,
        targetinfos[target_info.system]^.alignment.maxCrecordalign);
      include(result.defoptions,df_llvm_no_struct_packing);
    end;
  { Returns the string produced by llvmaddencodedtype_intern for "def" when
    called with only the lef_typedecl flag set, starting from an empty
    string. }
  function llvmencodetypedecl(def: tdef): TSymStr;
    var
      decl: TSymStr;
    begin
      decl:='';
      llvmaddencodedtype_intern(def,[lef_typedecl],decl);
      result:=decl;
    end;
  958. end.