llvmdef.pas 36 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927
  1. {
  2. Copyright (c) 2013 by Jonas Maebe
  3. This unit implements some LLVM type helper routines.
  4. This program is free software; you can redistribute it and/or modify
  5. it under the terms of the GNU General Public License as published by
  6. the Free Software Foundation; either version 2 of the License, or
  7. (at your option) any later version.
  8. This program is distributed in the hope that it will be useful,
  9. but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  11. GNU General Public License for more details.
  12. You should have received a copy of the GNU General Public License
  13. along with this program; if not, write to the Free Software
  14. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  15. ****************************************************************************
  16. }
  17. {$i fpcdefs.inc}
  18. unit llvmdef;
  19. interface
  20. uses
  21. cclasses,globtype,
  22. aasmbase,
  23. parabase,
  24. symbase,symtype,symdef,
  25. llvmbase;
  26. type
  27. { there are four different circumstances in which procdefs are used:
  28. a) definition of a procdef that's implemented in the current module
  29. b) declaration of an external routine that's called in the current one
  30. c) alias declaration of a procdef implemented in the current module
  31. d) defining a procvar type
  32. The main differences between the contexts are:
  33. a) information about sign extension of result type, proc name, parameter names & sign-extension info & types
  34. b) information about sign extension of result type, proc name, no parameter names, with parameter sign-extension info & types
  35. c) no information about sign extension of result type, proc name, no parameter names, no information about sign extension of parameters, parameter types
  36. d) no information about sign extension of result type, no proc name, no parameter names, no information about sign extension of parameters, parameter types
  37. }
  38. tllvmprocdefdecltype = (lpd_def,lpd_decl,lpd_alias,lpd_procvar);
  39. { returns the identifier to use as typename for a def in llvm (llvm only
  40. allows naming struct types) -- only supported for defs with a typesym, and
  41. only for tabstractrecorddef descendants and complex procvars }
  42. function llvmtypeidentifier(def: tdef): TSymStr;
  43. { encode a type into the internal format used by LLVM (for a type
  44. declaration) }
  45. function llvmencodetypedecl(def: tdef): TSymStr;
  46. { same as above, but use a type name if possible (for any use) }
  47. function llvmencodetypename(def: tdef): TSymStr;
  48. { encode a procdef/procvardef into the internal format used by LLVM }
  49. function llvmencodeproctype(def: tabstractprocdef; const customname: TSymStr; pddecltype: tllvmprocdefdecltype): TSymStr;
  50. { incremental version of the above: appends the encoding to encodedstr }
  51. procedure llvmaddencodedproctype(def: tabstractprocdef; const customname: TSymStr; pddecltype: tllvmprocdefdecltype; var encodedstr: TSymStr);
  52. { function result types may have to be represented differently, e.g. a
  53. record consisting of 4 longints must be returned as a record consisting of
  54. two int64's on x86-64. This function is used to create (and reuse)
  55. temporary recorddefs for such purposes. }
  56. function llvmgettemprecorddef(fieldtypes: array of tdef; packrecords, recordalignmin, maxcrecordalign: shortint): trecorddef;
  57. { get the llvm type corresponding to a parameter, e.g. a record containing
  58. two int64 fields for an arbitrary record split over two individual int64
  59. parameters, or an int32 for an int16 parameter on a platform that requires
  60. such parameters to be zero/sign extended. The second parameter can be used
  61. to get the type before zero/sign extension, as e.g. required to generate
  62. function declarations. }
  63. function llvmgetcgparadef(const cgpara: tcgpara; beforevalueext: boolean): tdef;
  64. { can be used to extract the value extension info from a cgpara. Pass in
  65. the def of the cgpara as first parameter and a local variable holding
  66. a copy of the def of the location (value extension only makes sense for
  67. ordinal parameters that are smaller than a single location). The routine
  68. will return the def of the location without sign extension (if applicable)
  69. and the kind of sign extension that was originally performed in the
  70. signext parameter }
  71. procedure llvmextractvalueextinfo(paradef: tdef; var paralocdef: tdef; out signext: tllvmvalueextension);
  72. { returns whether a paraloc should be translated into an llvm "byval"
  73. parameter. These are declared as pointers to a particular type, but
  74. usually turned into copies onto the stack. The exact behaviour for
  75. parameters that should be passed in registers is undefined and depends on
  76. the platform, and furthermore this modifier sometimes inhibits
  77. optimizations. As a result, we only use it for aggregate parameters of
  78. which we know that they should be passed on the stack }
  79. function llvmbyvalparaloc(paraloc: pcgparalocation): boolean;
  80. { returns whether a def is represented by an aggregate type in llvm
  81. (struct, array) }
  82. function llvmaggregatetype(def: tdef): boolean;
  { returns the llvm opcode needed to convert a value of type fromsize into
  tosize (ptrtoint/inttoptr, trunc, sext/zext, fptrunc/fpext or bitcast).
  fromsize/tosize are var parameters: when inregs is set, comp/currency
  floatdefs are replaced by sc80floattype }
  83. function llvmconvop(var fromsize, tosize: tdef; inregs: boolean): tllvmop;
  84. { mangle a global identifier so that it's recognised by LLVM as a global
  85. (in the sense of module-global) label and so that it won't mangle the
  86. name further according to platform conventions (we already did that) }
  87. function llvmmangledname(const s: TSymStr): TSymStr;
  { returns how an assembler symbol is written in llvm: '%name' for
  AB_TEMP symbols, 'label %name' for AT_LABEL/AT_ADDR symbols, and the
  mangled global name otherwise }
  88. function llvmasmsymname(const sym: TAsmSymbol): TSymStr;
  89. implementation
  90. uses
  91. globals,cutils,constexp,
  92. verbose,systems,
  93. fmodule,
  94. symtable,symconst,symsym,
  95. llvmsym,hlcgobj,
  96. defutil,blockutl,cgbase,paramgr;
  97. {******************************************************************
  98. Type encoding
  99. *******************************************************************}
  function llvmtypeidentifier(def: tdef): TSymStr;
    { Builds the quoted llvm type name '%"typ.<owner hierarchy><type name>"'
      for a def. The def must have a typesym; otherwise an internal error
      is raised. }
    var
      ownerprefix: TSymStr;
    begin
      if not assigned(def.typesym) then
        internalerror(2015041901);
      { owner hierarchy first, so identically named types stay distinct }
      ownerprefix:=def.fullownerhierarchyname(false);
      result:='%"typ.'+ownerprefix+def.typesym.realname+'"';
    end;
  function llvmaggregatetype(def: tdef): boolean;
    { Returns true when the def is encoded as an llvm aggregate (struct or
      array): records, files, variants, non-dynamic arrays, non-small sets,
      shortstrings, objects and procvars that are not address-only. }
    begin
      { assume "aggregate" and leave as soon as one criterion matches }
      result:=true;
      if def.typ in [recorddef,filedef,variantdef] then
        exit;
      if (def.typ=arraydef) and
         not is_dynamic_array(def) then
        exit;
      if (def.typ=setdef) and
         not is_smallset(def) then
        exit;
      if is_shortstring(def) then
        exit;
      if is_object(def) then
        exit;
      if (def.typ=procvardef) and
         not tprocvardef(def).is_addressonly then
        exit;
      result:=false;
    end;
  function llvmconvop(var fromsize, tosize: tdef; inregs: boolean): tllvmop;
    { Selects the llvm conversion opcode for turning a value of type
      fromsize into tosize.

      fromsize/tosize are var parameters: when inregs is set, a comp or
      currency floatdef is replaced by sc80floattype before the sizes are
      compared (this only happens when neither side is an address). }

    { byte size of def at the value level; may replace def as described
      above }
    function valuebytesize(var def: tdef): asizeint;
      begin
        if inregs and
           (def.typ=floatdef) then
          begin
            { treat comp and currency as extended in registers (see comment
              at start of thlgcobj.a_loadfpu_ref_reg) }
            if tfloatdef(def).floattype in [s64comp,s64currency] then
              def:=sc80floattype;
            { at the value level, s80real and sc80real are the same }
            if tfloatdef(def).floattype=s80real then
              result:=sc80floattype.size
            else
              result:=def.size;
          end
        else
          result:=def.size;
      end;

    var
      srcregtyp,
      dstregtyp: tregistertype;
      srcbytes,
      dstbytes: asizeint;
    begin
      srcregtyp:=chlcgobj.def2regtyp(fromsize);
      dstregtyp:=chlcgobj.def2regtyp(tosize);
      if srcregtyp=R_ADDRESSREGISTER then
        begin
          { pointer to int/pointer/something else }
          case dstregtyp of
            R_INTREGISTER:
              result:=la_ptrtoint;
            R_ADDRESSREGISTER:
              result:=la_bitcast;
            else
              result:=la_ptrtoint_to_x;
          end;
        end
      else if dstregtyp=R_ADDRESSREGISTER then
        begin
          { int/something else to pointer; the source cannot be an address
            register here, that case was handled above }
          if srcregtyp=R_INTREGISTER then
            result:=la_inttoptr
          else
            result:=la_x_to_inttoptr;
        end
      else
        begin
          { the source size is determined before the destination size }
          srcbytes:=valuebytesize(fromsize);
          dstbytes:=valuebytesize(tosize);
          { need zero/sign extension, float truncation or plain bitcast? }
          if dstbytes<>srcbytes then
            begin
              if srcregtyp in [R_FPUREGISTER,R_MMREGISTER] then
                begin
                  { todo: update once we support vectors }
                  if not(dstregtyp in [R_FPUREGISTER,R_MMREGISTER]) then
                    internalerror(2014062203);
                  if dstbytes<srcbytes then
                    result:=la_fptrunc
                  else
                    result:=la_fpext;
                end
              else if dstbytes<srcbytes then
                result:=la_trunc
              else if is_signed(fromsize) then
                { fromsize is signed -> sign extension }
                result:=la_sext
              else
                result:=la_zext;
            end
          else if (fromsize=llvmbool1type) and
                  (tosize<>llvmbool1type) then
            begin
              { i1 to an equally sized boolean }
              if is_cbool(tosize) then
                result:=la_sext
              else
                result:=la_zext;
            end
          else if (tosize=llvmbool1type) and
                  (fromsize<>llvmbool1type) then
            begin
              { would have to compare with 0, can't just take the lowest bit }
              if is_cbool(fromsize) then
                internalerror(2016052001)
              else
                result:=la_trunc;
            end
          else
            result:=la_bitcast;
        end;
    end;
  function llvmmangledname(const s: TSymStr): TSymStr;
    { Turns an already platform-mangled symbol name into an llvm global
      identifier.

      - names starting with 'llvm.' are only prefixed with '@'
      - unquoted names become '@"\01<name>"'
      - names that already start with a double quote get '@' prepended and
        '\01' inserted right after the opening quote

      An empty name is treated as unquoted, so that s[1] is never read when
      the string has no characters. }
    const
      intrinsicprefix = 'llvm.';
    begin
      if copy(s,1,length(intrinsicprefix))=intrinsicprefix then
        result:='@'+s
      else if (s='') or
              (s[1]<>'"') then
        result:='@"\01'+s+'"'
      else
        begin
          { already quoted -> insert \01 and prepend @ }
          result:='@'+s;
          { position 3 = right after the '@' and the opening quote }
          insert('\01',result,3);
        end;
    end;
  function llvmasmsymname(const sym: TAsmSymbol): TSymStr;
    { Returns the textual llvm form of an assembler symbol:
        AB_TEMP symbols            -> '%name'
        AT_LABEL/AT_ADDR symbols   -> 'label %name'
        everything else            -> mangled global name }
    begin
      if sym.bind=AB_TEMP then
        result:='%'+sym.name
      { AT_ADDR and AT_LABEL represent labels in the code, which have
        a different type in llvm compared to (global) data labels }
      else if sym.typ in [AT_LABEL,AT_ADDR] then
        result:='label %'+sym.name
      else
        result:=llvmmangledname(sym.name);
    end;
  function llvmbyvalparaloc(paraloc: pcgparalocation): boolean;
    { Decides whether a parameter location is passed as an llvm "byval"
      parameter.

      "byval" is broken for register paras on several platforms in llvm
      (search for "byval" in llvm's bug tracker). Additionally, it should
      only be used to pass aggregate parameters on the stack, because it
      reportedly inhibits llvm's midlevel optimizers.

      Exception (for now?): register parameters that have special shifting
      requirements, because modelling those in llvm is not easy (and neither
      clang nor llvm-gcc seem to do so either). }
    begin
      case paraloc^.loc of
        LOC_REFERENCE:
          { on the stack: only aggregates }
          result:=llvmaggregatetype(paraloc^.def);
        LOC_REGISTER,
        LOC_CREGISTER:
          { in a register: only when the value has to be shifted }
          result:=paraloc^.shiftval<>0;
        else
          result:=false;
      end;
    end;
  { forward declaration: llvmaddencodedtype_intern below calls this routine
  for records/objects, and this routine calls llvmaddencodedtype_intern for
  every field }
  268. procedure llvmaddencodedabstractrecordtype(def: tabstractrecorddef; var encodedstr: TSymStr); forward;
  269. type
  { flags steering llvmaddencodedtype_intern:
  lef_inaggregate: the type is encoded as part of an aggregate (e.g. s80real
  becomes [10 x i8], named records are referenced by name)
  lef_noimplicitderef: do not append the '*' of implicit pointer object
  types/interfaces
  lef_typedecl: the encoding is for a type declaration (set by
  llvmencodetypedecl), so the layout is written out instead of the type
  name }
  270. tllvmencodeflag = (lef_inaggregate, lef_noimplicitderef, lef_typedecl);
  271. tllvmencodeflags = set of tllvmencodeflag;
  procedure llvmaddencodedtype_intern(def: tdef; const flags: tllvmencodeflags; var encodedstr: TSymStr);
    { Appends the llvm encoding of def to encodedstr. The flags select
      between the variants needed inside aggregates, for type declarations
      and for implicit pointer types; unsupported defs raise an internal
      error. }
    var
      nestedflags: tllvmencodeflags;
      mayusetypename,
      hasisobuffer: boolean;
    begin
      { flags used when a file/variant is encoded via its system record:
        always "in aggregate", and "type declaration" if we are in one }
      nestedflags:=[lef_inaggregate]+[lef_typedecl]*flags;
      { named records/procvars are referenced by name, except at the top
        level of a type declaration (avoids endlessly recursive
        definitions) }
      mayusetypename:=
        (lef_inaggregate in flags) or
        not(lef_typedecl in flags);
      case def.typ of
        stringdef:
          begin
            case tstringdef(def).stringtype of
              st_widestring,
              st_unicodestring:
                { the variable does not point to the header, but to a
                  null-terminated string/array with undefined bounds }
                encodedstr:=encodedstr+'i16*';
              st_ansistring:
                encodedstr:=encodedstr+'i8*';
              st_shortstring:
                { length byte followed by string bytes }
                if tstringdef(def).len>0 then
                  encodedstr:=encodedstr+'['+tostr(tstringdef(def).len+1)+' x i8]'
                else
                  encodedstr:=encodedstr+'[0 x i8]';
              else
                internalerror(2013100201);
            end;
          end;
        enumdef:
          { integer with the bit width of the enum's storage size }
          encodedstr:=encodedstr+'i'+tostr(def.size*8);
        orddef:
          begin
            if is_void(def) then
              encodedstr:=encodedstr+'void'
            { mainly required because comparison operations return i1, and
              we need a way to represent the i1 type in Pascal. We don't
              reuse pasbool1type, because putting an i1 in a record or
              passing it as a parameter may result in unexpected behaviour }
            else if def=llvmbool1type then
              encodedstr:=encodedstr+'i1'
            else
              encodedstr:=encodedstr+'i'+tostr(def.size*8);
          end;
        pointerdef:
          begin
            if not is_voidpointer(def) then
              begin
                { pointee type followed by '*' }
                llvmaddencodedtype_intern(tpointerdef(def).pointeddef,[],encodedstr);
                encodedstr:=encodedstr+'*';
              end
            else
              encodedstr:=encodedstr+'i8*';
          end;
        floatdef:
          begin
            case tfloatdef(def).floattype of
              s32real:
                encodedstr:=encodedstr+'float';
              s64real:
                encodedstr:=encodedstr+'double';
              { necessary to be able to force our own size/alignment }
              s80real:
                { prevent llvm from allocating the standard ABI size for
                  extended }
                if lef_inaggregate in flags then
                  encodedstr:=encodedstr+'[10 x i8]'
                else
                  encodedstr:=encodedstr+'x86_fp80';
              sc80real:
                encodedstr:=encodedstr+'x86_fp80';
              s64comp,
              s64currency:
                encodedstr:=encodedstr+'i64';
              s128real:
{$if defined(powerpc) or defined(powerpc128)}
                encodedstr:=encodedstr+'ppc_fp128';
{$else}
                encodedstr:=encodedstr+'fp128';
{$endif}
              else
                internalerror(2013100202);
            end;
          end;
        filedef:
          begin
            case tfiledef(def).filetyp of
              ft_text:
                llvmaddencodedtype_intern(search_system_type('TEXTREC').typedef,nestedflags,encodedstr);
              ft_typed:
                begin
                  { in case of ISO-like I/O, the typed file def includes a
                    get/put buffer of the size of the file's elements; it
                    is wrapped together with FILEREC in a packed struct }
                  hasisobuffer:=
                    (m_isolike_io in current_settings.modeswitches) and
                    not is_void(tfiledef(def).typedfiledef);
                  if hasisobuffer then
                    encodedstr:=encodedstr+'<{';
                  llvmaddencodedtype_intern(search_system_type('FILEREC').typedef,nestedflags,encodedstr);
                  if hasisobuffer then
                    encodedstr:=encodedstr+',['+tostr(tfiledef(def).typedfiledef.size)+' x i8]}>';
                end;
              ft_untyped:
                llvmaddencodedtype_intern(search_system_type('FILEREC').typedef,nestedflags,encodedstr);
              else
                internalerror(2013100203);
            end;
          end;
        recorddef:
          begin
            { avoid endlessly recursive definitions }
            if mayusetypename and
               assigned(def.typesym) then
              encodedstr:=encodedstr+llvmtypeidentifier(def)
            else
              llvmaddencodedabstractrecordtype(trecorddef(def),encodedstr);
          end;
        variantdef:
          { encoded through the TVARDATA system record }
          llvmaddencodedtype_intern(search_system_type('TVARDATA').typedef,nestedflags,encodedstr);
        classrefdef:
          begin
            if is_class(tclassrefdef(def).pointeddef) then
              begin
                { pointer to the class' vmt type }
                llvmaddencodedtype_intern(tobjectdef(tclassrefdef(def).pointeddef).vmt_def,flags,encodedstr);
                encodedstr:=encodedstr+'*';
              end
            else if is_objcclass(tclassrefdef(def).pointeddef) then
              llvmaddencodedtype_intern(objc_idtype,flags,encodedstr)
            else
              encodedstr:=encodedstr+'i8*';
          end;
        setdef:
          begin
            { just an array as far as llvm is concerned; don't use a "packed
              array of i1" or so, this requires special support in backends
              and guarantees nothing about the internal format }
            if not is_smallset(def) then
              encodedstr:=encodedstr+'['+tostr(tsetdef(def).size)+' x i8]'
            else
              llvmaddencodedtype_intern(cgsize_orddef(def_cgsize(def)),[lef_inaggregate],encodedstr);
          end;
        formaldef:
          { var/const/out x (always treated as "pass by reference" -> don't
            add extra "*" here) }
          encodedstr:=encodedstr+'i8';
        arraydef:
          begin
            if is_array_of_const(def) then
              begin
                { unbounded array of TVARREC }
                encodedstr:=encodedstr+'[0 x ';
                llvmaddencodedtype_intern(search_system_type('TVARREC').typedef,[lef_inaggregate],encodedstr);
                encodedstr:=encodedstr+']';
              end
            else if is_open_array(def) then
              begin
                { unbounded array of the element type }
                encodedstr:=encodedstr+'[0 x ';
                llvmaddencodedtype_intern(tarraydef(def).elementdef,[lef_inaggregate],encodedstr);
                encodedstr:=encodedstr+']';
              end
            else if is_dynamic_array(def) then
              begin
                { pointer to the element type }
                llvmaddencodedtype_intern(tarraydef(def).elementdef,[lef_inaggregate],encodedstr);
                encodedstr:=encodedstr+'*';
              end
            else if is_packed_array(def) and
                    (tarraydef(def).elementdef.typ in [enumdef,orddef]) then
              begin
                { encode as an array of bytes rather than as an array of
                  packedbitsloadsize(elesize), because even if the load size
                  is e.g. 2 bytes, the array may only be 1 or 3 bytes long
                  (and if this array is inside a record, it must not be
                  encoded as a type that is too long) }
                encodedstr:=encodedstr+'['+tostr(tarraydef(def).size)+' x ';
                llvmaddencodedtype_intern(u8inttype,[lef_inaggregate],encodedstr);
                encodedstr:=encodedstr+']';
              end
            else
              begin
                { regular array: element count x element type }
                encodedstr:=encodedstr+'['+tostr(tarraydef(def).elecount)+' x ';
                llvmaddencodedtype_intern(tarraydef(def).elementdef,[lef_inaggregate],encodedstr);
                encodedstr:=encodedstr+']';
              end;
          end;
        procdef,
        procvardef:
          begin
            if (def.typ=procdef) or
               tprocvardef(def).is_addressonly then
              begin
                { plain function type; a procvar is a pointer to it }
                llvmaddencodedproctype(tabstractprocdef(def),'',lpd_procvar,encodedstr);
                if def.typ=procvardef then
                  encodedstr:=encodedstr+'*';
              end
            else if mayusetypename and
                    assigned(tprocvardef(def).typesym) then
              begin
                { in case the procvardef recursively references itself, e.g.
                  via a pointer }
                encodedstr:=encodedstr+llvmtypeidentifier(def);
                { blocks are implicit pointers }
                if is_block(def) then
                  encodedstr:=encodedstr+'*';
              end
            else if is_block(def) then
              llvmaddencodedtype_intern(get_block_literal_type_for_proc(tabstractprocdef(def)),flags,encodedstr)
            else
              begin
                { complex procvar: packed struct of code and data pointer }
                encodedstr:=encodedstr+'<{';
                { code pointer }
                llvmaddencodedproctype(tabstractprocdef(def),'',lpd_procvar,encodedstr);
                { data pointer (maybe todo: generate actual layout if
                  available) }
                encodedstr:=encodedstr+'*, i8*}>';
              end;
          end;
        objectdef:
          case tobjectdef(def).objecttype of
            odt_class,
            odt_objcclass,
            odt_object,
            odt_cppclass:
              begin
                { by name outside type declarations, full layout otherwise }
                if assigned(def.typesym) and
                   not(lef_typedecl in flags) then
                  encodedstr:=encodedstr+llvmtypeidentifier(def)
                else
                  llvmaddencodedabstractrecordtype(tabstractrecorddef(def),encodedstr);
                if ([lef_typedecl,lef_noimplicitderef]*flags=[]) and
                   is_implicit_pointer_object_type(def) then
                  encodedstr:=encodedstr+'*';
              end;
            odt_interfacecom,
            odt_interfacecorba,
            odt_dispinterface:
              begin
                { type is a pointer to a pointer to the vmt }
                llvmaddencodedtype_intern(tobjectdef(def).vmt_def,flags,encodedstr);
                if [lef_typedecl,lef_noimplicitderef]*flags=[] then
                  encodedstr:=encodedstr+'**';
              end;
            odt_interfacecom_function,
            odt_interfacecom_property,
            odt_objcprotocol:
              { opaque for now }
              encodedstr:=encodedstr+'i8*';
            odt_helper:
              { a helper is encoded as the type it extends }
              llvmaddencodedtype_intern(tobjectdef(def).extendeddef,flags,encodedstr);
            else
              internalerror(2013100601);
          end;
        undefineddef,
        errordef:
          internalerror(2013100604);
        else
          internalerror(2013100603);
      end;
    end;
  function llvmencodetypename(def: tdef): TSymStr;
    { Returns the llvm encoding of def for general use: no encode flags are
      set, so a type name is used wherever the encoder allows it. }
    var
      encoded: TSymStr;
    begin
      encoded:='';
      llvmaddencodedtype_intern(def,[],encoded);
      result:=encoded;
    end;
  procedure llvmaddencodedtype(def: tdef; inaggregate: boolean; var encodedstr: TSymStr);
    { Boolean front end for llvmaddencodedtype_intern: appends the encoding
      of def to encodedstr, with lef_inaggregate set iff inaggregate. }
    begin
      if not inaggregate then
        llvmaddencodedtype_intern(def,[],encodedstr)
      else
        llvmaddencodedtype_intern(def,[lef_inaggregate],encodedstr);
    end;
  procedure llvmaddencodedabstractrecordtype(def: tabstractrecorddef; var encodedstr: TSymStr);
    { Appends the llvm struct layout of a record/object to encodedstr, based
      on the entries of its llvm shadow symtable. The struct is written as
      packed ('<{ ... }>') unless df_llvm_no_struct_packing is set in the
      def's options, in which case '{ ... }' is used. }
    var
      entries: tfpobjectlist;
      idx,
      firstplain: longint;
      unpacked: boolean;
    begin
      entries:=tabstractrecordsymtable(def.symtable).llvmst.symdeflist;
      unpacked:=df_llvm_no_struct_packing in def.defoptions;
      if unpacked then
        encodedstr:=encodedstr+'{ '
      else
        encodedstr:=encodedstr+'<{ ';
      { index of the first entry that is encoded as a regular field }
      firstplain:=0;
      if (entries.count>0) and
         (def.typ=objectdef) and
         assigned(tobjectdef(def).childof) and
         is_class_or_interface_or_dispinterface(tllvmshadowsymtableentry(entries[0]).def) then
        begin
          { insert the struct for the class rather than a pointer to the struct }
          if tllvmshadowsymtableentry(entries[0]).def.typ<>objectdef then
            internalerror(2008070601);
          llvmaddencodedtype_intern(tllvmshadowsymtableentry(entries[0]).def,[lef_inaggregate,lef_noimplicitderef],encodedstr);
          firstplain:=1;
        end;
      for idx:=firstplain to entries.count-1 do
        begin
          { separator before every entry except the very first one }
          if idx<>0 then
            encodedstr:=encodedstr+', ';
          llvmaddencodedtype_intern(tllvmshadowsymtableentry(entries[idx]).def,[lef_inaggregate],encodedstr);
        end;
      if unpacked then
        encodedstr:=encodedstr+' }'
      else
        encodedstr:=encodedstr+' }>';
    end;
  procedure llvmextractvalueextinfo(paradef: tdef; var paralocdef: tdef; out signext: tllvmvalueextension);
    { Detects implicit zero/sign extension of a parameter location.

      If both defs are ordinal and the parameter is smaller than its
      location, paralocdef is replaced by paradef and signext tells how the
      value was extended (by signedness of paradef). Otherwise paralocdef is
      left alone and signext is lve_none. }
    begin
      signext:=lve_none;
      { implicit zero/sign extension for ABI compliance? (yes, if the size
        of a paraloc is larger than the size of the entire parameter) }
      if (not is_ordinal(paradef)) or
         (not is_ordinal(paralocdef)) or
         (paradef.size>=paralocdef.size) then
        exit;
      paralocdef:=paradef;
      if is_signed(paradef) then
        signext:=lve_signext
      else
        signext:=lve_zeroext;
    end;
  procedure llvmaddencodedparaloctype(hp: tparavarsym; proccalloption: tproccalloption; withparaname, withattributes: boolean; var first: boolean; var encodedstr: TSymStr);
    { Appends the llvm encoding of one Pascal parameter to encodedstr, one
      llvm parameter per parameter location.

      hp:             the parameter
      proccalloption: calling convention of the routine
      withparaname:   also write the parameter names (uses the callee-side
                      locations; otherwise the caller-side ones are used)
      withattributes: also write value extension and sret/noalias/nocapture/
                      byval attributes
      first:          true on entry if no parameter has been written yet for
                      this routine; set to false once one has been written
      encodedstr:     string the encoding is appended to

      An "array of const" parameter of a cdecl-like routine is written as
      '...'. }
    var
      paraloc: PCGParaLocation;
      signext: tllvmvalueextension;
      usedef: tdef;
      isfirstllvmpara: boolean;
    begin
      if (proccalloption in cdecl_pocalls) and
         is_array_of_const(hp.vardef) then
        begin
          if not first then
            encodedstr:=encodedstr+', '
          else
            first:=false;
          encodedstr:=encodedstr+'...';
          exit
        end;
      if withparaname then
        paraloc:=hp.paraloc[calleeside].location
      else
        paraloc:=hp.paraloc[callerside].location;
      repeat
        usedef:=paraloc^.def;
        { implicit zero/sign extension for ABI compliance? }
        llvmextractvalueextinfo(hp.vardef,usedef,signext);
        { remember whether this is the very first llvm parameter *before*
          "first" gets cleared: the sret handling below depends on it }
        isfirstllvmpara:=first;
        if not first then
          encodedstr:=encodedstr+', '
        else
          first:=false;
        llvmaddencodedtype_intern(usedef,[],encodedstr);
        { in case there is a value extension, there should be only one
          paraloc -> no need to clear it (reason: it means that the paraloc
          is larger than the original parameter) }
        if withattributes then
          encodedstr:=encodedstr+llvmvalueextension2str[signext];
        { sret: hidden pointer for structured function result }
        if vo_is_funcret in hp.varoptions then
          begin
            { "sret" is only valid for the first parameter, while in FPC this
              can sometimes be the second one (self comes before). In general,
              this is not a problem: we can just leave out sret, which means
              the result will be a bit less well optimised), but it is for
              AArch64: there, the sret parameter must be passed in a different
              register (-> paranr_result is smaller than paranr_self for that
              platform in symconst) }
{$ifdef aarch64}
            if not isfirstllvmpara then
              internalerror(2015101404);
{$endif aarch64}
            if withattributes then
              if isfirstllvmpara then
                encodedstr:=encodedstr+' sret'
              else { we can add some other attributes to optimise things }
                encodedstr:=encodedstr+' noalias nocapture';
          end
        else if not paramanager.push_addr_param(hp.varspez,hp.vardef,proccalloption) and
           llvmbyvalparaloc(paraloc) then
          begin
            { byval parameters are declared as pointers }
            if withattributes then
              encodedstr:=encodedstr+'* byval'
            else
              encodedstr:=encodedstr+'*';
          end;
        if withparaname then
          begin
            { the name is taken from the symbol of the llvm location }
            if paraloc^.llvmloc.loc<>LOC_REFERENCE then
              internalerror(2014010803);
            encodedstr:=encodedstr+' '+llvmasmsymname(paraloc^.llvmloc.sym);
          end;
        paraloc:=paraloc^.next;
      until not assigned(paraloc);
    end;
  function llvmencodeproctype(def: tabstractprocdef; const customname: TSymStr; pddecltype: tllvmprocdefdecltype): TSymStr;
    { Returns the llvm encoding of a procdef/procvardef as a fresh string;
      the work is done by llvmaddencodedproctype. }
    var
      encoded: TSymStr;
    begin
      encoded:='';
      llvmaddencodedproctype(def,customname,pddecltype,encoded);
      result:=encoded;
    end;
  procedure llvmaddencodedproctype(def: tabstractprocdef; const customname: TSymStr; pddecltype: tllvmprocdefdecltype; var encodedstr: TSymStr);
    { Appends the llvm encoding of a routine type to encodedstr:
      [result extension] ' ' result type ' ' [name] '(' parameters ')'.

      def:        the procdef/procvardef to encode
      customname: name to use instead of the procdef's mangled name (if not
                  empty); only used for definitions/declarations of procdefs
      pddecltype: the context, which determines whether names and extension
                  information are written }
    var
      resultdef: tdef;
      paraidx: longint;
      resultext: tllvmvalueextension;
      side: tcallercallee;
      isdefinition,
      isdeclordef,
      noparayet: boolean;
    begin
      isdefinition:=pddecltype=lpd_def;
      { everything that is neither a procvar nor an alias }
      isdeclordef:=pddecltype in [lpd_decl,lpd_def];
      { when writing a definition, we have to write the parameter names, and
        those are only available on the callee side. In all other cases,
        we are at the callerside }
      if isdefinition then
        side:=calleeside
      else
        side:=callerside;
      def.init_paraloc_info(side);
      { function result (return-by-ref is handled explicitly) }
      if paramanager.ret_in_param(def.returndef,def) then
        begin
          { result passed via a hidden parameter -> llvm function is void }
          encodedstr:=encodedstr+' ';
          llvmaddencodedtype(voidtype,false,encodedstr);
        end
      else
        begin
          resultdef:=llvmgetcgparadef(def.funcretloc[side],false);
          llvmextractvalueextinfo(def.returndef,resultdef,resultext);
          { specifying result sign extension information for an alias causes
            an error for some reason }
          if isdeclordef then
            encodedstr:=encodedstr+llvmvalueextension2str[resultext];
          encodedstr:=encodedstr+' ';
          llvmaddencodedtype_intern(resultdef,[],encodedstr);
        end;
      encodedstr:=encodedstr+' ';
      { add procname? }
      if isdeclordef and
         (def.typ=procdef) then
        begin
          if customname<>'' then
            encodedstr:=encodedstr+llvmmangledname(customname)
          else
            encodedstr:=encodedstr+llvmmangledname(tprocdef(def).mangledname);
        end;
      encodedstr:=encodedstr+'(';
      { parameters }
      noparayet:=true;
      for paraidx:=0 to def.paras.count-1 do
        llvmaddencodedparaloctype(tparavarsym(def.paras[paraidx]),def.proccalloption,isdefinition,isdeclordef,noparayet,encodedstr);
      { C-style varargs }
      if po_varargs in def.procoptions then
        begin
          if not noparayet then
            encodedstr:=encodedstr+', ';
          encodedstr:=encodedstr+'...';
        end;
      encodedstr:=encodedstr+')';
    end;
  function llvmgettemprecorddef(fieldtypes: array of tdef; packrecords, recordalignmin, maxcrecordalign: shortint): trecorddef;
    { Returns a record def whose fields have the given types, creating it on
      first use and reusing it afterwards.

      The record is looked up in current_module.llvmdefs under a name built
      from the internal llvm struct prefix plus one tag per field type
      (i8/i16/i32/i64, f32/f64, or 'd'+unique id for any other def). New
      records get fields named F0, F1, ...

      NOTE(review): the lookup name does not include packrecords,
      recordalignmin or maxcrecordalign, so a call with the same field types
      but different alignment settings gets the previously created record --
      confirm that callers never rely on this.
      NOTE(review): addalignmentpadding is also called when an existing
      record is reused -- presumably harmless, confirm. }
    var
      i: longint;
      res: PHashSetItem;
      hdef: tdef;
      typename: string;
    begin
      typename:=internaltypeprefixName[itp_llvmstruct];
      for i:=low(fieldtypes) to high(fieldtypes) do
        begin
          hdef:=fieldtypes[i];
          case hdef.typ of
            orddef:
              case torddef(hdef).ordtype of
                s8bit,
                u8bit,
                pasbool1,
                pasbool8:
                  typename:=typename+'i8';
                s16bit,
                u16bit:
                  typename:=typename+'i16';
                s32bit,
                u32bit:
                  typename:=typename+'i32';
                s64bit,
                u64bit:
                  typename:=typename+'i64';
                else
                  { other types should not appear currently, add as needed }
                  internalerror(2014012001);
              end;
            floatdef:
              case tfloatdef(hdef).floattype of
                s32real:
                  typename:=typename+'f32';
                s64real:
                  typename:=typename+'f64';
                else
                  { other types should not appear currently, add as needed }
                  internalerror(2014012008);
              end;
            else
              { any other def is identified by its unique id }
              typename:=typename+'d'+hdef.unique_id_str;
          end;
        end;
      if not assigned(current_module) then
        internalerror(2014012002);
      { typename always contains at least the prefix assigned above }
      res:=current_module.llvmdefs.FindOrAdd(@typename[1],length(typename));
      if not assigned(res^.Data) then
        begin
          { first request for this field combination -> create the record }
          res^.Data:=crecorddef.create_global_internal(typename,packrecords,
            recordalignmin,maxcrecordalign);
          for i:=low(fieldtypes) to high(fieldtypes) do
            trecorddef(res^.Data).add_field_by_def('F'+tostr(i),fieldtypes[i]);
        end;
      trecordsymtable(trecorddef(res^.Data).symtable).addalignmentpadding;
      result:=trecorddef(res^.Data);
    end;
  function llvmgetcgparadef(const cgpara: tcgpara; beforevalueext: boolean): tdef;
    { Returns the llvm-level def of a parameter/result described by cgpara.

      A single location yields the def of that location (or of the whole
      parameter for zero-sized non-special-array defs), optionally before
      zero/sign extension. Multiple locations yield a temporary record with
      one field per location, marked df_llvm_no_struct_packing. }
    var
      locdefs: array[0..9] of tdef;
      loc: pcgparalocation;
      valueext: tllvmvalueextension;
      loccount: longint;
    begin
      if assigned(cgpara.location^.next) then
        begin
          { multiple locations -> create temp record }
          loccount:=0;
          loc:=cgpara.location;
          while assigned(loc) do
            begin
              if loccount>high(locdefs) then
                internalerror(2016121801);
              locdefs[loccount]:=loc^.def;
              inc(loccount);
              loc:=loc^.next;
            end;
          result:=llvmgettemprecorddef(slice(locdefs,loccount),C_alignment,
            targetinfos[target_info.system]^.alignment.recordalignmin,
            targetinfos[target_info.system]^.alignment.maxCrecordalign);
          include(result.defoptions,df_llvm_no_struct_packing);
          exit;
        end;
      { single location: def of the location, except in case of
        zero/sign-extension and zero-sized records }
      if (cgpara.def.size=0) and
         not is_special_array(cgpara.def) then
        result:=cgpara.def
      else
        result:=cgpara.location^.def;
      if beforevalueext then
        llvmextractvalueextinfo(cgpara.def,result,valueext);
      { comp and currency are handled by the x87 in this case. They cannot
        be represented directly in llvm, and llvmdef translates them into
        i64 (since that's their storage size and internally they also are
        int64). Solve this by changing the type to s80real in the
        returndef/parameter declaration. }
      if (result.typ=floatdef) and
         (tfloatdef(result).floattype in [s64comp,s64currency]) then
        result:=s80floattype;
    end;
  function llvmencodetypedecl(def: tdef): TSymStr;
    { Returns the llvm encoding of def for use in a type declaration:
      lef_typedecl is set, so the encoder writes out the layout of def
      itself instead of referring to it by name. }
    var
      encoded: TSymStr;
    begin
      encoded:='';
      llvmaddencodedtype_intern(def,[lef_typedecl],encoded);
      result:=encoded;
    end;
  859. end.