| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289 | {    Copyright (c) 2002 by Florian Klaempfl    This unit contains the CPU specific part of tprocinfo    This program is free software; you can redistribute it and/or modify    it under the terms of the GNU General Public License as published by    the Free Software Foundation; either version 2 of the License, or    (at your option) any later version.    This program is distributed in the hope that it will be useful,    but WITHOUT ANY WARRANTY; without even the implied warranty of    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the    GNU General Public License for more details.    You should have received a copy of the GNU General Public License    along with this program; if not, write to the Free Software    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. ****************************************************************************}{ This unit contains the CPU specific part of tprocinfo. }unit cpupi;{$i fpcdefs.inc}  interface    uses       globtype,cutils,       procinfo,cpuinfo,psub,cgbase,       aasmdata;    type       tcpuprocinfo = class(tcgprocinfo)          { for arm thumb, we need to know the stackframe size before            starting procedure compilation, so this contains the stack frame size, the compiler            should assume            if this size is too little the procedure must be compiled again with a larger value }          stackframesize,          floatregstart : aint;          stackpaddingreg: TSuperRegister;          // procedure handle_body_start;override;          // procedure after_pass1;override;          procedure set_first_temp_offset;override;          function calc_stackframe_size:longint;override;          procedure init_framepointer; override;          procedure generate_parameter_info;override;          procedure allocate_got_register(list : TAsmList);override;          procedure postprocess_code;override;          procedure allocate_tls_register(list : TAsmList);override;       end;  implementation    uses       globals,systems,       cpubase,       tgobj,       symconst,symtype,symsym,symcpu,paramgr,       cgutils,       cgobj,       defutil,       aasmcpu;    procedure tcpuprocinfo.set_first_temp_offset;      var        localsize : aint;        i : longint;      begin        { We allocate enough space to save all registers because we can't determine          the necessary space because the used registers aren't known before          secondpass is run. Even worse, patching          the local offsets after generating the code could cause trouble because          "shifter" constants could change to non-"shifter" constants. This          is especially a problem when taking the address of a local. For now,          this extra memory should hurt less than generating all local contants with offsets          >256 as non shifter constants }        if (po_nostackframe in procdef.procoptions) then          begin             { maxpushedparasize sghould be zero,               if not we will get an error later. }             tg.setfirsttemp(maxpushedparasize);             exit;          end;        if tg.direction = -1 then          begin            if (target_info.system<>system_arm_darwin) then              { Non-Darwin, worst case: r4-r10,r11,r13,r14,r15 is saved -> -28-16, but we                always adjust the frame pointer to point to the first stored                register (= last register in list above) -> + 4 }              tg.setfirsttemp(-28-16)            else              { on Darwin first r4-r7,r14 are saved, then r7 is adjusted to                point to the saved r7, and next r8,r10,r11 gets saved -> -24                (r4-r6 and r8,r10,r11) }              tg.setfirsttemp(-24)          end        else          tg.setfirsttemp(maxpushedparasize);        { estimate stack frame size }        if GenerateThumbCode or (pi_estimatestacksize in flags) then          begin            stackframesize:=maxpushedparasize+32;            localsize:=0;            for i:=0 to procdef.localst.SymList.Count-1 do              if tsym(procdef.localst.SymList[i]).typ=localvarsym then                inc(localsize,tabstractnormalvarsym(procdef.localst.SymList[i]).getsize);            inc(stackframesize,localsize);            localsize:=0;            for i:=0 to procdef.parast.SymList.Count-1 do              if tsym(procdef.parast.SymList[i]).typ=paravarsym then                begin                  if tabstractnormalvarsym(procdef.parast.SymList[i]).varspez in [vs_var,vs_out,vs_constref] then                    inc(localsize,4)                  else if is_open_string(tabstractnormalvarsym(procdef.parast.SymList[i]).vardef) then                    inc(localsize,256)                  else                    inc(localsize,tabstractnormalvarsym(procdef.parast.SymList[i]).getsize);                end;            inc(stackframesize,localsize);            if pi_needs_implicit_finally in flags then              inc(stackframesize,40);            if pi_uses_exceptions in flags then              inc(stackframesize,40);            if procdef.proctypeoption in [potype_constructor] then              inc(stackframesize,40*2);            inc(stackframesize,estimatedtempsize);            stackframesize:=Align(stackframesize,8);          end;      end;    function tcpuprocinfo.calc_stackframe_size:longint;      var         firstfloatreg,lastfloatreg,         r : byte;         floatsavesize : aword;         regs: tcpuregisterset;      begin        if GenerateThumbCode or (pi_estimatestacksize in flags) then          result:=stackframesize        else          begin            maxpushedparasize:=align(maxpushedparasize,max(current_settings.alignment.localalignmin,4));            floatsavesize:=0;            case current_settings.fputype of              fpu_fpa,              fpu_fpa10,              fpu_fpa11:                begin                  { save floating point registers? }                  firstfloatreg:=RS_NO;                  lastfloatreg:=RS_NO;                  regs:=cg.rg[R_FPUREGISTER].used_in_proc-paramanager.get_volatile_registers_fpu(pocall_stdcall);                  for r:=RS_F0 to RS_F7 do                    if r in regs then                      begin                        if firstfloatreg=RS_NO then                          firstfloatreg:=r;                        lastfloatreg:=r;                      end;                  if firstfloatreg<>RS_NO then                    floatsavesize:=(lastfloatreg-firstfloatreg+1)*12;                end;              fpu_vfpv2,              fpu_vfpv3,              fpu_vfpv4,              fpu_vfpv3_d16:                begin                  floatsavesize:=0;                  regs:=cg.rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall);                  for r:=RS_D0 to RS_D31 do                    if r in regs then                      inc(floatsavesize,8);                end;              fpu_fpv4_s16:                begin                  floatsavesize:=0;                  regs:=cg.rg[R_MMREGISTER].used_in_proc-paramanager.get_volatile_registers_mm(pocall_stdcall);                  for r:=RS_D0 to RS_D15 do                    if r in regs then                      inc(floatsavesize,8);                end;            end;            floatsavesize:=align(floatsavesize,max(current_settings.alignment.localalignmin,4));            result:=Align(tg.direction*tg.lasttemp,max(current_settings.alignment.localalignmin,4))+maxpushedparasize+aint(floatsavesize);            { Note: in cgcpu "-floatregstart" is subtracted -> reason based on                "adding floatregstart" to avoid double negation              tg.direction=1 -> no framepointer ->                1) save used int registers                2) allocate stacksize (= subtracting result, which is positive,                   from the stackpointer)                3) add floatregstart to the stackpointer to get the offset where                   to store the floating point registers (-> floatregstart                   should be positive)                4) store the floating point registers from this offset with IA                   (i.e., this offset and higher addresses -> offset should                    point to lower end of area)               -> newsp+(result) points to lower end of saved int registers area               -> newsp+(result-floatsavesize) points to lower end of float reg                  saving area              tg.direction=-1 -> with framepointer ->                1) save stack pointer in framepointer                2) save used int registers using stackpointer                3) allocate stacksize (= subtracting result, which is positive,                   from the stack pointer)                4) add floatregstart" to the framepointer to get the offset                   where to store the floating point registers (-> floatregstart                   should be negative)                5) store the floating point registers from this offset with IA                   (i.e., this offset and higher addresses -> offset should                    point to lower end of area)                o in this case, firsttemp starts right after the saved int                  registers area (or a bit further, because it's calculated for                  the worst-case scenario, when all non-volative integer                  registers have to be saved) -> we store the floating point                  registers between the last temp and the parameter pushing area               -> fp+(-result) points to the top of the stack (= end of                  parameter pushing area)               -> fp+(-result+maxpushedparasize) points to the start of the                  parameter pushing area = lower end of float reg saving area            }            if tg.direction=1 then              floatregstart:=result-aint(floatsavesize)            else              floatregstart:=-result+maxpushedparasize;          end;      end;    procedure tcpuprocinfo.init_framepointer;      begin        if (target_info.system in systems_darwin) or GenerateThumbCode then          begin            RS_FRAME_POINTER_REG:=RS_R7;            NR_FRAME_POINTER_REG:=NR_R7;          end        else          begin            RS_FRAME_POINTER_REG:=RS_R11;            NR_FRAME_POINTER_REG:=NR_R11;          end;      end;    procedure tcpuprocinfo.generate_parameter_info;      begin       tcpuprocdef(procdef).total_stackframe_size:=stackframesize;       inherited generate_parameter_info;      end;    procedure tcpuprocinfo.allocate_got_register(list: TAsmList);      begin        { darwin doesn't use a got }        if tf_pic_uses_got in target_info.flags then          got := cg.getaddressregister(list);      end;    procedure tcpuprocinfo.postprocess_code;      begin        { because of the limited constant size of the arm, all data access is done pc relative }        finalizearmcode(aktproccode,aktlocaldata);      end;    procedure tcpuprocinfo.allocate_tls_register(list: TAsmList);      begin        current_procinfo.tlsoffset:=cg.getaddressregister(list);      end;begin   cprocinfo:=tcpuprocinfo;end.
 |