| 1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761777177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005200620072008200920102011201220132014201520162017201820192020202120222023202420252026202720282029203020312032203320342035203620372038203920402041204220432044204520462047204820492050205120522053205420552056205720582059206020612062206320642065206620672068206920702071207220732074207520762077207820792080208120822083208420852086208720882089209020912092209320942095209620972098209921002101210221032104210521062107210821092110211121122113211421152116211721182119212021212122212321242125212621272128212921302131213221332134213521362137213821392140214121422143214421452146214721482149215021512152 | {    Copyright (c) 1998-2002 by Florian Klaempfl    This unit implements the base class for the register allocator    This program is free software; you can redistribute it and/or modify    it under the terms of the GNU General Public License as published by    the Free Software Foundation; either version 2 of the License, or    (at your option) any later version.    This program is distributed in the hope that it will be useful,    but WITHOUT ANY WARRANTY; without even the implied warranty of    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the    GNU General Public License for more details.    You should have received a copy of the GNU General Public License    along with this program; if not, write to the Free Software    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. ****************************************************************************}{$i fpcdefs.inc}{ Allow duplicate allocations, can be used to get the .s file written }{ $define ALLOWDUPREG}unit rgobj;  interface    uses      cutils, cpubase,      aasmbase,aasmtai,aasmdata,aasmcpu,      cclasses,globtype,cgbase,cgutils,      cpuinfo      ;    type      {        The interference bitmap contains of 2 layers:          layer 1 - 256*256 blocks with pointers to layer 2 blocks          layer 2 - blocks of 32*256 (32 bytes = 256 bits)      }      Tinterferencebitmap2 = array[byte] of set of byte;      Pinterferencebitmap2 = ^Tinterferencebitmap2;      Tinterferencebitmap1 = array[byte] of Pinterferencebitmap2;      pinterferencebitmap1 = ^tinterferencebitmap1;      Tinterferencebitmap=class      private        maxx1,        maxy1    : byte;        fbitmap  : pinterferencebitmap1;        function getbitmap(x,y:tsuperregister):boolean;        procedure setbitmap(x,y:tsuperregister;b:boolean);      public        constructor create;        destructor destroy;override;        property bitmap[x,y:tsuperregister]:boolean read getbitmap write setbitmap;default;      end;      Tmovelistheader=record        count,        maxcount,        sorted_until : cardinal;      end;      Tmovelist=record        header : Tmovelistheader;        data : array[tsuperregister] of Tlinkedlistitem;      end;      Pmovelist=^Tmovelist;      {In the register allocator we keep track of move instructions.       These instructions are moved between five linked lists. There       is also a linked list per register to keep track about the moves       it is associated with. Because we need to determine quickly in       which of the five lists it is we add anu enumeradtion to each       move instruction.}      Tmoveset=(ms_coalesced_moves,ms_constrained_moves,ms_frozen_moves,                ms_worklist_moves,ms_active_moves);      Tmoveins=class(Tlinkedlistitem)        moveset:Tmoveset;        x,y:Tsuperregister;      end;      Treginfoflag=(ri_coalesced,ri_selected);      Treginfoflagset=set of Treginfoflag;      Treginfo=record        live_start,        live_end   : Tai;        subreg   : tsubregister;        alias    : Tsuperregister;        { The register allocator assigns each register a colour }        colour   : Tsuperregister;        movelist : Pmovelist;        adjlist  : Psuperregisterworklist;        degree   : TSuperregister;        flags    : Treginfoflagset;        weight   : longint;      end;      Preginfo=^TReginfo;      tspillreginfo = record        { a single register may appear more than once in an instruction,          but with different subregister types -> store all subregister types          that occur, so we can add the necessary constraints for the inline          register that will have to replace it }        spillregconstraints : set of TSubRegister;        orgreg : tsuperregister;        tempreg : tregister;        regread,regwritten, mustbespilled: boolean;      end;      tspillregsinfo = array[0..3] of tspillreginfo;      Tspill_temp_list=array[tsuperregister] of Treference;      {#------------------------------------------------------------------      This class implements the default register allocator. It is used by the      code generator to allocate and free registers which might be valid      across nodes. It also contains utility routines related to registers.      Some of the methods in this class should be overridden      by cpu-specific implementations.      --------------------------------------------------------------------}      trgobj=class        preserved_by_proc : tcpuregisterset;        used_in_proc : tcpuregisterset;        constructor create(Aregtype:Tregistertype;                           Adefaultsub:Tsubregister;                           const Ausable:array of tsuperregister;                           Afirst_imaginary:Tsuperregister;                           Apreserved_by_proc:Tcpuregisterset);        destructor destroy;override;        {# Allocate a register. An internalerror will be generated if there is         no more free registers which can be allocated.}        function getregister(list:TAsmList;subreg:Tsubregister):Tregister;virtual;        {# Get the register specified.}        procedure getcpuregister(list:TAsmList;r:Tregister);virtual;        procedure ungetcpuregister(list:TAsmList;r:Tregister);virtual;        {# Get multiple registers specified.}        procedure alloccpuregisters(list:TAsmList;const r:Tcpuregisterset);virtual;        {# Free multiple registers specified.}        procedure dealloccpuregisters(list:TAsmList;const r:Tcpuregisterset);virtual;        function uses_registers:boolean;virtual;        procedure add_reg_instruction(instr:Tai;r:tregister;aweight:longint);        procedure add_move_instruction(instr:Taicpu);        {# Do the register allocation.}        procedure do_register_allocation(list:TAsmList;headertai:tai);virtual;        { Adds an interference edge.          don't move this to the protected section, the arm cg requires to access this (FK) }        procedure add_edge(u,v:Tsuperregister);        { translates a single given imaginary register to it's real register }        procedure translate_register(var reg : tregister);      protected        regtype           : Tregistertype;        { default subregister used }        defaultsub        : tsubregister;        live_registers:Tsuperregisterworklist;        { can be overridden to add cpu specific interferences }        procedure add_cpu_interferences(p : tai);virtual;        procedure add_constraints(reg:Tregister);virtual;        function  get_alias(n:Tsuperregister):Tsuperregister;        function  getregisterinline(list:TAsmList;const subregconstraints:Tsubregisterset):Tregister;        procedure ungetregisterinline(list:TAsmList;r:Tregister);        function  get_spill_subreg(r : tregister) : tsubregister;virtual;        function  do_spill_replace(list:TAsmList;instr:taicpu;orgreg:tsuperregister;const spilltemp:treference):boolean;virtual;        procedure do_spill_read(list:TAsmList;pos:tai;const spilltemp:treference;tempreg:tregister);virtual;        procedure do_spill_written(list:TAsmList;pos:tai;const spilltemp:treference;tempreg:tregister);virtual;        function instr_spill_register(list:TAsmList;                                      instr:taicpu;                                      const r:Tsuperregisterset;                                      const spilltemplist:Tspill_temp_list): boolean;virtual;      private        int_live_range_direction: TRADirection;        {# First imaginary register.}        first_imaginary   : Tsuperregister;        {# Highest register allocated until now.}        reginfo           : PReginfo;        maxreginfo,        maxreginfoinc,        maxreg            : Tsuperregister;        usable_registers_cnt : word;        usable_registers  : array[0..maxcpuregister-1] of tsuperregister;        ibitmap           : Tinterferencebitmap;        spillednodes,        simplifyworklist,        freezeworklist,        spillworklist,        coalescednodes,        selectstack       : tsuperregisterworklist;        worklist_moves,        active_moves,        frozen_moves,        coalesced_moves,        constrained_moves : Tlinkedlist;        extended_backwards,        backwards_was_first : tbitset;{$ifdef EXTDEBUG}        procedure writegraph(loopidx:longint);{$endif EXTDEBUG}        {# Disposes of the reginfo array.}        procedure dispose_reginfo;        {# Prepare the register colouring.}        procedure prepare_colouring;        {# Clean up after register colouring.}        procedure epilogue_colouring;        {# Colour the registers; that is do the register allocation.}        procedure colour_registers;        procedure insert_regalloc_info(list:TAsmList;u:tsuperregister);        procedure insert_regalloc_info_all(list:TAsmList);        procedure generate_interference_graph(list:TAsmList;headertai:tai);        { translates the registers in the given assembler list }        procedure translate_registers(list:TAsmList);        function  spill_registers(list:TAsmList;headertai:tai):boolean;virtual;        function  getnewreg(subreg:tsubregister):tsuperregister;        procedure add_edges_used(u:Tsuperregister);        procedure add_to_movelist(u:Tsuperregister;data:Tlinkedlistitem);        function move_related(n:Tsuperregister):boolean;        procedure make_work_list;        procedure sort_simplify_worklist;        procedure enable_moves(n:Tsuperregister);        procedure decrement_degree(m:Tsuperregister);        procedure simplify;        procedure add_worklist(u:Tsuperregister);        function adjacent_ok(u,v:Tsuperregister):boolean;        function conservative(u,v:Tsuperregister):boolean;        procedure combine(u,v:Tsuperregister);        procedure coalesce;        procedure freeze_moves(u:Tsuperregister);        procedure freeze;        procedure select_spill;        procedure assign_colours;        procedure clear_interferences(u:Tsuperregister);        procedure set_live_range_direction(dir: TRADirection);       public        property live_range_direction: TRADirection read int_live_range_direction write set_live_range_direction;      end;    const      first_reg = 0;      last_reg = high(tsuperregister)-1;      maxspillingcounter = 20;  implementation    uses       systems,fmodule,globals,       verbose,tgobj,procinfo;    procedure sort_movelist(ml:Pmovelist);    {Ok, sorting pointers is silly, but it does the job to make Trgobj.combine     faster.}    var h,i,p:longword;        t:Tlinkedlistitem;    begin      with ml^ do        begin          if header.count<2 then            exit;          p:=1;          while 2*cardinal(p)<header.count do            p:=2*p;          while p<>0 do            begin              for h:=p to header.count-1 do                begin                  i:=h;                  t:=data[i];                  repeat                    if ptruint(data[i-p])<=ptruint(t) then                      break;                    data[i]:=data[i-p];                    dec(i,p);                  until i<p;                  data[i]:=t;                end;              p:=p shr 1;            end;          header.sorted_until:=header.count-1;        end;    end;{******************************************************************************                              tinterferencebitmap******************************************************************************}    constructor tinterferencebitmap.create;      begin        inherited create;        maxx1:=1;        getmem(fbitmap,sizeof(tinterferencebitmap1)*2);        fillchar(fbitmap^,sizeof(tinterferencebitmap1)*2,0);      end;    destructor tinterferencebitmap.destroy;    var i,j:byte;    begin      for i:=0 to maxx1 do        for j:=0 to maxy1 do          if assigned(fbitmap[i,j]) then            dispose(fbitmap[i,j]);      freemem(fbitmap);    end;    function tinterferencebitmap.getbitmap(x,y:tsuperregister):boolean;      var        page : pinterferencebitmap2;      begin        result:=false;        if (x shr 8>maxx1) then          exit;        page:=fbitmap[x shr 8,y shr 8];        result:=assigned(page) and          ((x and $ff) in page^[y and $ff]);      end;    procedure tinterferencebitmap.setbitmap(x,y:tsuperregister;b:boolean);      var        x1,y1 : byte;      begin        x1:=x shr 8;        y1:=y shr 8;        if x1>maxx1 then          begin            reallocmem(fbitmap,sizeof(tinterferencebitmap1)*(x1+1));            fillchar(fbitmap[maxx1+1],sizeof(tinterferencebitmap1)*(x1-maxx1),0);            maxx1:=x1;          end;        if not assigned(fbitmap[x1,y1]) then          begin            if y1>maxy1 then              maxy1:=y1;            new(fbitmap[x1,y1]);            fillchar(fbitmap[x1,y1]^,sizeof(tinterferencebitmap2),0);          end;        if b then          include(fbitmap[x1,y1]^[y and $ff],(x and $ff))        else          exclude(fbitmap[x1,y1]^[y and $ff],(x and $ff));      end;{******************************************************************************                                trgobj******************************************************************************}    constructor trgobj.create(Aregtype:Tregistertype;                              Adefaultsub:Tsubregister;                              const Ausable:array of tsuperregister;                              Afirst_imaginary:Tsuperregister;                              Apreserved_by_proc:Tcpuregisterset);       var         i : cardinal;       begin         { empty super register sets can cause very strange problems }         if high(Ausable)=-1 then           internalerror(200210181);         live_range_direction:=rad_forward;         first_imaginary:=Afirst_imaginary;         maxreg:=Afirst_imaginary;         regtype:=Aregtype;         defaultsub:=Adefaultsub;         preserved_by_proc:=Apreserved_by_proc;         // default value set by newinstance         // used_in_proc:=[];         live_registers.init;         { Get reginfo for CPU registers }         maxreginfo:=first_imaginary;         maxreginfoinc:=16;         worklist_moves:=Tlinkedlist.create;         reginfo:=allocmem(first_imaginary*sizeof(treginfo));         for i:=0 to first_imaginary-1 do           begin             reginfo[i].degree:=high(tsuperregister);             reginfo[i].alias:=RS_INVALID;           end;         { Usable registers }         // default value set by constructor         // fillchar(usable_registers,sizeof(usable_registers),0);         for i:=low(Ausable) to high(Ausable) do           usable_registers[i]:=Ausable[i];         usable_registers_cnt:=high(Ausable)+1;         { Initialize Worklists }         spillednodes.init;         simplifyworklist.init;         freezeworklist.init;         spillworklist.init;         coalescednodes.init;         selectstack.init;      end;    destructor trgobj.destroy;    begin      spillednodes.done;      simplifyworklist.done;      freezeworklist.done;      spillworklist.done;      coalescednodes.done;      selectstack.done;      live_registers.done;      worklist_moves.free;      dispose_reginfo;      extended_backwards.free;      backwards_was_first.free;    end;    procedure Trgobj.dispose_reginfo;    var i:cardinal;    begin      if reginfo<>nil then        begin          for i:=0 to maxreg-1 do            with reginfo[i] do              begin                if adjlist<>nil then                  dispose(adjlist,done);                if movelist<>nil then                  dispose(movelist);              end;          freemem(reginfo);          reginfo:=nil;        end;    end;    function trgobj.getnewreg(subreg:tsubregister):tsuperregister;      var        oldmaxreginfo : tsuperregister;      begin        result:=maxreg;        inc(maxreg);        if maxreg>=last_reg then          Message(parser_f_too_complex_proc);        if maxreg>=maxreginfo then          begin            oldmaxreginfo:=maxreginfo;            { Prevent overflow }            if maxreginfoinc>last_reg-maxreginfo then              maxreginfo:=last_reg            else              begin                inc(maxreginfo,maxreginfoinc);                if maxreginfoinc<256 then                  maxreginfoinc:=maxreginfoinc*2;              end;            reallocmem(reginfo,maxreginfo*sizeof(treginfo));            { Do we really need it to clear it ? At least for 1.0.x (PFV) }            fillchar(reginfo[oldmaxreginfo],(maxreginfo-oldmaxreginfo)*sizeof(treginfo),0);          end;        reginfo[result].subreg:=subreg;      end;    function trgobj.getregister(list:TAsmList;subreg:Tsubregister):Tregister;      begin        {$ifdef EXTDEBUG}        if reginfo=nil then          InternalError(2004020901);        {$endif EXTDEBUG}        if defaultsub=R_SUBNONE then          result:=newreg(regtype,getnewreg(R_SUBNONE),R_SUBNONE)        else          result:=newreg(regtype,getnewreg(subreg),subreg);      end;    function trgobj.uses_registers:boolean;      begin        result:=(maxreg>first_imaginary);      end;    procedure trgobj.ungetcpuregister(list:TAsmList;r:Tregister);      begin        if (getsupreg(r)>=first_imaginary) then          InternalError(2004020901);        list.concat(Tai_regalloc.dealloc(r,nil));      end;    procedure trgobj.getcpuregister(list:TAsmList;r:Tregister);      var        supreg:Tsuperregister;      begin        supreg:=getsupreg(r);        if supreg>=first_imaginary then          internalerror(2003121503);        include(used_in_proc,supreg);        list.concat(Tai_regalloc.alloc(r,nil));      end;    procedure trgobj.alloccpuregisters(list:TAsmList;const r:Tcpuregisterset);    var i:cardinal;    begin      for i:=0 to first_imaginary-1 do        if i in r then          getcpuregister(list,newreg(regtype,i,defaultsub));    end;    procedure trgobj.dealloccpuregisters(list:TAsmList;const r:Tcpuregisterset);    var i:cardinal;    begin      for i:=0 to first_imaginary-1 do        if i in r then          ungetcpuregister(list,newreg(regtype,i,defaultsub));    end;    procedure trgobj.do_register_allocation(list:TAsmList;headertai:tai);      var        spillingcounter:byte;        endspill:boolean;      begin        { Insert regalloc info for imaginary registers }        insert_regalloc_info_all(list);        ibitmap:=tinterferencebitmap.create;        generate_interference_graph(list,headertai);        { Don't do the real allocation when -sr is passed }        if (cs_no_regalloc in current_settings.globalswitches) then          exit;        {Do register allocation.}        spillingcounter:=0;        repeat          prepare_colouring;          colour_registers;          epilogue_colouring;          endspill:=true;          if spillednodes.length<>0 then            begin              inc(spillingcounter);              if spillingcounter>maxspillingcounter then                begin{$ifdef EXTDEBUG}                  { Only exit here so the .s file is still generated. Assembling                    the file will still trigger an error }                  exit;{$else}                  internalerror(200309041);{$endif}                end;              endspill:=not spill_registers(list,headertai);            end;        until endspill;        ibitmap.free;        translate_registers(list);        { we need the translation table for debugging info and verbose assembler output (FK)          dispose_reginfo;        }      end;    procedure trgobj.add_constraints(reg:Tregister);    begin    end;    procedure trgobj.add_edge(u,v:Tsuperregister);    {This procedure will add an edge to the virtual interference graph.}      procedure addadj(u,v:Tsuperregister);      begin        with reginfo[u] do          begin            if adjlist=nil then              new(adjlist,init);            adjlist^.add(v);          end;      end;    begin      if (u<>v) and not(ibitmap[v,u]) then        begin          ibitmap[v,u]:=true;          ibitmap[u,v]:=true;          {Precoloured nodes are not stored in the interference graph.}          if (u>=first_imaginary) then            addadj(u,v);          if (v>=first_imaginary) then            addadj(v,u);        end;    end;    procedure trgobj.add_edges_used(u:Tsuperregister);    var i:cardinal;    begin      with live_registers do        if length>0 then          for i:=0 to length-1 do            add_edge(u,get_alias(buf^[i]));    end;{$ifdef EXTDEBUG}    procedure trgobj.writegraph(loopidx:longint);    {This procedure writes out the current interference graph in the    register allocator.}    var f:text;        i,j:cardinal;    begin      assign(f,'igraph'+tostr(loopidx));      rewrite(f);      writeln(f,'Interference graph');      writeln(f);      write(f,'    ');      for i:=0 to 15 do        for j:=0 to 15 do          write(f,hexstr(i,1));      writeln(f);      write(f,'    ');      for i:=0 to 15 do        write(f,'0123456789ABCDEF');      writeln(f);      for i:=0 to maxreg-1 do        begin          write(f,hexstr(i,2):4);          for j:=0 to maxreg-1 do            if ibitmap[i,j] then              write(f,'*')            else              write(f,'-');          writeln(f);        end;      close(f);    end;{$endif EXTDEBUG}    procedure trgobj.add_to_movelist(u:Tsuperregister;data:Tlinkedlistitem);    begin      with reginfo[u] do        begin          if movelist=nil then            begin              { don't use sizeof(tmovelistheader), because that ignores alignment }              getmem(movelist,ptruint(@movelist^.data)-ptruint(movelist)+60*sizeof(pointer));              movelist^.header.maxcount:=60;              movelist^.header.count:=0;              movelist^.header.sorted_until:=0;            end          else            begin              if movelist^.header.count>=movelist^.header.maxcount then                begin                  movelist^.header.maxcount:=movelist^.header.maxcount*2;                  { don't use sizeof(tmovelistheader), because that ignores alignment }                  reallocmem(movelist,ptruint(@movelist^.data)-ptruint(movelist)+movelist^.header.maxcount*sizeof(pointer));                end;            end;          movelist^.data[movelist^.header.count]:=data;          inc(movelist^.header.count);        end;    end;    procedure trgobj.set_live_range_direction(dir: TRADirection);      begin        if (dir in [rad_backwards,rad_backwards_reinit]) then          begin            if not assigned(extended_backwards) then              begin                { create expects a "size", not a "max bit" parameter -> +1 }                backwards_was_first:=tbitset.create(maxreg+1);                extended_backwards:=tbitset.create(maxreg+1);              end            else              begin                if (dir=rad_backwards_reinit) then                  extended_backwards.clear;                backwards_was_first.clear;              end;            int_live_range_direction:=rad_backwards;          end        else          int_live_range_direction:=rad_forward;      end;    procedure trgobj.add_reg_instruction(instr:Tai;r:tregister;aweight:longint);      var        supreg : tsuperregister;      begin        supreg:=getsupreg(r);{$ifdef extdebug}        if not (cs_no_regalloc in current_settings.globalswitches) and           (supreg>=maxreginfo) then          internalerror(200411061);{$endif extdebug}        if supreg>=first_imaginary then          with reginfo[supreg] do            begin              if aweight>weight then                weight:=aweight;              if (live_range_direction=rad_forward) then                begin                  if not assigned(live_start) then                    live_start:=instr;                  live_end:=instr;                end               else                 begin                   if not extended_backwards.isset(supreg) then                     begin                       extended_backwards.include(supreg);                       live_start := instr;                       if not assigned(live_end) then                         begin                           backwards_was_first.include(supreg);                           live_end := instr;                         end;                     end                   else                     begin                       if backwards_was_first.isset(supreg) then                         live_end := instr;                     end                 end            end;      end;    procedure trgobj.add_move_instruction(instr:Taicpu);    {This procedure notifies a certain as a move instruction so the     register allocator can try to eliminate it.}    var i:Tmoveins;        ssupreg,dsupreg:Tsuperregister;    begin    {$ifdef extdebug}      if (instr.oper[O_MOV_SOURCE]^.typ<>top_reg) or         (instr.oper[O_MOV_DEST]^.typ<>top_reg) then        internalerror(200311291);    {$endif}      i:=Tmoveins.create;      i.moveset:=ms_worklist_moves;      worklist_moves.insert(i);      ssupreg:=getsupreg(instr.oper[O_MOV_SOURCE]^.reg);      add_to_movelist(ssupreg,i);      dsupreg:=getsupreg(instr.oper[O_MOV_DEST]^.reg);      if ssupreg<>dsupreg then        {Avoid adding the same move instruction twice to a single register.}        add_to_movelist(dsupreg,i);      i.x:=ssupreg;      i.y:=dsupreg;    end;    function trgobj.move_related(n:Tsuperregister):boolean;    var i:cardinal;    begin      move_related:=false;      with reginfo[n] do        if movelist<>nil then          with movelist^ do            for i:=0 to header.count-1 do              if Tmoveins(data[i]).moveset in [ms_worklist_moves,ms_active_moves] then                begin                  move_related:=true;                  break;                end;    end;    procedure Trgobj.sort_simplify_worklist;    {Sorts the simplifyworklist by the number of interferences the     registers in it cause. This allows simplify to execute in     constant time.}    var p,h,i,leni,lent:longword;        t:Tsuperregister;        adji,adjt:Psuperregisterworklist;    begin      with simplifyworklist do        begin          if length<2 then            exit;          p:=1;          while 2*p<length do            p:=2*p;          while p<>0 do            begin              for h:=p to length-1 do                begin                  i:=h;                  t:=buf^[i];                  adjt:=reginfo[buf^[i]].adjlist;                  lent:=0;                  if adjt<>nil then                    lent:=adjt^.length;                  repeat                    adji:=reginfo[buf^[i-p]].adjlist;                    leni:=0;                    if adji<>nil then                      leni:=adji^.length;                    if leni<=lent then                      break;                    buf^[i]:=buf^[i-p];                    dec(i,p)                  until i<p;                  buf^[i]:=t;                end;              p:=p shr 1;            end;        end;    end;    procedure trgobj.make_work_list;    var n:cardinal;    begin      {If we have 7 cpu registers, and the degree of a node is 7, we cannot       assign it to any of the registers, thus it is significant.}      for n:=first_imaginary to maxreg-1 do        with reginfo[n] do          begin            if adjlist=nil then              degree:=0            else              degree:=adjlist^.length;            if degree>=usable_registers_cnt then              spillworklist.add(n)            else if move_related(n) then              freezeworklist.add(n)            else              simplifyworklist.add(n);          end;      sort_simplify_worklist;    end;    procedure trgobj.prepare_colouring;    begin      make_work_list;      active_moves:=Tlinkedlist.create;      frozen_moves:=Tlinkedlist.create;      coalesced_moves:=Tlinkedlist.create;      constrained_moves:=Tlinkedlist.create;      selectstack.clear;    end;    procedure trgobj.enable_moves(n:Tsuperregister);    var m:Tlinkedlistitem;        i:cardinal;    begin      with reginfo[n] do        if movelist<>nil then          for i:=0 to movelist^.header.count-1 do            begin              m:=movelist^.data[i];              if Tmoveins(m).moveset in [ms_worklist_moves,ms_active_moves] then                if Tmoveins(m).moveset=ms_active_moves then                  begin                    {Move m from the set active_moves to the set worklist_moves.}                    active_moves.remove(m);                    Tmoveins(m).moveset:=ms_worklist_moves;                    worklist_moves.concat(m);                  end;          end;    end;    procedure Trgobj.decrement_degree(m:Tsuperregister);    var adj : Psuperregisterworklist;        n : tsuperregister;        d,i : cardinal;    begin      with reginfo[m] do        begin          d:=degree;          if d=0 then            internalerror(200312151);          dec(degree);          if d=usable_registers_cnt then            begin              {Enable moves for m.}              enable_moves(m);              {Enable moves for adjacent.}              adj:=adjlist;              if adj<>nil then                for i:=1 to adj^.length do                  begin                    n:=adj^.buf^[i-1];                    if reginfo[n].flags*[ri_selected,ri_coalesced]<>[] then                      enable_moves(n);                  end;              {Remove the node from the spillworklist.}              if not spillworklist.delete(m) then                internalerror(200310145);              if move_related(m) then                freezeworklist.add(m)              else                simplifyworklist.add(m);            end;        end;    end;    procedure trgobj.simplify;    var adj : Psuperregisterworklist;        m,n : Tsuperregister;        i : cardinal;    begin      {We take the element with the least interferences out of the       simplifyworklist. Since the simplifyworklist is now sorted, we       no longer need to search, but we can simply take the first element.}      m:=simplifyworklist.get;      {Push it on the selectstack.}      selectstack.add(m);      with reginfo[m] do        begin          include(flags,ri_selected);          adj:=adjlist;        end;      if adj<>nil then        for i:=1 to adj^.length do          begin            n:=adj^.buf^[i-1];            if (n>=first_imaginary) and               (reginfo[n].flags*[ri_selected,ri_coalesced]=[]) then              decrement_degree(n);          end;    end;    function trgobj.get_alias(n:Tsuperregister):Tsuperregister;    begin      while ri_coalesced in reginfo[n].flags do        n:=reginfo[n].alias;      get_alias:=n;    end;    procedure trgobj.add_worklist(u:Tsuperregister);      begin        if (u>=first_imaginary) and           (not move_related(u)) and           (reginfo[u].degree<usable_registers_cnt) then          begin            if not freezeworklist.delete(u) then              internalerror(200308161); {must be found}            simplifyworklist.add(u);          end;      end;    function trgobj.adjacent_ok(u,v:Tsuperregister):boolean;    {Check wether u and v should be coalesced. u is precoloured.}      function ok(t,r:Tsuperregister):boolean;      begin        ok:=(t<first_imaginary) or            (reginfo[t].degree<usable_registers_cnt) or            ibitmap[r,t];      end;    var adj : Psuperregisterworklist;        i : cardinal;        n : tsuperregister;    begin      with reginfo[v] do        begin          adjacent_ok:=true;          adj:=adjlist;          if adj<>nil then            for i:=1 to adj^.length do              begin                n:=adj^.buf^[i-1];                if (flags*[ri_coalesced,ri_selected]=[]) and not ok(n,u) then                  begin                    adjacent_ok:=false;                    break;                  end;              end;        end;    end;    function trgobj.conservative(u,v:Tsuperregister):boolean;    var adj : Psuperregisterworklist;        done : Tsuperregisterset; {To prevent that we count nodes twice.}        i,k:cardinal;        n : tsuperregister;    begin      k:=0;      supregset_reset(done,false,maxreg);      with reginfo[u] do        begin          adj:=adjlist;          if adj<>nil then            for i:=1 to adj^.length do              begin                n:=adj^.buf^[i-1];                if flags*[ri_coalesced,ri_selected]=[] then                  begin                    supregset_include(done,n);                    if reginfo[n].degree>=usable_registers_cnt then                      inc(k);                  end;              end;        end;      adj:=reginfo[v].adjlist;      if adj<>nil then        for i:=1 to adj^.length do          begin            n:=adj^.buf^[i-1];            if not supregset_in(done,n) and               (reginfo[n].degree>=usable_registers_cnt) and               (reginfo[u].flags*[ri_coalesced,ri_selected]=[]) then              inc(k);          end;      conservative:=(k<usable_registers_cnt);    end;    procedure trgobj.combine(u,v:Tsuperregister);    var adj : Psuperregisterworklist;        i,n,p,q:cardinal;        t : tsuperregister;        searched:Tlinkedlistitem;        found : boolean;    begin      if not freezeworklist.delete(v) then        spillworklist.delete(v);      coalescednodes.add(v);      include(reginfo[v].flags,ri_coalesced);      reginfo[v].alias:=u;      {Combine both movelists. Since the movelists are sets, only add       elements that are not already present. The movelists cannot be       empty by definition; nodes are only coalesced if there is a move       between them. To prevent quadratic time blowup (movelists of       especially machine registers can get very large because of moves       generated during calls) we need to go into disgusting complexity.       (See webtbs/tw2242 for an example that stresses this.)       We want to sort the movelist to be able to search logarithmically.       Unfortunately, sorting the movelist every time before searching       is counter-productive, since the movelist usually grows with a few       items at a time. Therefore, we split the movelist into a sorted       and an unsorted part and search through both. If the unsorted part       becomes too large, we sort.}      if assigned(reginfo[u].movelist) then        begin          {We have to weigh the cost of sorting the list against searching           the cost of the unsorted part. I use factor of 8 here; if the           number of items is less than 8 times the numer of unsorted items,           we'll sort the list.}          with reginfo[u].movelist^ do            if header.count<8*(header.count-header.sorted_until) then              sort_movelist(reginfo[u].movelist);          if assigned(reginfo[v].movelist) then            begin              for n:=0 to reginfo[v].movelist^.header.count-1 do                begin                  {Binary search the sorted part of the list.}                  searched:=reginfo[v].movelist^.data[n];                  p:=0;                  q:=reginfo[u].movelist^.header.sorted_until;                  i:=0;                  if q<>0 then                    repeat                      i:=(p+q) shr 1;                      if ptruint(searched)>ptruint(reginfo[u].movelist^.data[i]) then                        p:=i+1                      else                        q:=i;                    until p=q;                  with reginfo[u].movelist^ do                    if searched<>data[i] then                      begin                        {Linear search the unsorted part of the list.}                        found:=false;                        for i:=header.sorted_until+1 to header.count-1 do                          if searched=data[i] then                            begin                              found:=true;                              break;                            end;                        if not found then                          add_to_movelist(u,searched);                      end;                end;            end;        end;      enable_moves(v);      adj:=reginfo[v].adjlist;      if adj<>nil then        for i:=1 to adj^.length do          begin            t:=adj^.buf^[i-1];            with reginfo[t] do              if not(ri_coalesced in flags) then                begin                  {t has a connection to v. Since we are adding v to u, we                   need to connect t to u. However, beware if t was already                   connected to u...}                  if (ibitmap[t,u]) and not (ri_selected in flags) then                    {... because in that case, we are actually removing an edge                     and the degree of t decreases.}                    decrement_degree(t)                  else                    begin                      add_edge(t,u);                      {We have added an edge to t and u. So their degree increases.                       However, v is added to u. That means its neighbours will                       no longer point to v, but to u instead. Therefore, only the                       degree of u increases.}                      if (u>=first_imaginary) and not (ri_selected in flags) then                        inc(reginfo[u].degree);                    end;                end;          end;      if (reginfo[u].degree>=usable_registers_cnt) and freezeworklist.delete(u) then        spillworklist.add(u);    end;    procedure trgobj.coalesce;    var m:Tmoveins;        x,y,u,v:cardinal;    begin      m:=Tmoveins(worklist_moves.getfirst);      x:=get_alias(m.x);      y:=get_alias(m.y);      if (y<first_imaginary) then        begin          u:=y;          v:=x;        end      else        begin          u:=x;          v:=y;        end;      if (u=v) then        begin          m.moveset:=ms_coalesced_moves;  {Already coalesced.}          coalesced_moves.insert(m);          add_worklist(u);        end      {Do u and v interfere? In that case the move is constrained. Two       precoloured nodes interfere allways. If v is precoloured, by the above       code u is precoloured, thus interference...}      else if (v<first_imaginary) or ibitmap[u,v] then        begin          m.moveset:=ms_constrained_moves;  {Cannot coalesce yet...}          constrained_moves.insert(m);          add_worklist(u);          add_worklist(v);        end      {Next test: is it possible and a good idea to coalesce??}      else if ((u<first_imaginary) and adjacent_ok(u,v)) or              ((u>=first_imaginary) and conservative(u,v)) then        begin          m.moveset:=ms_coalesced_moves;  {Move coalesced!}          coalesced_moves.insert(m);          combine(u,v);          add_worklist(u);        end      else        begin          m.moveset:=ms_active_moves;          active_moves.insert(m);        end;    end;    procedure trgobj.freeze_moves(u:Tsuperregister);    var i:cardinal;        m:Tlinkedlistitem;        v,x,y:Tsuperregister;    begin      if reginfo[u].movelist<>nil then        for i:=0 to reginfo[u].movelist^.header.count-1 do          begin            m:=reginfo[u].movelist^.data[i];            if Tmoveins(m).moveset in [ms_worklist_moves,ms_active_moves] then              begin                x:=Tmoveins(m).x;                y:=Tmoveins(m).y;                if get_alias(y)=get_alias(u) then                  v:=get_alias(x)                else                  v:=get_alias(y);                {Move m from active_moves/worklist_moves to frozen_moves.}                if Tmoveins(m).moveset=ms_active_moves then                  active_moves.remove(m)                else                  worklist_moves.remove(m);                Tmoveins(m).moveset:=ms_frozen_moves;                frozen_moves.insert(m);                if (v>=first_imaginary) and not(move_related(v)) and                   (reginfo[v].degree<usable_registers_cnt) then                  begin                    freezeworklist.delete(v);                    simplifyworklist.add(v);                  end;              end;          end;    end;    procedure trgobj.freeze;    var n:Tsuperregister;    begin      { We need to take a random element out of the freezeworklist. We take        the last element. Dirty code! }      n:=freezeworklist.get;      {Add it to the simplifyworklist.}      simplifyworklist.add(n);      freeze_moves(n);    end;    procedure trgobj.select_spill;    var      n : tsuperregister;      adj : psuperregisterworklist;      max,p,i:word;      minweight: longint;    begin      { We must look for the element with the most interferences in the        spillworklist. This is required because those registers are creating        the most conflicts and keeping them in a register will not reduce the        complexity and even can cause the help registers for the spilling code        to get too much conflicts with the result that the spilling code        will never converge (PFV) }      max:=0;      minweight:=high(longint);      p:=0;      with spillworklist do        begin          {Safe: This procedure is only called if length<>0}          for i:=0 to length-1 do            begin              adj:=reginfo[buf^[i]].adjlist;              if assigned(adj) and                 (                  (adj^.length>max) or                  ((adj^.length=max) and (reginfo[buf^[i]].weight<minweight))                 ) then                begin                  p:=i;                  max:=adj^.length;                  minweight:=reginfo[buf^[i]].weight;                end;            end;          n:=buf^[p];          deleteidx(p);        end;      simplifyworklist.add(n);      freeze_moves(n);    end;    procedure trgobj.assign_colours;    {Assign_colours assigns the actual colours to the registers.}    var adj : Psuperregisterworklist;        i,j,k : cardinal;        n,a,c : Tsuperregister;        colourednodes : Tsuperregisterset;        adj_colours:set of 0..255;        found : boolean;    begin      spillednodes.clear;      {Reset colours}      for n:=0 to maxreg-1 do        reginfo[n].colour:=n;      {Colour the cpu registers...}      supregset_reset(colourednodes,false,maxreg);      for n:=0 to first_imaginary-1 do        supregset_include(colourednodes,n);      {Now colour the imaginary registers on the select-stack.}      for i:=selectstack.length downto 1 do        begin          n:=selectstack.buf^[i-1];          {Create a list of colours that we cannot assign to n.}          adj_colours:=[];          adj:=reginfo[n].adjlist;          if adj<>nil then            for j:=0 to adj^.length-1 do              begin                a:=get_alias(adj^.buf^[j]);                if supregset_in(colourednodes,a) and (reginfo[a].colour<=255) then                  include(adj_colours,reginfo[a].colour);              end;          if regtype=R_INTREGISTER then            include(adj_colours,RS_STACK_POINTER_REG);          {Assume a spill by default...}          found:=false;          {Search for a colour not in this list.}          for k:=0 to usable_registers_cnt-1 do            begin              c:=usable_registers[k];               if not(c in adj_colours) then                 begin                   reginfo[n].colour:=c;                   found:=true;                   supregset_include(colourednodes,n);                   include(used_in_proc,c);                   break;                 end;            end;          if not found then            spillednodes.add(n);        end;      {Finally colour the nodes that were coalesced.}      for i:=1 to coalescednodes.length do        begin          n:=coalescednodes.buf^[i-1];          k:=get_alias(n);          reginfo[n].colour:=reginfo[k].colour;          if reginfo[k].colour<maxcpuregister then            include(used_in_proc,reginfo[k].colour);        end;    end;    procedure trgobj.colour_registers;    begin      repeat        if simplifyworklist.length<>0 then          simplify        else if not(worklist_moves.empty) then          coalesce        else if freezeworklist.length<>0 then          freeze        else if spillworklist.length<>0 then          select_spill;      until (simplifyworklist.length=0) and            worklist_moves.empty and            (freezeworklist.length=0) and            (spillworklist.length=0);      assign_colours;    end;    procedure trgobj.epilogue_colouring;    var      i : cardinal;    begin      worklist_moves.clear;      active_moves.destroy;      active_moves:=nil;      frozen_moves.destroy;      frozen_moves:=nil;      coalesced_moves.destroy;      coalesced_moves:=nil;      constrained_moves.destroy;      constrained_moves:=nil;      for i:=0 to maxreg-1 do        with reginfo[i] do          if movelist<>nil then            begin              dispose(movelist);              movelist:=nil;            end;    end;    procedure trgobj.clear_interferences(u:Tsuperregister);    {Remove node u from the interference graph and remove all collected     move instructions it is associated with.}    var i : word;        v : Tsuperregister;        adj,adj2 : Psuperregisterworklist;    begin      adj:=reginfo[u].adjlist;      if adj<>nil then        begin          for i:=1 to adj^.length do            begin              v:=adj^.buf^[i-1];              {Remove (u,v) and (v,u) from bitmap.}              ibitmap[u,v]:=false;              ibitmap[v,u]:=false;              {Remove (v,u) from adjacency list.}              adj2:=reginfo[v].adjlist;              if adj2<>nil then                begin                  adj2^.delete(u);                  if adj2^.length=0 then                    begin                      dispose(adj2,done);                      reginfo[v].adjlist:=nil;                    end;                end;            end;          {Remove ( u,* ) from adjacency list.}          dispose(adj,done);          reginfo[u].adjlist:=nil;        end;    end;    function trgobj.getregisterinline(list:TAsmList;const subregconstraints:Tsubregisterset):Tregister;      var        p : Tsuperregister;        subreg: tsubregister;      begin        for subreg:=high(tsubregister) downto low(tsubregister) do          if subreg in subregconstraints then            break;        p:=getnewreg(subreg);        live_registers.add(p);        result:=newreg(regtype,p,subreg);        add_edges_used(p);        add_constraints(result);        { also add constraints for other sizes used for this register }        if subreg<>low(tsubregister) then          for subreg:=pred(subreg) downto low(tsubregister) do            if subreg in subregconstraints then              add_constraints(newreg(regtype,getsupreg(result),subreg));      end;    procedure trgobj.ungetregisterinline(list:TAsmList;r:Tregister);      var        supreg:Tsuperregister;      begin        supreg:=getsupreg(r);        live_registers.delete(supreg);        insert_regalloc_info(list,supreg);      end;    procedure trgobj.insert_regalloc_info(list:TAsmList;u:tsuperregister);      var        p : tai;        r : tregister;        palloc,        pdealloc : tai_regalloc;      begin        { Insert regallocs for all imaginary registers }        with reginfo[u] do          begin            r:=newreg(regtype,u,subreg);            if assigned(live_start) then              begin                { Generate regalloc and bind it to an instruction, this                  is needed to find all live registers belonging to an                  instruction during the spilling }                if live_start.typ=ait_instruction then                  palloc:=tai_regalloc.alloc(r,live_start)                else                  palloc:=tai_regalloc.alloc(r,nil);                if live_end.typ=ait_instruction then                  pdealloc:=tai_regalloc.dealloc(r,live_end)                else                  pdealloc:=tai_regalloc.dealloc(r,nil);                { Insert live start allocation before the instruction/reg_a_sync }                list.insertbefore(palloc,live_start);                { Insert live end deallocation before reg allocations                  to reduce conflicts }                p:=live_end;                while assigned(p) and                      assigned(p.previous) and                      (tai(p.previous).typ=ait_regalloc) and                      (tai_regalloc(p.previous).ratype=ra_alloc) and                      (tai_regalloc(p.previous).reg<>r) do                  p:=tai(p.previous);                { , but add release after a reg_a_sync }                if assigned(p) and                   (p.typ=ait_regalloc) and                   (tai_regalloc(p).ratype=ra_sync) then                  p:=tai(p.next);                if assigned(p) then                  list.insertbefore(pdealloc,p)                else                  list.concat(pdealloc);              end;          end;      end;    procedure trgobj.insert_regalloc_info_all(list:TAsmList);      var        supreg : tsuperregister;      begin        { Insert regallocs for all imaginary registers }        for supreg:=first_imaginary to maxreg-1 do          insert_regalloc_info(list,supreg);      end;    procedure trgobj.add_cpu_interferences(p : tai);      begin      end;    procedure trgobj.generate_interference_graph(list:TAsmList;headertai:tai);      var        p : tai;{$ifdef EXTDEBUG}        i : integer;{$endif EXTDEBUG}        supreg : tsuperregister;      begin        { All allocations are available. Now we can generate the          interference graph. Walk through all instructions, we can          start with the headertai, because before the header tai is          only symbols. }        live_registers.clear;        p:=headertai;        while assigned(p) do          begin            if p.typ=ait_regalloc then              with Tai_regalloc(p) do                begin                  if (getregtype(reg)=regtype) then                    begin                      supreg:=getsupreg(reg);                      case ratype of                        ra_alloc :                          begin                            live_registers.add(supreg);                            add_edges_used(supreg);                          end;                        ra_dealloc :                          begin                            live_registers.delete(supreg);                            add_edges_used(supreg);                          end;                      end;                      { constraints needs always to be updated }                      add_constraints(reg);                    end;                end;            add_cpu_interferences(p);            p:=Tai(p.next);          end;{$ifdef EXTDEBUG}        if live_registers.length>0 then          begin            for i:=0 to live_registers.length-1 do              begin                { Only report for imaginary registers }                if live_registers.buf^[i]>=first_imaginary then                  Comment(V_Warning,'Register '+std_regname(newreg(R_INTREGISTER,live_registers.buf^[i],defaultsub))+' not released');              end;          end;{$endif}      end;    procedure trgobj.translate_register(var reg : tregister);      begin        if (getregtype(reg)=regtype) then          setsupreg(reg,reginfo[getsupreg(reg)].colour)        else          internalerror(200602021);      end;    procedure Trgobj.translate_registers(list:TAsmList);      var        hp,p,q:Tai;        i:shortint;{$ifdef arm}        so:pshifterop;{$endif arm}      begin        { Leave when no imaginary registers are used }        if maxreg<=first_imaginary then          exit;        p:=Tai(list.first);        while assigned(p) do          begin            case p.typ of              ait_regalloc:                with Tai_regalloc(p) do                  begin                    if (getregtype(reg)=regtype) then                      begin                        { Only alloc/dealloc is needed for the optimizer, remove                          other regalloc }                        if not(ratype in [ra_alloc,ra_dealloc]) then                          begin                            q:=Tai(next);                            list.remove(p);                            p.free;                            p:=q;                            continue;                          end                        else                          begin                            setsupreg(reg,reginfo[getsupreg(reg)].colour);                            {                              Remove sequences of release and                              allocation of the same register like. Other combinations                              of release/allocate need to stay in the list.                                 # Register X released                                 # Register X allocated                            }                            if assigned(previous) and                               (ratype=ra_alloc) and                               (Tai(previous).typ=ait_regalloc) and                               (Tai_regalloc(previous).reg=reg) and                               (Tai_regalloc(previous).ratype=ra_dealloc) then                              begin                                q:=Tai(next);                                hp:=tai(previous);                                list.remove(hp);                                hp.free;                                list.remove(p);                                p.free;                                p:=q;                                continue;                              end;                          end;                      end;                  end;              ait_varloc:                begin                  if cs_asm_source in current_settings.globalswitches then                    begin                      setsupreg(tai_varloc(p).newlocation,reginfo[getsupreg(tai_varloc(p).newlocation)].colour);                      hp:=Tai_comment.Create(strpnew('Var '+tai_varloc(p).varsym.realname+' located in register '+                        std_regname(tai_varloc(p).newlocation)));                      list.insertafter(hp,p);                    end;                  q:=tai(p.next);                  list.remove(p);                  p.free;                  p:=q;                  continue;                end;              ait_instruction:                with Taicpu(p) do                  begin                    current_filepos:=fileinfo;                    for i:=0 to ops-1 do                      with oper[i]^ do                        case typ of                          Top_reg:                             if (getregtype(reg)=regtype) then                               setsupreg(reg,reginfo[getsupreg(reg)].colour);                          Top_ref:                            begin                              if regtype in [R_INTREGISTER,R_ADDRESSREGISTER] then                                with ref^ do                                  begin                                    if (base<>NR_NO) and                                       (getregtype(base)=regtype) then                                      setsupreg(base,reginfo[getsupreg(base)].colour);                                    if (index<>NR_NO) and                                       (getregtype(index)=regtype) then                                      setsupreg(index,reginfo[getsupreg(index)].colour);                                  end;                            end;{$ifdef arm}                          Top_shifterop:                            begin                              if regtype=R_INTREGISTER then                                begin                                  so:=shifterop;                                  if (so^.rs<>NR_NO) and                                     (getregtype(so^.rs)=regtype) then                                    setsupreg(so^.rs,reginfo[getsupreg(so^.rs)].colour);                                end;                            end;{$endif arm}                        end;                    { Maybe the operation can be removed when                      it is a move and both arguments are the same }                    if is_same_reg_move(regtype) then                      begin                        q:=Tai(p.next);                        list.remove(p);                        p.free;                        p:=q;                        continue;                      end;                  end;            end;            p:=Tai(p.next);          end;        current_filepos:=current_procinfo.exitpos;      end;    function trgobj.spill_registers(list:TAsmList;headertai:tai):boolean;    { Returns true if any help registers have been used }      var        i : cardinal;        t : tsuperregister;        p,q : Tai;        regs_to_spill_set:Tsuperregisterset;        spill_temps : ^Tspill_temp_list;        supreg : tsuperregister;        templist : TAsmList;        size: ptrint;      begin        spill_registers:=false;        live_registers.clear;        for i:=first_imaginary to maxreg-1 do          exclude(reginfo[i].flags,ri_selected);        spill_temps:=allocmem(sizeof(treference)*maxreg);        supregset_reset(regs_to_spill_set,false,$ffff);        { Allocate temps and insert in front of the list }        templist:=TAsmList.create;        {Safe: this procedure is only called if there are spilled nodes.}        with spillednodes do          for i:=0 to length-1 do            begin              t:=buf^[i];              {Alternative representation.}              supregset_include(regs_to_spill_set,t);              {Clear all interferences of the spilled register.}              clear_interferences(t);              {Get a temp for the spilled register, the size must at least equal a complete register,               take also care of the fact that subreg can be larger than a single register like doubles               that occupy 2 registers }              { only force the whole register in case of integers. Storing a register that contains                a single precision value as a double can cause conversion errors on e.g. ARM VFP }              if (regtype=R_INTREGISTER) then                size:=max(tcgsize2size[reg_cgsize(newreg(regtype,t,R_SUBWHOLE))],                               tcgsize2size[reg_cgsize(newreg(regtype,t,reginfo[t].subreg))])              else                size:=tcgsize2size[reg_cgsize(newreg(regtype,t,reginfo[t].subreg))];              tg.gettemp(templist,                         size,size,                         tt_noreuse,spill_temps^[t]);            end;        list.insertlistafter(headertai,templist);        templist.free;        { Walk through all instructions, we can start with the headertai,          because before the header tai is only symbols }        p:=headertai;        while assigned(p) do          begin            case p.typ of              ait_regalloc:                with Tai_regalloc(p) do                  begin                    if (getregtype(reg)=regtype) then                      begin                        {A register allocation of a spilled register can be removed.}                        supreg:=getsupreg(reg);                        if supregset_in(regs_to_spill_set,supreg) then                          begin                            q:=Tai(p.next);                            list.remove(p);                            p.free;                            p:=q;                            continue;                          end                        else                          begin                            case ratype of                              ra_alloc :                               live_registers.add(supreg);                              ra_dealloc :                               live_registers.delete(supreg);                            end;                          end;                      end;                  end;              ait_instruction:                with Taicpu(p) do                  begin                    current_filepos:=fileinfo;                    if instr_spill_register(list,taicpu(p),regs_to_spill_set,spill_temps^) then                      spill_registers:=true;                  end;            end;            p:=Tai(p.next);          end;        current_filepos:=current_procinfo.exitpos;        {Safe: this procedure is only called if there are spilled nodes.}        with spillednodes do          for i:=0 to length-1 do            tg.ungettemp(list,spill_temps^[buf^[i]]);        freemem(spill_temps);      end;    function trgobj.do_spill_replace(list:TAsmList;instr:taicpu;orgreg:tsuperregister;const spilltemp:treference):boolean;      begin        result:=false;      end;    procedure trgobj.do_spill_read(list:TAsmList;pos:tai;const spilltemp:treference;tempreg:tregister);      var        ins:Taicpu;      begin        ins:=spilling_create_load(spilltemp,tempreg);        add_cpu_interferences(ins);        list.insertafter(ins,pos);      end;    procedure Trgobj.do_spill_written(list:TAsmList;pos:tai;const spilltemp:treference;tempreg:tregister);      var        ins:Taicpu;      begin        ins:=spilling_create_store(tempreg,spilltemp);        add_cpu_interferences(ins);        list.insertafter(ins,pos);      end;    function trgobj.get_spill_subreg(r : tregister) : tsubregister;      begin        result:=defaultsub;      end;    function trgobj.instr_spill_register(list:TAsmList;                                         instr:taicpu;                                         const r:Tsuperregisterset;                                         const spilltemplist:Tspill_temp_list): boolean;      var        counter, regindex: longint;        regs: tspillregsinfo;        spilled: boolean;      procedure addreginfo(reg: tregister; operation: topertype);        var          i, tmpindex: longint;          supreg : tsuperregister;        begin          tmpindex := regindex;          supreg:=get_alias(getsupreg(reg));          { did we already encounter this register? }          for i := 0 to pred(regindex) do            if (regs[i].orgreg = supreg) then              begin                tmpindex := i;                break;              end;          if tmpindex > high(regs) then            internalerror(2003120301);          regs[tmpindex].orgreg := supreg;          include(regs[tmpindex].spillregconstraints,get_spill_subreg(reg));          if supregset_in(r,supreg) then            begin              { add/update info on this register }              regs[tmpindex].mustbespilled := true;              case operation of                operand_read:                  regs[tmpindex].regread := true;                operand_write:                  regs[tmpindex].regwritten := true;                operand_readwrite:                  begin                    regs[tmpindex].regread := true;                    regs[tmpindex].regwritten := true;                  end;              end;              spilled := true;            end;          inc(regindex,ord(regindex=tmpindex));        end;      procedure tryreplacereg(var reg: tregister);        var          i: longint;          supreg: tsuperregister;        begin          supreg:=get_alias(getsupreg(reg));          for i:=0 to pred(regindex) do            if (regs[i].mustbespilled) and               (regs[i].orgreg=supreg) then              begin                { Only replace supreg }                setsupreg(reg,getsupreg(regs[i].tempreg));                break;              end;        end;      var        loadpos,        storepos : tai;        oldlive_registers : tsuperregisterworklist;      begin        result := false;        fillchar(regs,sizeof(regs),0);        for counter := low(regs) to high(regs) do          regs[counter].orgreg := RS_INVALID;        spilled := false;        regindex := 0;        { check whether and if so which and how (read/written) this instructions contains          registers that must be spilled }        for counter := 0 to instr.ops-1 do         with instr.oper[counter]^ do          begin            case typ of              top_reg:                begin                  if (getregtype(reg) = regtype) then                    addreginfo(reg,instr.spilling_get_operation_type(counter));                end;              top_ref:                begin                  if regtype in [R_INTREGISTER,R_ADDRESSREGISTER] then                    with ref^ do                      begin                        if (base <> NR_NO) then                          addreginfo(base,instr.spilling_get_operation_type_ref(counter,base));                        if (index <> NR_NO) then                          addreginfo(index,instr.spilling_get_operation_type_ref(counter,index));                      end;                end;{$ifdef ARM}              top_shifterop:                begin                  if regtype in [R_INTREGISTER,R_ADDRESSREGISTER] then                    if shifterop^.rs<>NR_NO then                      addreginfo(shifterop^.rs,operand_read);                end;{$endif ARM}            end;          end;        { if no spilling for this instruction we can leave }        if not spilled then          exit;{$ifdef x86}        { Try replacing the register with the spilltemp. This is useful only          for the i386,x86_64 that support memory locations for several instructions }        for counter := 0 to pred(regindex) do          with regs[counter] do            begin              if mustbespilled then                begin                  if do_spill_replace(list,instr,orgreg,spilltemplist[orgreg]) then                    mustbespilled:=false;                end;            end;{$endif x86}        {          There are registers that need are spilled. We generate the          following code for it. The used positions where code need          to be inserted are marked using #. Note that code is always inserted          before the positions using pos.previous. This way the position is always          the same since pos doesn't change, but pos.previous is modified everytime          new code is inserted.          [            - reg_allocs load spills            - load spills          ]          [#loadpos            - reg_deallocs            - reg_allocs          ]          [            - reg_deallocs for load-only spills            - reg_allocs for store-only spills          ]          [#instr            - original instruction          ]          [            - store spills            - reg_deallocs store spills          ]          [#storepos          ]        }        result := true;        oldlive_registers.copyfrom(live_registers);        { Process all tai_regallocs belonging to this instruction, ignore explicit          inserted regallocs. These can happend for example in i386:             mov ref,ireg26             <regdealloc ireg26, instr=taicpu of lea>             <regalloc edi, insrt=nil>             lea [ireg26+ireg17],edi          All released registers are also added to the live_registers because          they can't be used during the spilling }        loadpos:=tai(instr.previous);        while assigned(loadpos) and              (loadpos.typ=ait_regalloc) and              ((tai_regalloc(loadpos).instr=nil) or               (tai_regalloc(loadpos).instr=instr)) do          begin            { Only add deallocs belonging to the instruction. Explicit inserted deallocs              belong to the previous instruction and not the current instruction }            if (tai_regalloc(loadpos).instr=instr) and               (tai_regalloc(loadpos).ratype=ra_dealloc) then              live_registers.add(getsupreg(tai_regalloc(loadpos).reg));            loadpos:=tai(loadpos.previous);          end;        loadpos:=tai(loadpos.next);        { Load the spilled registers }        for counter := 0 to pred(regindex) do          with regs[counter] do            begin              if mustbespilled and regread then                begin                  tempreg:=getregisterinline(list,regs[counter].spillregconstraints);                  do_spill_read(list,tai(loadpos.previous),spilltemplist[orgreg],tempreg);                end;            end;        { Release temp registers of read-only registers, and add reference of the instruction          to the reginfo }        for counter := 0 to pred(regindex) do          with regs[counter] do            begin              if mustbespilled and regread and (not regwritten) then                begin                  { The original instruction will be the next that uses this register }                  add_reg_instruction(instr,tempreg,1);                  ungetregisterinline(list,tempreg);                end;            end;        { Allocate temp registers of write-only registers, and add reference of the instruction          to the reginfo }        for counter := 0 to pred(regindex) do          with regs[counter] do            begin              if mustbespilled and regwritten then                begin                  { When the register is also loaded there is already a register assigned }                  if (not regread) then                    tempreg:=getregisterinline(list,regs[counter].spillregconstraints);                  { The original instruction will be the next that uses this register, this                    also needs to be done for read-write registers }                  add_reg_instruction(instr,tempreg,1);                end;            end;        { store the spilled registers }        storepos:=tai(instr.next);        for counter := 0 to pred(regindex) do          with regs[counter] do            begin              if mustbespilled and regwritten then                begin                  do_spill_written(list,tai(storepos.previous),spilltemplist[orgreg],tempreg);                  ungetregisterinline(list,tempreg);                end;            end;        { now all spilling code is generated we can restore the live registers. This          must be done after the store because the store can need an extra register          that also needs to conflict with the registers of the instruction }        live_registers.done;        live_registers:=oldlive_registers;        { substitute registers }        for counter:=0 to instr.ops-1 do          with instr.oper[counter]^ do            case typ of              top_reg:                begin                  if (getregtype(reg) = regtype) then                    tryreplacereg(reg);                end;              top_ref:                begin                  if regtype in [R_INTREGISTER,R_ADDRESSREGISTER] then                    begin                      tryreplacereg(ref^.base);                      tryreplacereg(ref^.index);                    end;                end;{$ifdef ARM}              top_shifterop:                begin                  if regtype in [R_INTREGISTER,R_ADDRESSREGISTER] then                    tryreplacereg(shifterop^.rs);                end;{$endif ARM}            end;         {We have modified the instruction; perhaps the new instruction has          certain constraints regarding which imaginary registers interfere          with certain physical registers.}         add_cpu_interferences(instr);      end;end.
 |