12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748174917501751175217531754175517561757175817591760176117621763176417651766176717681769177017711772177317741775177617771778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246 |
- {
- $Id$
- Copyright (c) 1998-2002 by Florian Klaempfl
- This unit implements the base class for the register allocator
- This program is free software; you can redistribute it and/or modify
- it under the terms of the GNU General Public License as published by
- the Free Software Foundation; either version 2 of the License, or
- (at your option) any later version.
- This program is distributed in the hope that it will be useful,
- but WITHOUT ANY WARRANTY; without even the implied warranty of
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- GNU General Public License for more details.
- You should have received a copy of the GNU General Public License
- along with this program; if not, write to the Free Software
- Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
- ****************************************************************************
- }
- {$i fpcdefs.inc}
- { Allow duplicate allocations, can be used to get the .s file written }
- { $define ALLOWDUPREG}
- {#******************************************************************************
- @abstract(Abstract register allocator unit)
- Register allocator introduction.
- Free Pascal uses a Chaitin style register allocator. We use a variant similair
- to the one described in the book "Modern compiler implementation in C" by
- Andrew W. Appel., published by Cambridge University Press.
- The register allocator that is described by Appel uses a much improved way
- of register coalescing, called "iterated register coalescing". Instead
- of doing coalescing as a prepass to the register allocation, the coalescing
- is done inside the register allocator. This has the advantage that the
- register allocator can coalesce very aggresively without introducing spills.
- Reading this book is recommended for a complete understanding. Here is a small
- introduction.
- The code generator thinks it has an infinite amount of registers. Our processor
- has a limited amount of registers. Therefore we must reduce the amount of
- registers until there are less enough to fit into the processors registers.
- Registers can interfere or not interfere. If two imaginary registers interfere
- they cannot be placed into the same psysical register. Reduction of registers
- is done by:
- - "coalescing" Two registers that do not interfere are combined
- into one register.
- - "spilling" A register is changed into a memory location and the generated
- code is modified to use the memory location instead of the register.
- Register allocation is a graph colouring problem. Each register is a colour, and
- if two registers interfere there is a connection between them in the graph.
- In addition to the imaginary registers in the code generator, the psysical
- CPU registers are also present in this graph. This allows us to make
- interferences between imaginary registers and cpu registers. This is very
- usefull for describing archtectural constraints, like for example that
- the div instruction modifies edx, so variables that are in use at that time
- cannot be stored into edx. This can be modelled by making edx interfere
- with those variables.
- Graph colouring is an NP complete problem. Therefore we use an approximation
- that pushes registers to colour on to a stack. This is done in the "simplify"
- procedure.
- The register allocator first checks which registers are a candidate for
- coalescing.
- *******************************************************************************}
- unit rgobj;
- interface
- uses
- cutils, cpubase,
- aasmbase,aasmtai,aasmcpu,
- cclasses,globtype,cgbase,node,
- {$ifdef delphi}
- dmisc,
- {$endif}
- cpuinfo
- ;
- type
- {
- regvarother_longintarray = array[tregisterindex] of longint;
- regvarother_booleanarray = array[tregisterindex] of boolean;
- regvarint_longintarray = array[first_int_supreg..last_int_supreg] of longint;
- regvarint_ptreearray = array[first_int_supreg..last_int_supreg] of tnode;
- }
- tsuperregisterworklist=object
- buflength,
- buflengthinc,
- length,
- head,
- tail : integer;
- buf : ^tsuperregister;
- constructor init;
- destructor done;
- procedure clear;
- procedure next(var i:integer);
- procedure add(s:tsuperregister);
- function get:tsuperregister;
- function getlast:tsuperregister;
- function getidx(i:integer):tsuperregister;
- procedure deleteidx(i:integer);
- function delete(s:tsuperregister):boolean;
- function find(s:tsuperregister):boolean;
- end;
- psuperregisterworklist=^tsuperregisterworklist;
- {
- The interference bitmap contains of 2 layers:
- layer 1 - 256*256 blocks with pointers to layer 2 blocks
- layer 2 - blocks of 32*256 (32 bytes = 256 bits)
- }
- Tinterferencebitmap2 = array[byte] of set of byte;
- Pinterferencebitmap2 = ^Tinterferencebitmap2;
- Tinterferencebitmap1 = array[byte] of Pinterferencebitmap2;
- pinterferencebitmap1 = ^tinterferencebitmap1;
- Tinterferencebitmap=class
- private
- maxx1,
- maxy1 : byte;
- fbitmap : pinterferencebitmap1;
- function getbitmap(x,y:tsuperregister):boolean;
- procedure setbitmap(x,y:tsuperregister;b:boolean);
- public
- constructor create;
- destructor destroy;override;
- property bitmap[x,y:tsuperregister]:boolean read getbitmap write setbitmap;default;
- end;
- Tmovelist=record
- count:cardinal;
- data:array[0..$ffff] of Tlinkedlistitem;
- end;
- Pmovelist=^Tmovelist;
- {In the register allocator we keep track of move instructions.
- These instructions are moved between five linked lists. There
- is also a linked list per register to keep track about the moves
- it is associated with. Because we need to determine quickly in
- which of the five lists it is we add anu enumeradtion to each
- move instruction.}
- Tmoveset=(ms_coalesced_moves,ms_constrained_moves,ms_frozen_moves,
- ms_worklist_moves,ms_active_moves);
- Tmoveins=class(Tlinkedlistitem)
- moveset:Tmoveset;
- { $ifdef ra_debug}
- x,y:Tsuperregister;
- { $endif}
- instruction:Taicpu;
- end;
- Treginfo=record
- alias : Tsuperregister;
- { The register allocator assigns each register a colour }
- colour : Tsuperregister;
- movelist : Pmovelist;
- adjlist : Psuperregisterworklist;
- degree : byte;
- end;
- Preginfo=^TReginfo;
- {#------------------------------------------------------------------
- This class implements the abstract register allocator. It is used by the
- code generator to allocate and free registers which might be valid across
- nodes. It also contains utility routines related to registers.
- Some of the methods in this class should be overriden
- by cpu-specific implementations.
- --------------------------------------------------------------------}
- trgobj=class
- preserved_by_proc : tcpuregisterset;
- used_in_proc : tcpuregisterset;
- // is_reg_var : Tsuperregisterset; {old regvars}
- // reg_var_loaded:Tsuperregisterset; {old regvars}
- constructor create(Aregtype:Tregistertype;
- Adefaultsub:Tsubregister;
- const Ausable:array of tsuperregister;
- Afirst_imaginary:Tsuperregister;
- Apreserved_by_proc:Tcpuregisterset);
- destructor destroy;override;
- {# Allocate a register. An internalerror will be generated if there is
- no more free registers which can be allocated.}
- function getregister(list:Taasmoutput;subreg:Tsubregister):Tregister;
- procedure add_constraints(reg:Tregister);virtual;
- {# Get the register specified.}
- procedure getexplicitregister(list:Taasmoutput;r:Tregister);
- {# Get multiple registers specified.}
- procedure allocexplicitregisters(list:Taasmoutput;r:Tcpuregisterset);
- {# Free multiple registers specified.}
- procedure deallocexplicitregisters(list:Taasmoutput;r:Tcpuregisterset);
- function uses_registers:boolean;
- {# Deallocate any kind of register }
- procedure ungetregister(list:Taasmoutput;r:Tregister);virtual;
- {# Do the register allocation.}
- procedure do_register_allocation(list:Taasmoutput;headertai:tai);
- { procedure resetusableregisters;virtual;}
- { procedure makeregvar(reg:Tsuperregister);}
- {$ifdef EXTDEBUG}
- procedure writegraph(loopidx:longint);
- {$endif EXTDEBUG}
- procedure add_move_instruction(instr:Taicpu);
- {# Prepare the register colouring.}
- procedure prepare_colouring;
- {# Clean up after register colouring.}
- procedure epilogue_colouring;
- {# Colour the registers; that is do the register allocation.}
- procedure colour_registers;
- {# Spills certain registers in the specified assembler list.}
- function spill_registers(list:Taasmoutput;headertai:tai):boolean;
- procedure translate_registers(list:Taasmoutput);
- {# Adds an interference edge.}
- procedure add_edge(u,v:Tsuperregister);
- procedure check_unreleasedregs;
- unusedregs : Tsuperregisterset;
- protected
- regtype : Tregistertype;
- { default subregister used }
- defaultsub : tsubregister;
- {# First imaginary register.}
- first_imaginary : Tsuperregister;
- {# Highest register allocated until now.}
- reginfo : PReginfo;
- maxreginfo,
- maxreginfoinc,
- maxreg : Tsuperregister;
- usable_registers_cnt : integer;
- usable_registers : array[0..maxcpuregister-1] of tsuperregister;
- ibitmap : Tinterferencebitmap;
- spillednodes,
- simplifyworklist,
- freezeworklist,
- spillworklist,
- coalescednodes,
- selectstack : tsuperregisterworklist;
- worklist_moves,
- active_moves,
- frozen_moves,
- coalesced_moves,
- constrained_moves : Tlinkedlist;
- function getnewreg:tsuperregister;
- procedure getregisterinline(list:Taasmoutput;position:Tai;subreg:Tsubregister;var result:Tregister);
- procedure ungetregisterinline(list:Taasmoutput;position:Tai;r:Tregister);
- procedure add_edges_used(u:Tsuperregister);
- procedure add_to_movelist(u:Tsuperregister;data:Tlinkedlistitem);
- function move_related(n:Tsuperregister):boolean;
- procedure make_work_list;
- procedure enable_moves(n:Tsuperregister);
- procedure decrement_degree(m:Tsuperregister);
- procedure simplify;
- function get_alias(n:Tsuperregister):Tsuperregister;
- procedure add_worklist(u:Tsuperregister);
- function adjacent_ok(u,v:Tsuperregister):boolean;
- function conservative(u,v:Tsuperregister):boolean;
- procedure combine(u,v:Tsuperregister);
- procedure coalesce;
- procedure freeze_moves(u:Tsuperregister);
- procedure freeze;
- procedure select_spill;
- procedure assign_colours;
- procedure clear_interferences(u:Tsuperregister);
- end;
- const
- first_reg = 0;
- last_reg = high(tsuperregister)-1;
- maxspillingcounter = 20;
- implementation
- uses
- systems,
- globals,verbose,tgobj,procinfo;
- {******************************************************************************
- tsuperregisterworklist
- ******************************************************************************}
- constructor tsuperregisterworklist.init;
- begin
- length:=0;
- buflength:=0;
- buflengthinc:=16;
- head:=0;
- tail:=0;
- buf:=nil;
- end;
- destructor tsuperregisterworklist.done;
- begin
- if assigned(buf) then
- freemem(buf);
- end;
- procedure tsuperregisterworklist.add(s:tsuperregister);
- var
- oldbuflength : integer;
- newbuf : ^tsuperregister;
- begin
- inc(length);
- { Need to increase buffer length? }
- if length>=buflength then
- begin
- oldbuflength:=buflength;
- inc(buflength,buflengthinc);
- buflengthinc:=buflengthinc*2;
- if buflengthinc>256 then
- buflengthinc:=256;
- { We need to allocate a new block and move data around when the
- tail is wrapped around }
- if tail<head then
- begin
- Getmem(newbuf,buflength*sizeof(tsuperregister));
- move(buf[0],newbuf[oldbuflength-head],tail*sizeof(tsuperregister));
- move(buf[head],newbuf[0],(oldbuflength-head)*sizeof(tsuperregister));
- Freemem(buf);
- buf:=newbuf;
- head:=0;
- tail:=oldbuflength-1;
- end
- else
- Reallocmem(buf,buflength*sizeof(tsuperregister));
- end;
- buf[tail]:=s;
- inc(tail);
- if tail>=buflength then
- tail:=0;
- end;
- procedure tsuperregisterworklist.clear;
- begin
- length:=0;
- tail:=0;
- head:=0;
- end;
- procedure tsuperregisterworklist.next(var i:integer);
- begin
- inc(i);
- if i>=buflength then
- i:=0;
- end;
- function tsuperregisterworklist.getidx(i:integer):tsuperregister;
- begin
- result:=buf[i];
- end;
- procedure tsuperregisterworklist.deleteidx(i:integer);
- begin
- if length=0 then
- internalerror(200310144);
- buf[i]:=buf[head];
- inc(head);
- if head>=buflength then
- head:=0;
- dec(length);
- end;
- function tsuperregisterworklist.get:tsuperregister;
- begin
- if length=0 then
- internalerror(200310142);
- result:=buf[head];
- inc(head);
- if head>=buflength then
- head:=0;
- dec(length);
- end;
- function tsuperregisterworklist.getlast:tsuperregister;
- begin
- if length=0 then
- internalerror(200310143);
- dec(tail);
- if tail<0 then
- tail:=buflength-1;
- result:=buf[tail];
- dec(length);
- end;
- function tsuperregisterworklist.delete(s:tsuperregister):boolean;
- var
- i : integer;
- begin
- result:=false;
- i:=head;
- while (i<>tail) do
- begin
- if buf[i]=s then
- begin
- deleteidx(i);
- result:=true;
- exit;
- end;
- inc(i);
- if i>=buflength then
- i:=0;
- end;
- end;
- function tsuperregisterworklist.find(s:tsuperregister):boolean;
- var
- i : integer;
- begin
- result:=false;
- i:=head;
- while (i<>tail) do
- begin
- if buf[i]=s then
- begin
- result:=true;
- exit;
- end;
- inc(i);
- if i>=buflength then
- i:=0;
- end;
- end;
- {******************************************************************************
- tinterferencebitmap
- ******************************************************************************}
- constructor tinterferencebitmap.create;
- begin
- inherited create;
- maxx1:=1;
- getmem(fbitmap,sizeof(tinterferencebitmap1)*2);
- fillchar(fbitmap^,sizeof(tinterferencebitmap1)*2,0);
- end;
- destructor tinterferencebitmap.destroy;
- var
- i,j : byte;
- begin
- if assigned(fbitmap) then
- begin
- for i:=0 to maxx1 do
- for j:=0 to maxy1 do
- if assigned(fbitmap[i,j]) then
- dispose(fbitmap[i,j]);
- freemem(fbitmap);
- end;
- end;
- function tinterferencebitmap.getbitmap(x,y:tsuperregister):boolean;
- var
- page : pinterferencebitmap2;
- begin
- result:=false;
- if (x shr 8>maxx1) then
- exit;
- page:=fbitmap[x shr 8,y shr 8];
- result:=assigned(page) and
- ((x and $ff) in page^[y and $ff]);
- end;
- procedure tinterferencebitmap.setbitmap(x,y:tsuperregister;b:boolean);
- var
- x1,y1 : byte;
- begin
- x1:=x shr 8;
- y1:=y shr 8;
- if x1>maxx1 then
- begin
- reallocmem(fbitmap,sizeof(tinterferencebitmap1)*(x1+1));
- fillchar(fbitmap[maxx1+1],sizeof(tinterferencebitmap1)*(x1-maxx1),0);
- maxx1:=x1;
- end;
- if not assigned(fbitmap[x1,y1]) then
- begin
- if y1>maxy1 then
- maxy1:=y1;
- new(fbitmap[x1,y1]);
- fillchar(fbitmap[x1,y1]^,sizeof(tinterferencebitmap2),0);
- end;
- if b then
- include(fbitmap[x1,y1]^[y and $ff],(x and $ff))
- else
- exclude(fbitmap[x1,y1]^[y and $ff],(x and $ff));
- end;
- {******************************************************************************
- trgobj
- ******************************************************************************}
- constructor trgobj.create(Aregtype:Tregistertype;
- Adefaultsub:Tsubregister;
- const Ausable:array of tsuperregister;
- Afirst_imaginary:Tsuperregister;
- Apreserved_by_proc:Tcpuregisterset);
- var
- i : Tsuperregister;
- begin
- { empty super register sets can cause very strange problems }
- if high(Ausable)=0 then
- internalerror(200210181);
- first_imaginary:=Afirst_imaginary;
- maxreg:=Afirst_imaginary;
- regtype:=Aregtype;
- defaultsub:=Adefaultsub;
- preserved_by_proc:=Apreserved_by_proc;
- used_in_proc:=[];
- supregset_reset(unusedregs,true);
- { RS_INVALID can't be used }
- supregset_exclude(unusedregs,RS_INVALID);
- ibitmap:=tinterferencebitmap.create;
- { Get reginfo for CPU registers }
- reginfo:=allocmem(first_imaginary*sizeof(treginfo));
- maxreginfo:=first_imaginary;
- maxreginfoinc:=16;
- for i:=0 to first_imaginary-1 do
- reginfo[i].degree:=255;
- worklist_moves:=Tlinkedlist.create;
- { Usable registers }
- fillchar(usable_registers,sizeof(usable_registers),0);
- for i:=low(Ausable) to high(Ausable) do
- usable_registers[i]:=Ausable[i];
- usable_registers_cnt:=high(Ausable)+1;
- { Initialize Worklists }
- spillednodes.init;
- simplifyworklist.init;
- freezeworklist.init;
- spillworklist.init;
- coalescednodes.init;
- selectstack.init;
- end;
- destructor trgobj.destroy;
- var i:Tsuperregister;
- begin
- spillednodes.done;
- simplifyworklist.done;
- freezeworklist.done;
- spillworklist.done;
- coalescednodes.done;
- selectstack.done;
- for i:=0 to maxreg-1 do
- begin
- if reginfo[i].adjlist<>nil then
- dispose(reginfo[i].adjlist,done);
- if reginfo[i].movelist<>nil then
- dispose(reginfo[i].movelist);
- end;
- freemem(reginfo);
- worklist_moves.free;
- ibitmap.free;
- end;
- function trgobj.getnewreg:tsuperregister;
- var
- oldmaxreginfo : tsuperregister;
- begin
- result:=maxreg;
- inc(maxreg);
- if maxreg>=last_reg then
- internalerror(200310146);
- if maxreg>=maxreginfo then
- begin
- oldmaxreginfo:=maxreginfo;
- inc(maxreginfo,maxreginfoinc);
- if maxreginfoinc<256 then
- maxreginfoinc:=maxreginfoinc*2;
- reallocmem(reginfo,maxreginfo*sizeof(treginfo));
- { Do we really need it to clear it ? At least for 1.0.x (PFV) }
- fillchar(reginfo[oldmaxreginfo],(maxreginfo-oldmaxreginfo)*sizeof(treginfo),0);
- end;
- end;
- function trgobj.getregister(list:Taasmoutput;subreg:Tsubregister):Tregister;
- var p:Tsuperregister;
- r:Tregister;
- begin
- p:=getnewreg;
- supregset_exclude(unusedregs,p);
- r:=newreg(regtype,p,subreg);
- list.concat(Tai_regalloc.alloc(r));
- add_edges_used(p);
- add_constraints(r);
- result:=r;
- end;
- function trgobj.uses_registers:boolean;
- begin
- result:=(maxreg>first_imaginary);
- end;
- procedure trgobj.ungetregister(list:Taasmoutput;r:Tregister);
- var supreg:Tsuperregister;
- begin
- supreg:=getsupreg(r);
- if not supregset_in(unusedregs,supreg) then
- begin
- supregset_include(unusedregs,supreg);
- list.concat(Tai_regalloc.dealloc(r));
- add_edges_used(supreg);
- add_constraints(r);
- end;
- end;
- procedure trgobj.getexplicitregister(list:Taasmoutput;r:Tregister);
- var supreg:Tsuperregister;
- begin
- supreg:=getsupreg(r);
- if supregset_in(unusedregs,supreg) then
- begin
- supregset_exclude(unusedregs,supreg);
- if supreg<first_imaginary then
- include(used_in_proc,supreg);
- list.concat(Tai_regalloc.alloc(r));
- add_edges_used(supreg);
- add_constraints(r);
- end
- else
- {$ifndef ALLOWDUPREG}
- internalerror(200301103)
- {$else ALLOWDUPREG}
- list.concat(Tai_regalloc.alloc(r));
- {$endif ALLOWDUPREG}
- ;
- end;
- procedure trgobj.allocexplicitregisters(list:Taasmoutput;r:Tcpuregisterset);
- var reg:Tregister;
- i:Tsuperregister;
- begin
- if unusedregs[0]*r=r then
- begin
- unusedregs[0]:=unusedregs[0]-r;
- used_in_proc:=used_in_proc+r;
- for i:=0 to first_imaginary-1 do
- if i in r then
- begin
- add_edges_used(i);
- reg:=newreg(regtype,i,R_SUBWHOLE);
- list.concat(Tai_regalloc.alloc(reg));
- end;
- end
- else
- {$ifndef ALLOWDUPREG}
- internalerror(200305061)
- {$else ALLOWDUPREG}
- list.concat(Tai_regalloc.alloc(reg));
- {$endif ALLOWDUPREG}
- ;
- end;
- procedure trgobj.deallocexplicitregisters(list:Taasmoutput;r:Tcpuregisterset);
- var reg:Tregister;
- i:Tsuperregister;
- begin
- if unusedregs[0]*r=[] then
- begin
- unusedregs[0]:=unusedregs[0]+r;
- for i:=first_imaginary-1 downto 0 do
- if i in r then
- begin
- reg:=newreg(regtype,i,R_SUBWHOLE);
- list.concat(Tai_regalloc.dealloc(reg));
- end;
- end
- else
- {$ifndef ALLOWDUPREG}
- internalerror(200305061);
- {$else ALLOWDUPREG}
- list.concat(Tai_regalloc.dealloc(reg));
- {$endif ALLOWDUPREG}
- end;
- procedure trgobj.do_register_allocation(list:Taasmoutput;headertai:tai);
- var
- spillingcounter:byte;
- endspill:boolean;
- begin
- {Do register allocation.}
- spillingcounter:=0;
- repeat
- prepare_colouring;
- colour_registers;
- epilogue_colouring;
- endspill:=true;
- if spillednodes.length<>0 then
- begin
- inc(spillingcounter);
- if spillingcounter>maxspillingcounter then
- internalerror(200309041);
- endspill:=not spill_registers(list,headertai);
- end;
- until endspill;
- end;
- procedure trgobj.add_constraints(reg:Tregister);
- begin
- end;
- procedure trgobj.add_edge(u,v:Tsuperregister);
- {This procedure will add an edge to the virtual interference graph.}
- procedure addadj(u,v:Tsuperregister);
- begin
- if reginfo[u].adjlist=nil then
- new(reginfo[u].adjlist,init);
- reginfo[u].adjlist^.add(v);
- end;
- begin
- if (u<>v) and not(ibitmap[v,u]) then
- begin
- ibitmap[v,u]:=true;
- ibitmap[u,v]:=true;
- {Precoloured nodes are not stored in the interference graph.}
- if (u>=first_imaginary) then
- begin
- addadj(u,v);
- inc(reginfo[u].degree);
- end;
- if (v>=first_imaginary) then
- begin
- addadj(v,u);
- inc(reginfo[v].degree);
- end;
- end;
- end;
- procedure trgobj.add_edges_used(u:Tsuperregister);
- var i:Tsuperregister;
- begin
- for i:=0 to maxreg-1 do
- if not(supregset_in(unusedregs,i)) then
- add_edge(u,i);
- end;
- {$ifdef EXTDEBUG}
- procedure trgobj.writegraph(loopidx:longint);
- {This procedure writes out the current interference graph in the
- register allocator.}
- var f:text;
- i,j:Tsuperregister;
- begin
- assign(f,'igraph'+tostr(loopidx));
- rewrite(f);
- writeln(f,'Interference graph');
- writeln(f);
- write(f,' ');
- for i:=0 to 15 do
- for j:=0 to 15 do
- write(f,hexstr(i,1));
- writeln(f);
- write(f,' ');
- for i:=0 to 15 do
- write(f,'0123456789ABCDEF');
- writeln(f);
- for i:=0 to maxreg-1 do
- begin
- write(f,hexstr(i,2):4);
- for j:=0 to maxreg-1 do
- if ibitmap[i,j] then
- write(f,'*')
- else
- write(f,'-');
- writeln(f);
- end;
- close(f);
- end;
- {$endif EXTDEBUG}
- procedure trgobj.add_to_movelist(u:Tsuperregister;data:Tlinkedlistitem);
- begin
- if reginfo[u].movelist=nil then
- begin
- getmem(reginfo[u].movelist,64);
- reginfo[u].movelist^.count:=0;
- end
- else if (reginfo[u].movelist^.count and 15)=15 then
- reallocmem(reginfo[u].movelist,(reginfo[u].movelist^.count+1)*4+64);
- reginfo[u].movelist^.data[reginfo[u].movelist^.count]:=data;
- inc(reginfo[u].movelist^.count);
- end;
- procedure trgobj.add_move_instruction(instr:Taicpu);
- {This procedure notifies a certain as a move instruction so the
- register allocator can try to eliminate it.}
- var i:Tmoveins;
- ssupreg,dsupreg:Tsuperregister;
- begin
- i:=Tmoveins.create;
- i.moveset:=ms_worklist_moves;
- i.instruction:=instr;
- worklist_moves.insert(i);
- ssupreg:=getsupreg(instr.oper[O_MOV_SOURCE]^.reg);
- add_to_movelist(ssupreg,i);
- dsupreg:=getsupreg(instr.oper[O_MOV_DEST]^.reg);
- if ssupreg<>dsupreg then
- {Avoid adding the same move instruction twice to a single register.}
- add_to_movelist(dsupreg,i);
- i.x:=ssupreg;
- i.y:=dsupreg;
- end;
- function trgobj.move_related(n:Tsuperregister):boolean;
- var i:cardinal;
- begin
- move_related:=false;
- if reginfo[n].movelist<>nil then
- begin
- for i:=0 to reginfo[n].movelist^.count-1 do
- if Tmoveins(reginfo[n].movelist^.data[i]).moveset in [ms_worklist_moves,ms_active_moves] then
- begin
- move_related:=true;
- break;
- end;
- end;
- end;
- procedure trgobj.make_work_list;
- var n:Tsuperregister;
- begin
- {If we have 7 cpu registers, and the degree of a node is 7, we cannot
- assign it to any of the registers, thus it is significant.}
- for n:=first_imaginary to maxreg-1 do
- if reginfo[n].degree>=usable_registers_cnt then
- spillworklist.add(n)
- else if move_related(n) then
- freezeworklist.add(n)
- else
- simplifyworklist.add(n);
- end;
- procedure trgobj.prepare_colouring;
- var
- i : integer;
- begin
- make_work_list;
- active_moves:=Tlinkedlist.create;
- frozen_moves:=Tlinkedlist.create;
- coalesced_moves:=Tlinkedlist.create;
- constrained_moves:=Tlinkedlist.create;
- for i:=0 to maxreg-1 do
- reginfo[i].alias:=RS_INVALID;
- coalescednodes.clear;
- selectstack.clear;
- end;
- procedure trgobj.enable_moves(n:Tsuperregister);
- var m:Tlinkedlistitem;
- i:cardinal;
- begin
- if reginfo[n].movelist<>nil then
- for i:=0 to reginfo[n].movelist^.count-1 do
- begin
- m:=reginfo[n].movelist^.data[i];
- if Tmoveins(m).moveset in [ms_worklist_moves,ms_active_moves] then
- begin
- if Tmoveins(m).moveset=ms_active_moves then
- begin
- {Move m from the set active_moves to the set worklist_moves.}
- active_moves.remove(m);
- Tmoveins(m).moveset:=ms_worklist_moves;
- worklist_moves.concat(m);
- end;
- end;
- end;
- end;
- procedure trgobj.decrement_degree(m:Tsuperregister);
- var adj : Psuperregisterworklist;
- d : byte;
- n : tsuperregister;
- i : integer;
- begin
- d:=reginfo[m].degree;
- if reginfo[m].degree>0 then
- dec(reginfo[m].degree);
- if d=usable_registers_cnt then
- begin
- {Enable moves for m.}
- enable_moves(m);
- {Enable moves for adjacent.}
- adj:=reginfo[m].adjlist;
- if adj<>nil then
- begin
- i:=adj^.head;
- while (i<>adj^.tail) do
- begin
- n:=adj^.buf[i];
- if selectstack.find(n) or
- coalescednodes.find(n) then
- enable_moves(n);
- adj^.next(i);
- end;
- end;
- {Remove the node from the spillworklist.}
- if not spillworklist.delete(m) then
- internalerror(200310145);
- if move_related(m) then
- freezeworklist.add(m)
- else
- simplifyworklist.add(m);
- end;
- end;
- procedure trgobj.simplify;
- var adj : Psuperregisterworklist;
- min : byte;
- p,n : Tsuperregister;
- i : integer;
- begin
- {We the element with the least interferences out of the
- simplifyworklist.}
- min:=$ff;
- p:=0;
- n:=0;
- i:=simplifyworklist.head;
- while (i<>simplifyworklist.tail) do
- begin
- adj:=reginfo[simplifyworklist.buf[i]].adjlist;
- if adj=nil then
- begin
- p:=i;
- min:=0;
- break; {We won't find smaller ones.}
- end
- else
- if adj^.length<min then
- begin
- p:=i;
- min:=adj^.length;
- if min=0 then
- break; {We won't find smaller ones.}
- end;
- simplifyworklist.next(i);
- end;
- n:=simplifyworklist.getidx(p);
- simplifyworklist.deleteidx(p);
- {Push it on the selectstack.}
- selectstack.add(n);
- adj:=reginfo[n].adjlist;
- if adj<>nil then
- begin
- i:=adj^.head;
- while (i<>adj^.tail) do
- begin
- n:=adj^.buf[i];
- if (n>first_imaginary) and
- not(selectstack.find(n) or
- coalescednodes.find(n)) then
- decrement_degree(n);
- adj^.next(i);
- end;
- end;
- end;
- function trgobj.get_alias(n:Tsuperregister):Tsuperregister;
- begin
- while coalescednodes.find(n) do
- n:=reginfo[n].alias;
- get_alias:=n;
- end;
- procedure trgobj.add_worklist(u:Tsuperregister);
- begin
- if (u>=first_imaginary) and
- not move_related(u) and
- (reginfo[u].degree<usable_registers_cnt) then
- begin
- if not freezeworklist.delete(u) then
- internalerror(200308161); {must be found}
- simplifyworklist.add(u);
- end;
- end;
- function trgobj.adjacent_ok(u,v:Tsuperregister):boolean;
- {Check wether u and v should be coalesced. u is precoloured.}
- function ok(t,r:Tsuperregister):boolean;
- begin
- ok:=(reginfo[t].degree<usable_registers_cnt) or
- (t<first_imaginary) or
- ibitmap[r,t];
- end;
- var adj : Psuperregisterworklist;
- i : integer;
- n : tsuperregister;
- begin
- adjacent_ok:=true;
- adj:=reginfo[v].adjlist;
- if adj<>nil then
- begin
- i:=adj^.head;
- while (i<>adj^.tail) do
- begin
- n:=adj^.buf[i];
- if not(selectstack.find(n) or
- coalescednodes.find(n)) and
- not ok(n,u) then
- begin
- adjacent_ok:=false;
- break;
- end;
- adj^.next(i);
- end;
- end;
- end;
- function trgobj.conservative(u,v:Tsuperregister):boolean;
- var adj : Psuperregisterworklist;
- done : Tsuperregisterset; {To prevent that we count nodes twice.}
- i,k : integer;
- n : tsuperregister;
- begin
- k:=0;
- supregset_reset(done,false);
- adj:=reginfo[u].adjlist;
- if adj<>nil then
- begin
- i:=adj^.head;
- while (i<>adj^.tail) do
- begin
- n:=adj^.buf[i];
- if not(selectstack.find(n) or
- coalescednodes.find(n)) then
- begin
- supregset_include(done,n);
- if reginfo[n].degree>=usable_registers_cnt then
- inc(k);
- end;
- adj^.next(i);
- end;
- end;
- adj:=reginfo[v].adjlist;
- if adj<>nil then
- begin
- i:=adj^.head;
- while (i<>adj^.tail) do
- begin
- n:=adj^.buf[i];
- if not supregset_in(done,n) and
- (reginfo[n].degree>=usable_registers_cnt) and
- not(selectstack.find(n) or
- coalescednodes.find(n)) then
- inc(k);
- adj^.next(i);
- end;
- end;
- conservative:=(k<usable_registers_cnt);
- end;
- procedure trgobj.combine(u,v:Tsuperregister);
- var add : boolean;
- adj : Psuperregisterworklist;
- i : integer;
- t : tsuperregister;
- n,o : cardinal;
- decrement : boolean;
- begin
- if not freezeworklist.delete(v) then
- spillworklist.delete(v);
- coalescednodes.add(v);
- reginfo[v].alias:=u;
- {Combine both movelists. Since the movelists are sets, only add
- elements that are not already present.}
- if assigned(reginfo[v].movelist) then
- begin
- for n:=0 to reginfo[v].movelist^.count-1 do
- begin
- add:=true;
- for o:=0 to reginfo[u].movelist^.count-1 do
- if reginfo[u].movelist^.data[o]=reginfo[v].movelist^.data[n] then
- begin
- add:=false;
- break;
- end;
- if add then
- add_to_movelist(u,reginfo[v].movelist^.data[n]);
- end;
- enable_moves(v);
- end;
- adj:=reginfo[v].adjlist;
- if adj<>nil then
- begin
- i:=adj^.head;
- while (i<>adj^.tail) do
- begin
- t:=adj^.buf[i];
- if not(selectstack.find(t) or
- coalescednodes.find(t)) then
- begin
- decrement:=(t<>u) and not(ibitmap[u,t]);
- add_edge(t,u);
- { Do not call decrement_degree because it might move nodes between
- lists while the degree does not change (add_edge will increase it).
- Instead, we will decrement manually. (Only if the degree has been
- increased.) }
- if decrement and
- (t>=first_imaginary) and
- (reginfo[t].degree>0) then
- dec(reginfo[t].degree);
- end;
- adj^.next(i);
- end;
- end;
- if (reginfo[u].degree>=usable_registers_cnt) and
- freezeworklist.delete(u) then
- spillworklist.add(u);
- end;
- procedure trgobj.coalesce;
- var m:Tmoveins;
- x,y,u,v:Tsuperregister;
- begin
- m:=Tmoveins(worklist_moves.getfirst);
- x:=get_alias(getsupreg(m.instruction.oper[0]^.reg));
- y:=get_alias(getsupreg(m.instruction.oper[1]^.reg));
- if (y<first_imaginary) then
- begin
- u:=y;
- v:=x;
- end
- else
- begin
- u:=x;
- v:=y;
- end;
- if (u=v) then
- begin
- m.moveset:=ms_coalesced_moves; {Already coalesced.}
- coalesced_moves.insert(m);
- add_worklist(u);
- end
- {Do u and v interfere? In that case the move is constrained. Two
- precoloured nodes interfere allways. If v is precoloured, by the above
- code u is precoloured, thus interference...}
- else if (v<first_imaginary) or ibitmap[u,v] then
- begin
- m.moveset:=ms_constrained_moves; {Cannot coalesce yet...}
- constrained_moves.insert(m);
- add_worklist(u);
- add_worklist(v);
- end
- {Next test: is it possible and a good idea to coalesce??}
- else if ((u<first_imaginary) and adjacent_ok(u,v)) or
- ((u>=first_imaginary) and conservative(u,v)) then
- begin
- m.moveset:=ms_coalesced_moves; {Move coalesced!}
- coalesced_moves.insert(m);
- combine(u,v);
- add_worklist(u);
- end
- else
- begin
- m.moveset:=ms_active_moves;
- active_moves.insert(m);
- end;
- end;
- procedure trgobj.freeze_moves(u:Tsuperregister);
- var i:cardinal;
- m:Tlinkedlistitem;
- v,x,y:Tsuperregister;
- begin
- if reginfo[u].movelist<>nil then
- for i:=0 to reginfo[u].movelist^.count-1 do
- begin
- m:=reginfo[u].movelist^.data[i];
- if Tmoveins(m).moveset in [ms_worklist_moves,ms_active_moves] then
- begin
- x:=getsupreg(Tmoveins(m).instruction.oper[0]^.reg);
- y:=getsupreg(Tmoveins(m).instruction.oper[1]^.reg);
- if get_alias(y)=get_alias(u) then
- v:=get_alias(x)
- else
- v:=get_alias(y);
- {Move m from active_moves/worklist_moves to frozen_moves.}
- if Tmoveins(m).moveset=ms_active_moves then
- active_moves.remove(m)
- else
- worklist_moves.remove(m);
- Tmoveins(m).moveset:=ms_frozen_moves;
- frozen_moves.insert(m);
- if (v>=first_imaginary) and
- not(move_related(v)) and
- (reginfo[v].degree<usable_registers_cnt) then
- begin
- freezeworklist.delete(v);
- simplifyworklist.add(v);
- end;
- end;
- end;
- end;
- procedure trgobj.freeze;
- var n:Tsuperregister;
- begin
- { We need to take a random element out of the freezeworklist. We take
- the last element. Dirty code! }
- n:=freezeworklist.get;
- {Add it to the simplifyworklist.}
- simplifyworklist.add(n);
- freeze_moves(n);
- end;
- procedure trgobj.select_spill;
- var
- n : tsuperregister;
- adj : psuperregisterworklist;
- max,p,i : integer;
- begin
- { We must look for the element with the most interferences in the
- spillworklist. This is required because those registers are creating
- the most conflicts and keeping them in a register will not reduce the
- complexity and even can cause the help registers for the spilling code
- to get too much conflicts with the result that the spilling code
- will never converge (PFV) }
- max:=0;
- p:=0;
- i:=spillworklist.head;
- while (i<>spillworklist.tail) do
- begin
- adj:=reginfo[spillworklist.buf[i]].adjlist;
- if assigned(adj) and
- (adj^.length>max) then
- begin
- p:=i;
- max:=adj^.length;
- end;
- spillworklist.next(i);
- end;
- n:=spillworklist.getidx(p);
- spillworklist.deleteidx(p);
- simplifyworklist.add(n);
- freeze_moves(n);
- end;
- procedure trgobj.assign_colours;
- {Assign_colours assigns the actual colours to the registers.}
- var adj : Psuperregisterworklist;
- i,j,k : integer;
- n,a,c : Tsuperregister;
- adj_colours,
- colourednodes : Tsuperregisterset;
- found : boolean;
- begin
- spillednodes.clear;
- {Reset colours}
- for n:=0 to maxreg-1 do
- reginfo[n].colour:=n;
- {Colour the cpu registers...}
- supregset_reset(colourednodes,false);
- for n:=0 to first_imaginary-1 do
- supregset_include(colourednodes,n);
- {Now colour the imaginary registers on the select-stack.}
- while (selectstack.length>0) do
- begin
- n:=selectstack.getlast;
- {Create a list of colours that we cannot assign to n.}
- supregset_reset(adj_colours,false);
- adj:=reginfo[n].adjlist;
- if adj<>nil then
- begin
- j:=adj^.head;
- while (j<>adj^.tail) do
- begin
- a:=get_alias(adj^.buf[j]);
- if supregset_in(colourednodes,a) then
- supregset_include(adj_colours,reginfo[a].colour);
- adj^.next(j);
- end;
- supregset_include(adj_colours,RS_STACK_POINTER_REG);
- end;
- {Assume a spill by default...}
- found:=false;
- {Search for a colour not in this list.}
- for k:=0 to usable_registers_cnt-1 do
- begin
- c:=usable_registers[k];
- if not(supregset_in(adj_colours,c)) then
- begin
- reginfo[n].colour:=c;
- found:=true;
- supregset_include(colourednodes,n);
- include(used_in_proc,c);
- break;
- end;
- end;
- if not found then
- spillednodes.add(n);
- end;
- {Finally colour the nodes that were coalesced.}
- i:=coalescednodes.head;
- while (i<>coalescednodes.tail) do
- begin
- n:=coalescednodes.buf[i];
- k:=get_alias(n);
- reginfo[n].colour:=reginfo[k].colour;
- include(used_in_proc,reginfo[k].colour);
- coalescednodes.next(i);
- end;
- {$ifdef ra_debug}
- if aktfilepos.line=51 then
- begin
- writeln('colourlist');
- for i:=0 to maxreg-1 do
- writeln(i:4,' ',reginfo[i].colour:4)
- end;
- {$endif ra_debug}
- end;
- procedure trgobj.colour_registers;
- begin
- repeat
- if simplifyworklist.length<>0 then
- simplify
- else if not(worklist_moves.empty) then
- coalesce
- else if freezeworklist.length<>0 then
- freeze
- else if spillworklist.length<>0 then
- select_spill;
- until (simplifyworklist.length=0) and
- worklist_moves.empty and
- (freezeworklist.length=0) and
- (spillworklist.length=0);
- assign_colours;
- end;
- procedure trgobj.epilogue_colouring;
- {
- procedure move_to_worklist_moves(list:Tlinkedlist);
- var p:Tlinkedlistitem;
- begin
- p:=list.first;
- while p<>nil do
- begin
- Tmoveins(p).moveset:=ms_worklist_moves;
- p:=p.next;
- end;
- worklist_moves.concatlist(list);
- end;
- }
- var i:Tsuperregister;
- begin
- worklist_moves.clear;
- {$ifdef Principle_wrong_by_definition}
- {Move everything back to worklist_moves.}
- move_to_worklist_moves(active_moves);
- move_to_worklist_moves(frozen_moves);
- move_to_worklist_moves(coalesced_moves);
- move_to_worklist_moves(constrained_moves);
- {$endif Principle_wrong_by_definition}
- active_moves.destroy;
- active_moves:=nil;
- frozen_moves.destroy;
- frozen_moves:=nil;
- coalesced_moves.destroy;
- coalesced_moves:=nil;
- constrained_moves.destroy;
- constrained_moves:=nil;
- for i:=0 to maxreg-1 do
- if reginfo[i].movelist<>nil then
- begin
- dispose(reginfo[i].movelist);
- reginfo[i].movelist:=0;
- end;
- end;
- procedure trgobj.clear_interferences(u:Tsuperregister);
- {Remove node u from the interference graph and remove all collected
- move instructions it is associated with.}
- var i : integer;
- v : Tsuperregister;
- adj,adj2 : Psuperregisterworklist;
- {$ifdef Principle_wrong_by_definition}
- k,j,count : cardinal;
- m,n : Tmoveins;
- {$endif Principle_wrong_by_definition}
- begin
- adj:=reginfo[u].adjlist;
- if adj<>nil then
- begin
- i:=adj^.head;
- while (i<>adj^.tail) do
- begin
- v:=adj^.buf[i];
- {Remove (u,v) and (v,u) from bitmap.}
- ibitmap[u,v]:=false;
- ibitmap[v,u]:=false;
- {Remove (v,u) from adjacency list.}
- adj2:=reginfo[v].adjlist;
- if adj2<>nil then
- begin
- adj2^.delete(v);
- if adj2^.length=0 then
- begin
- dispose(adj2,done);
- reginfo[v].adjlist:=nil;
- end;
- end;
- adj^.next(i);
- end;
- {Remove ( u,* ) from adjacency list.}
- dispose(adj,done);
- reginfo[u].adjlist:=nil;
- end;
- {$ifdef Principle_wrong_by_definition}
- {Now remove the moves.}
- if movelist[u]<>nil then
- begin
- for j:=0 to movelist[u]^.count-1 do
- begin
- m:=Tmoveins(movelist[u]^.data[j]);
- {Get the other register of the move instruction.}
- v:=m.instruction.oper[0]^.reg.number shr 8;
- if v=u then
- v:=m.instruction.oper[1]^.reg.number shr 8;
- repeat
- repeat
- if (u<>v) and (movelist[v]<>nil) then
- begin
- {Remove the move from it's movelist.}
- count:=movelist[v]^.count-1;
- for k:=0 to count do
- if m=movelist[v]^.data[k] then
- begin
- if k<>count then
- movelist[v]^.data[k]:=movelist[v]^.data[count];
- dec(movelist[v]^.count);
- if count=0 then
- begin
- dispose(movelist[v]);
- movelist[v]:=nil;
- end;
- break;
- end;
- end;
- {The complexity is enourmous: the register might have been
- coalesced. In that case it's movelists have been added to
- it's coalescing alias. (DM)}
- v:=alias[v];
- until v=0;
- {And also register u might have been coalesced.}
- u:=alias[u];
- until u=0;
- case m.moveset of
- ms_coalesced_moves:
- coalesced_moves.remove(m);
- ms_constrained_moves:
- constrained_moves.remove(m);
- ms_frozen_moves:
- frozen_moves.remove(m);
- ms_worklist_moves:
- worklist_moves.remove(m);
- ms_active_moves:
- active_moves.remove(m);
- end;
- end;
- dispose(movelist[u]);
- movelist[u]:=nil;
- end;
- {$endif Principle_wrong_by_definition}
- end;
- procedure trgobj.getregisterinline(list:Taasmoutput;
- position:Tai;subreg:Tsubregister;var result:Tregister);
- var p:Tsuperregister;
- r:Tregister;
- begin
- p:=getnewreg;
- supregset_exclude(unusedregs,p);
- r:=newreg(regtype,p,subreg);
- if position=nil then
- list.insert(Tai_regalloc.alloc(r))
- else
- list.insertafter(Tai_regalloc.alloc(r),position);
- add_edges_used(p);
- add_constraints(r);
- result:=r;
- end;
- procedure trgobj.ungetregisterinline(list:Taasmoutput;
- position:Tai;r:Tregister);
- var supreg:Tsuperregister;
- begin
- supreg:=getsupreg(r);
- supregset_include(unusedregs,supreg);
- if position=nil then
- list.insert(Tai_regalloc.dealloc(r))
- else
- list.insertafter(Tai_regalloc.dealloc(r),position);
- add_edges_used(supreg);
- add_constraints(r);
- end;
- function trgobj.spill_registers(list:Taasmoutput;headertai:tai):boolean;
- {Returns true if any help registers have been used.}
- var i : integer;
- t : tsuperregister;
- p,q : Tai;
- regs_to_spill_set : Tsuperregisterset;
- spill_temps : ^Tspill_temp_list;
- supreg : tsuperregister;
- templist : taasmoutput;
- begin
- spill_registers:=false;
- supregset_reset(unusedregs,true);
- {Precoloured nodes should have an infinite degree, which we can approach
- by 255.}
- for i:=0 to first_imaginary-1 do
- reginfo[i].degree:=255;
- for i:=first_imaginary to maxreg-1 do
- reginfo[i].degree:=0;
- { exclude(unusedregs,RS_STACK_POINTER_REG);}
- if current_procinfo.framepointer=NR_FRAME_POINTER_REG then
- {Make sure the register allocator won't allocate registers into ebp.}
- supregset_exclude(unusedregs,RS_FRAME_POINTER_REG);
- spill_temps:=allocmem(sizeof(treference)*maxreg);
- supregset_reset(regs_to_spill_set,false);
- { Allocate temps and insert in front of the list }
- templist:=taasmoutput.create;
- i:=spillednodes.head;
- while (i<>spillednodes.tail) do
- begin
- t:=spillednodes.buf[i];
- {Alternative representation.}
- supregset_include(regs_to_spill_set,t);
- {Clear all interferences of the spilled register.}
- clear_interferences(t);
- {Get a temp for the spilled register}
- tg.gettemp(templist,4,tt_noreuse,spill_temps^[t]);
- spillednodes.next(i);
- end;
- list.insertlistafter(headertai,templist);
- templist.free;
- { Walk through all instructions, we can start with the headertai,
- because before the header tai is only symbols }
- p:=headertai;
- while assigned(p) do
- begin
- case p.typ of
- ait_regalloc:
- begin
- if (getregtype(Tai_regalloc(p).reg)=regtype) then
- begin
- {A register allocation of a spilled register can be removed.}
- supreg:=getsupreg(Tai_regalloc(p).reg);
- if supregset_in(regs_to_spill_set,supreg) then
- begin
- q:=Tai(p.next);
- list.remove(p);
- p.free;
- p:=q;
- continue;
- end
- else
- if Tai_regalloc(p).allocation then
- supregset_exclude(unusedregs,supreg)
- else
- supregset_include(unusedregs,supreg);
- end;
- end;
- ait_instruction:
- begin
- aktfilepos:=Taicpu_abstract(p).fileinfo;
- if Taicpu_abstract(p).spill_registers(list,
- @getregisterinline,
- @ungetregisterinline,
- regs_to_spill_set,
- unusedregs,
- spill_temps^) then
- spill_registers:=true;
- if Taicpu_abstract(p).is_move then
- add_move_instruction(Taicpu(p));
- end;
- end;
- p:=Tai(p.next);
- end;
- aktfilepos:=current_procinfo.exitpos;
- i:=spillednodes.head;
- while (i<>spillednodes.tail) do
- begin
- tg.ungettemp(list,spill_temps^[spillednodes.buf[i]]);
- spillednodes.next(i);
- end;
- freemem(spill_temps);
- end;
- procedure Trgobj.translate_registers(list:taasmoutput);
- var hp,p,q:Tai;
- i:shortint;
- r:Preference;
- {$ifdef arm}
- so:pshifterop;
- {$endif arm}
- begin
- { Leave when no imaginary registers are used }
- if maxreg<=first_imaginary then
- exit;
- p:=Tai(list.first);
- while assigned(p) do
- begin
- case p.typ of
- ait_regalloc:
- begin
- if (getregtype(Tai_regalloc(p).reg)=regtype) then
- setsupreg(Tai_regalloc(p).reg,reginfo[getsupreg(Tai_regalloc(p).reg)].colour);
- {
- Remove sequences of release and
- allocation of the same register like:
- # Register X released
- # Register X allocated
- }
- if assigned(p.previous) and
- (Tai(p.previous).typ=ait_regalloc) and
- (Tai_regalloc(p.previous).reg=Tai_regalloc(p).reg) and
- { allocation,deallocation or deallocation,allocation }
- (Tai_regalloc(p.previous).allocation xor Tai_regalloc(p).allocation) then
- begin
- q:=Tai(p.next);
- hp:=tai(p.previous);
- list.remove(hp);
- hp.free;
- list.remove(p);
- p.free;
- p:=q;
- continue;
- end;
- end;
- ait_instruction:
- begin
- for i:=0 to Taicpu_abstract(p).ops-1 do
- case Taicpu_abstract(p).oper[i]^.typ of
- Top_reg:
- if (getregtype(Taicpu_abstract(p).oper[i]^.reg)=regtype) then
- setsupreg(Taicpu_abstract(p).oper[i]^.reg,reginfo[getsupreg(Taicpu_abstract(p).oper[i]^.reg)].colour);
- Top_ref:
- begin
- if regtype=R_INTREGISTER then
- begin
- r:=Taicpu_abstract(p).oper[i]^.ref;
- if r^.base<>NR_NO then
- setsupreg(r^.base,reginfo[getsupreg(r^.base)].colour);
- if r^.index<>NR_NO then
- setsupreg(r^.index,reginfo[getsupreg(r^.index)].colour);
- end;
- end;
- {$ifdef arm}
- Top_shifterop:
- begin
- so:=Taicpu_abstract(p).oper[i]^.shifterop;
- if so^.rs<>NR_NO then
- setsupreg(so^.rs,table[getsupreg(so^.rs)]);
- end;
- {$endif arm}
- end;
- { Maybe the operation can be removed when
- it is a move and both arguments are the same }
- if Taicpu_abstract(p).is_nop then
- begin
- q:=Tai(p.next);
- list.remove(p);
- p.free;
- p:=q;
- continue;
- end;
- end;
- end;
- p:=Tai(p.next);
- end;
- end;
- procedure Trgobj.check_unreleasedregs;
- {$ifdef EXTDEBUG}
- var
- sr : tsuperregister;
- {$endif EXTDEBUG}
- begin
- {$ifdef EXTDEBUG}
- for sr:=first_imaginary to maxreg-1 do
- if not(supregset_in(unusedregs,sr)) then
- Comment(V_Warning,'Register '+std_regname(newreg(R_INTREGISTER,sr,R_SUBNONE))+' not released');
- {$endif EXTDEBUG}
- end;
- end.
- {
- $Log$
- Revision 1.93 2003-10-30 16:22:40 peter
- * call firstpass before allocation and codegeneration is started
- * move leftover code from pass_2.generatecode() to psub
- Revision 1.92 2003/10/29 21:29:14 jonas
- * some ALLOWDUPREG improvements
- Revision 1.91 2003/10/21 15:15:36 peter
- * taicpu_abstract.oper[] changed to pointers
- Revision 1.90 2003/10/19 12:36:36 florian
- * improved speed; reduced memory usage of the interference bitmap
- Revision 1.89 2003/10/19 01:34:30 florian
- * some ppc stuff fixed
- * memory leak fixed
- Revision 1.88 2003/10/18 15:41:26 peter
- * made worklists dynamic in size
- Revision 1.87 2003/10/17 16:16:08 peter
- * fixed last commit
- Revision 1.86 2003/10/17 15:25:18 florian
- * fixed more ppc stuff
- Revision 1.85 2003/10/17 14:38:32 peter
- * 64k registers supported
- * fixed some memory leaks
- Revision 1.84 2003/10/11 16:06:42 florian
- * fixed some MMX<->SSE
- * started to fix ppc, needs an overhaul
- + stabs info improve for spilling, not sure if it works correctly/completly
- - MMX_SUPPORT removed from Makefile.fpc
- Revision 1.83 2003/10/10 17:48:14 peter
- * old trgobj moved to x86/rgcpu and renamed to trgx86fpu
- * tregisteralloctor renamed to trgobj
- * removed rgobj from a lot of units
- * moved location_* and reference_* to cgobj
- * first things for mmx register allocation
- Revision 1.82 2003/10/09 21:31:37 daniel
- * Register allocator splitted, ans abstract now
- Revision 1.81 2003/10/01 20:34:49 peter
- * procinfo unit contains tprocinfo
- * cginfo renamed to cgbase
- * moved cgmessage to verbose
- * fixed ppc and sparc compiles
- Revision 1.80 2003/09/30 19:54:42 peter
- * reuse registers with the least conflicts
- Revision 1.79 2003/09/29 20:58:56 peter
- * optimized releasing of registers
- Revision 1.78 2003/09/28 13:41:12 peter
- * return reg 255 when allowdupreg is defined
- Revision 1.77 2003/09/25 16:19:32 peter
- * fix filepositions
- * insert spill temp allocations at the start of the proc
- Revision 1.76 2003/09/16 16:17:01 peter
- * varspez in calls to push_addr_param
- Revision 1.75 2003/09/12 19:07:42 daniel
- * Fixed fast spilling functionality by re-adding the code that initializes
- precoloured nodes to degree 255. I would like to play hangman on the one
- who removed that code.
- Revision 1.74 2003/09/11 11:54:59 florian
- * improved arm code generation
- * move some protected and private field around
- * the temp. register for register parameters/arguments are now released
- before the move to the parameter register is done. This improves
- the code in a lot of cases.
- Revision 1.73 2003/09/09 20:59:27 daniel
- * Adding register allocation order
- Revision 1.72 2003/09/09 15:55:44 peter
- * use register with least interferences in spillregister
- Revision 1.71 2003/09/07 22:09:35 peter
- * preparations for different default calling conventions
- * various RA fixes
- Revision 1.70 2003/09/03 21:06:45 peter
- * fixes for FPU register allocation
- Revision 1.69 2003/09/03 15:55:01 peter
- * NEWRA branch merged
- Revision 1.68 2003/09/03 11:18:37 florian
- * fixed arm concatcopy
- + arm support in the common compiler sources added
- * moved some generic cg code around
- + tfputype added
- * ...
- Revision 1.67.2.5 2003/08/31 20:44:07 peter
- * fixed getexplicitregisterint tregister value
- Revision 1.67.2.4 2003/08/31 20:40:50 daniel
- * Fixed add_edges_used
- Revision 1.67.2.3 2003/08/29 17:28:59 peter
- * next batch of updates
- Revision 1.67.2.2 2003/08/28 18:35:08 peter
- * tregister changed to cardinal
- Revision 1.67.2.1 2003/08/27 19:55:54 peter
- * first tregister patch
- Revision 1.67 2003/08/23 10:46:21 daniel
- * Register allocator bugfix for h2pas
- Revision 1.66 2003/08/17 16:59:20 jonas
- * fixed regvars so they work with newra (at least for ppc)
- * fixed some volatile register bugs
- + -dnotranslation option for -dnewra, which causes the registers not to
- be translated from virtual to normal registers. Requires support in
- the assembler writer as well, which is only implemented in aggas/
- agppcgas currently
- Revision 1.65 2003/08/17 14:32:48 daniel
- * Precoloured nodes now have an infinite degree approached with 255,
- like they should.
- Revision 1.64 2003/08/17 08:48:02 daniel
- * Another register allocator bug fixed.
- * usable_registers_cnt set to 6 for i386
- Revision 1.63 2003/08/09 18:56:54 daniel
- * cs_regalloc renamed to cs_regvars to avoid confusion with register
- allocator
- * Some preventive changes to i386 spillinh code
- Revision 1.62 2003/08/03 14:09:50 daniel
- * Fixed a register allocator bug
- * Figured out why -dnewra generates superfluous "mov reg1,reg2"
- statements: changes in location_force. These moves are now no longer
- constrained so they are optimized away.
- Revision 1.61 2003/07/21 13:32:39 jonas
- * add_edges_used() is now also called for registers allocated with
- getexplicitregisterint()
- * writing the intereference graph is now only done with -dradebug2 and
- the created files are now called "igraph.<module_name>"
- Revision 1.60 2003/07/06 15:31:21 daniel
- * Fixed register allocator. *Lots* of fixes.
- Revision 1.59 2003/07/06 15:00:47 jonas
- * fixed my previous completely broken commit. It's not perfect though,
- registers > last_int_supreg and < max_intreg may still be "translated"
- Revision 1.58 2003/07/06 14:45:05 jonas
- * support integer registers that are not managed by newra (ie. don't
- translate register numbers that fall outside the range
- first_int_supreg..last_int_supreg)
- Revision 1.57 2003/07/02 22:18:04 peter
- * paraloc splitted in callerparaloc,calleeparaloc
- * sparc calling convention updates
- Revision 1.56 2003/06/17 16:34:44 jonas
- * lots of newra fixes (need getfuncretparaloc implementation for i386)!
- * renamed all_intregisters to volatile_intregisters and made it
- processor dependent
- Revision 1.55 2003/06/14 14:53:50 jonas
- * fixed newra cycle for x86
- * added constants for indicating source and destination operands of the
- "move reg,reg" instruction to aasmcpu (and use those in rgobj)
- Revision 1.54 2003/06/13 21:19:31 peter
- * current_procdef removed, use current_procinfo.procdef instead
- Revision 1.53 2003/06/12 21:11:10 peter
- * ungetregisterfpu gets size parameter
- Revision 1.52 2003/06/12 16:43:07 peter
- * newra compiles for sparc
- Revision 1.51 2003/06/09 14:54:26 jonas
- * (de)allocation of registers for parameters is now performed properly
- (and checked on the ppc)
- - removed obsolete allocation of all parameter registers at the start
- of a procedure (and deallocation at the end)
- Revision 1.50 2003/06/03 21:11:09 peter
- * cg.a_load_* get a from and to size specifier
- * makeregsize only accepts newregister
- * i386 uses generic tcgnotnode,tcgunaryminus
- Revision 1.49 2003/06/03 13:01:59 daniel
- * Register allocator finished
- Revision 1.48 2003/06/01 21:38:06 peter
- * getregisterfpu size parameter added
- * op_const_reg size parameter added
- * sparc updates
- Revision 1.47 2003/05/31 20:31:11 jonas
- * set inital costs of assigning a variable to a register to 120 for
- non-i386, because the used register must be store to memory at the
- start and loaded again at the end
- Revision 1.46 2003/05/30 18:55:21 jonas
- * fixed several regvar related bugs for non-i386. make cycle with -Or now
- works for ppc
- Revision 1.45 2003/05/30 12:36:13 jonas
- * use as little different registers on the ppc until newra is released,
- since every used register must be saved
- Revision 1.44 2003/05/17 13:30:08 jonas
- * changed tt_persistant to tt_persistent :)
- * tempcreatenode now doesn't accept a boolean anymore for persistent
- temps, but a ttemptype, so you can also create ansistring temps etc
- Revision 1.43 2003/05/16 14:33:31 peter
- * regvar fixes
- Revision 1.42 2003/04/26 20:03:49 daniel
- * Bug fix in simplify
- Revision 1.41 2003/04/25 20:59:35 peter
- * removed funcretn,funcretsym, function result is now in varsym
- and aliases for result and function name are added using absolutesym
- * vs_hidden parameter for funcret passed in parameter
- * vs_hidden fixes
- * writenode changed to printnode and released from extdebug
- * -vp option added to generate a tree.log with the nodetree
- * nicer printnode for statements, callnode
- Revision 1.40 2003/04/25 08:25:26 daniel
- * Ifdefs around a lot of calls to cleartempgen
- * Fixed registers that are allocated but not freed in several nodes
- * Tweak to register allocator to cause less spills
- * 8-bit registers now interfere with esi,edi and ebp
- Compiler can now compile rtl successfully when using new register
- allocator
- Revision 1.39 2003/04/23 20:23:06 peter
- * compile fix for no-newra
- Revision 1.38 2003/04/23 14:42:07 daniel
- * Further register allocator work. Compiler now smaller with new
- allocator than without.
- * Somebody forgot to adjust ppu version number
- Revision 1.37 2003/04/22 23:50:23 peter
- * firstpass uses expectloc
- * checks if there are differences between the expectloc and
- location.loc from secondpass in EXTDEBUG
- Revision 1.36 2003/04/22 10:09:35 daniel
- + Implemented the actual register allocator
- + Scratch registers unavailable when new register allocator used
- + maybe_save/maybe_restore unavailable when new register allocator used
- Revision 1.35 2003/04/21 19:16:49 peter
- * count address regs separate
- Revision 1.34 2003/04/17 16:48:21 daniel
- * Added some code to keep track of move instructions in register
- allocator
- Revision 1.33 2003/04/17 07:50:24 daniel
- * Some work on interference graph construction
- Revision 1.32 2003/03/28 19:16:57 peter
- * generic constructor working for i386
- * remove fixed self register
- * esi added as address register for i386
- Revision 1.31 2003/03/11 21:46:24 jonas
- * lots of new regallocator fixes, both in generic and ppc-specific code
- (ppc compiler still can't compile the linux system unit though)
- Revision 1.30 2003/03/09 21:18:59 olle
- + added cutils to the uses clause
- Revision 1.29 2003/03/08 20:36:41 daniel
- + Added newra version of Ti386shlshrnode
- + Added interference graph construction code
- Revision 1.28 2003/03/08 13:59:16 daniel
- * Work to handle new register notation in ag386nsm
- + Added newra version of Ti386moddivnode
- Revision 1.27 2003/03/08 10:53:48 daniel
- * Created newra version of secondmul in n386add.pas
- Revision 1.26 2003/03/08 08:59:07 daniel
- + $define newra will enable new register allocator
- + getregisterint will return imaginary registers with $newra
- + -sr switch added, will skip register allocation so you can see
- the direct output of the code generator before register allocation
- Revision 1.25 2003/02/26 20:50:45 daniel
- * Fixed ungetreference
- Revision 1.24 2003/02/19 22:39:56 daniel
- * Fixed a few issues
- Revision 1.23 2003/02/19 22:00:14 daniel
- * Code generator converted to new register notation
- - Horribily outdated todo.txt removed
- Revision 1.22 2003/02/02 19:25:54 carl
- * Several bugfixes for m68k target (register alloc., opcode emission)
- + VIS target
- + Generic add more complete (still not verified)
- Revision 1.21 2003/01/08 18:43:57 daniel
- * Tregister changed into a record
- Revision 1.20 2002/10/05 12:43:28 carl
- * fixes for Delphi 6 compilation
- (warning : Some features do not work under Delphi)
- Revision 1.19 2002/08/23 16:14:49 peter
- * tempgen cleanup
- * tt_noreuse temp type added that will be used in genentrycode
- Revision 1.18 2002/08/17 22:09:47 florian
- * result type handling in tcgcal.pass_2 overhauled
- * better tnode.dowrite
- * some ppc stuff fixed
- Revision 1.17 2002/08/17 09:23:42 florian
- * first part of procinfo rewrite
- Revision 1.16 2002/08/06 20:55:23 florian
- * first part of ppc calling conventions fix
- Revision 1.15 2002/08/05 18:27:48 carl
- + more more more documentation
- + first version include/exclude (can't test though, not enough scratch for i386 :()...
- Revision 1.14 2002/08/04 19:06:41 carl
- + added generic exception support (still does not work!)
- + more documentation
- Revision 1.13 2002/07/07 09:52:32 florian
- * powerpc target fixed, very simple units can be compiled
- * some basic stuff for better callparanode handling, far from being finished
- Revision 1.12 2002/07/01 18:46:26 peter
- * internal linker
- * reorganized aasm layer
- Revision 1.11 2002/05/18 13:34:17 peter
- * readded missing revisions
- Revision 1.10 2002/05/16 19:46:44 carl
- + defines.inc -> fpcdefs.inc to avoid conflicts if compiling by hand
- + try to fix temp allocation (still in ifdef)
- + generic constructor calls
- + start of tassembler / tmodulebase class cleanup
- Revision 1.8 2002/04/21 15:23:03 carl
- + makeregsize
- + changeregsize is now a local routine
- Revision 1.7 2002/04/20 21:32:25 carl
- + generic FPC_CHECKPOINTER
- + first parameter offset in stack now portable
- * rename some constants
- + move some cpu stuff to other units
- - remove unused constents
- * fix stacksize for some targets
- * fix generic size problems which depend now on EXTEND_SIZE constant
- Revision 1.6 2002/04/15 19:03:31 carl
- + reg2str -> std_reg2str()
- Revision 1.5 2002/04/06 18:13:01 jonas
- * several powerpc-related additions and fixes
- Revision 1.4 2002/04/04 19:06:04 peter
- * removed unused units
- * use tlocation.size in cg.a_*loc*() routines
- Revision 1.3 2002/04/02 17:11:29 peter
- * tlocation,treference update
- * LOC_CONSTANT added for better constant handling
- * secondadd splitted in multiple routines
- * location_force_reg added for loading a location to a register
- of a specified size
- * secondassignment parses now first the right and then the left node
- (this is compatible with Kylix). This saves a lot of push/pop especially
- with string operations
- * adapted some routines to use the new cg methods
- Revision 1.2 2002/04/01 19:24:25 jonas
- * fixed different parameter name in interface and implementation
- declaration of a method (only 1.0.x detected this)
- Revision 1.1 2002/03/31 20:26:36 jonas
- + a_loadfpu_* and a_loadmm_* methods in tcg
- * register allocation is now handled by a class and is mostly processor
- independent (+rgobj.pas and i386/rgcpu.pas)
- * temp allocation is now handled by a class (+tgobj.pas, -i386\tgcpu.pas)
- * some small improvements and fixes to the optimizer
- * some register allocation fixes
- * some fpuvaroffset fixes in the unary minus node
- * push/popusedregisters is now called rg.save/restoreusedregisters and
- (for i386) uses temps instead of push/pop's when using -Op3 (that code is
- also better optimizable)
- * fixed and optimized register saving/restoring for new/dispose nodes
- * LOC_FPU locations now also require their "register" field to be set to
- R_ST, not R_ST0 (the latter is used for LOC_CFPUREGISTER locations only)
- - list field removed of the tnode class because it's not used currently
- and can cause hard-to-find bugs
- }
|