| 12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043 | {    Copyright (c) 1998-2002 by Florian Klaempfl    Generate x86 assembler for in/case nodes    This program is free software; you can redistribute it and/or modify    it under the terms of the GNU General Public License as published by    the Free Software Foundation; either version 2 of the License, or    (at your option) any later version.    This program is distributed in the hope that it will be useful,    but WITHOUT ANY WARRANTY; without even the implied warranty of    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the    GNU General Public License for more details.    You should have received a copy of the GNU General Public License    along with this program; if not, write to the Free Software    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. ****************************************************************************}unit nx86set;{$i fpcdefs.inc}interface    uses      globtype,constexp,      node,nset,pass_1,ncgset;    type       tx86innode = class(tinnode)         procedure pass_generate_code;override;         function pass_1 : tnode;override;       end;      tx86casenode = class(tcgcasenode)         function  has_jumptable : boolean;override;         procedure genjumptable(hp : pcaselabel;min_,max_ : int64);override;         procedure genlinearlist(hp : pcaselabel);override;         procedure genjmptreeentry(p : pcaselabel;parentvalue : TConstExprInt);override;      end;implementation    uses      systems,      verbose,globals,      symconst,symdef,defutil,cutils,      aasmbase,aasmtai,aasmdata,aasmcpu,      cgbase,pass_2,tgobj,      ncon,      cpubase,      cga,cgobj,hlcgobj,cgutils,ncgutil,      cgx86,      procinfo;{*****************************************************************************                                  TX86CASENODE*****************************************************************************}    function tx86casenode.has_jumptable : boolean;      begin        has_jumptable:=true;      end;    procedure tx86casenode.genjumptable(hp : pcaselabel;min_,max_ : int64);      var        table : tasmlabel;        last : TConstExprInt;        indexreg : tregister;        href : treference;        jtlist: tasmlist;        opcgsize: tcgsize;        jumpreg: tregister;        labeltyp: taiconst_type;        AlmostExhaustive: Boolean;        lv, hv: TConstExprInt;        ExhaustiveLimit, Range, x, oldmin : int64;      const        ExhaustiveLimitBase = 32;        procedure genitem(list:TAsmList;t : pcaselabel);          var            i : TConstExprInt;          begin            if assigned(t^.less) then              genitem(list,t^.less);            { fill possible hole }            i:=last+1;            while i<=t^._low-1 do              begin                list.concat(Tai_const.Create_type_sym(labeltyp,elselabel));                i:=i+1;              end;            i:=t^._low;            while i<=t^._high do              begin                list.concat(Tai_const.Create_type_sym(labeltyp,blocklabel(t^.blockid)));                i:=i+1;              end;            last:=t^._high;            if assigned(t^.greater) then              genitem(list,t^.greater);          end;      begin        lv:=0;        hv:=0;        oldmin:=0;        last:=min_;        { This generates near pointers on i8086 }        labeltyp:=aitconst_ptr;        opcgsize:=def_cgsize(opsize);        AlmostExhaustive := False;        if not(jumptable_no_range) then          begin            getrange(left.resultdef,lv,hv);            Range := aint(max_)-aint(min_);            if (cs_opt_size in current_settings.optimizerswitches) then              { Limit size of jump tables for small enumerations so they have                to be at least two-thirds full before being considered for the                "almost exhaustive" treatment }              ExhaustiveLimit := min(ExhaustiveLimitBase, labelcoverage shl 1)            else              ExhaustiveLimit := ExhaustiveLimitBase;            { If true, then this indicates that almost every possible value of x is covered by              a label.  As such, it's more cost-efficient to remove the initial range check and              instead insert the remaining values into the jump table, pointing at elselabel. [Kit] }            if ((hv - lv) - Range <= ExhaustiveLimit) then              begin                oldmin := min_;                min_ := lv.svalue;                AlmostExhaustive := True;              end            else              begin                { a <= x <= b <-> unsigned(x-a) <= (b-a) }                cg.a_op_const_reg(current_asmdata.CurrAsmList,OP_SUB,opcgsize,aint(min_),hregister);                { case expr greater than max_ => goto elselabel }                cg.a_cmp_const_reg_label(current_asmdata.CurrAsmList,opcgsize,OC_A,aint(max_)-aint(min_),hregister,elselabel);                min_:=0;                { do not sign extend when we load the index register, as we applied an offset above }                opcgsize:=tcgsize2unsigned[opcgsize];              end;          end;        current_asmdata.getdatalabel(table);        { make it a 32bit register }        indexreg:=cg.makeregsize(current_asmdata.CurrAsmList,hregister,OS_INT);        cg.a_load_reg_reg(current_asmdata.CurrAsmList,opcgsize,OS_INT,hregister,indexreg);        { create reference }        reference_reset_symbol(href,table,0,sizeof(pint),[]);        href.offset:=(-aint(min_))*sizeof(aint);        href.index:=indexreg;{$ifdef i8086}        cg.a_op_const_reg(current_asmdata.CurrAsmList,OP_SHL,OS_INT,1,indexreg);{$else i8086}        href.scalefactor:=sizeof(aint);{$endif i8086}        if (not (target_info.system in [system_i386_darwin,system_i386_iphonesim])) and           (cs_create_pic in current_settings.moduleswitches) then          begin            labeltyp:=aitconst_gotoff_symbol;            jumpreg:=cg.getintregister(current_asmdata.CurrAsmList,OS_ADDR);            cg.a_load_ref_reg(current_asmdata.CurrAsmList,OS_ADDR,OS_ADDR,href,jumpreg);            cg.a_op_reg_reg(current_asmdata.CurrAsmList,OP_ADD,OS_ADDR,current_procinfo.got,jumpreg);            emit_reg(A_JMP,S_NO,jumpreg);            include(current_procinfo.flags,pi_needs_got);          end        else          emit_ref(A_JMP,S_NO,href);        { generate jump table }        if (target_info.system in [system_i386_darwin,system_i386_iphonesim]) then          jtlist:=current_asmdata.asmlists[al_const]        else          jtlist:=current_procinfo.aktlocaldata;        new_section(jtlist,sec_rodata,current_procinfo.procdef.mangledname,sizeof(aint));        jtlist.concat(Tai_label.Create(table));        if AlmostExhaustive then          begin            { Fill the table with the values below _min }            x := lv.svalue;            while x < oldmin do              begin                jtlist.concat(Tai_const.Create_type_sym(labeltyp, elselabel));                Inc(x);              end;            genitem(jtlist,hp);            { Fill the table with the values above _max }            { Subtracting one from hv and not adding 1 to max averts the risk of an overflow }            x := max_;            hv := hv - 1;            while x <= hv.svalue do              begin                jtlist.concat(Tai_const.Create_type_sym(labeltyp, elselabel));                Inc(x);              end;          end        else          genitem(jtlist,hp)      end;    procedure tx86casenode.genlinearlist(hp : pcaselabel);      var        first : boolean;        lastrange : boolean;        last : TConstExprInt;        cond_lt,cond_le : tresflags;        opcgsize: tcgsize;        procedure genitem(t : pcaselabel);          var             range, gap: aint;          begin             if assigned(t^.less) then               genitem(t^.less);             { need we to test the first value }             if first and (t^._low>get_min_value(left.resultdef)) then               begin                 cg.a_cmp_const_reg_label(current_asmdata.CurrAsmList,opcgsize,jmp_lt,aint(t^._low.svalue),hregister,elselabel);               end;             if t^._low=t^._high then               begin                  if t^._low-last=0 then                    cg.a_cmp_const_reg_label(current_asmdata.CurrAsmList, opcgsize, OC_EQ,0,hregister,blocklabel(t^.blockid))                  else                    begin                      cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                      cg.a_op_const_reg(current_asmdata.CurrAsmList, OP_SUB, opcgsize, aint(t^._low.svalue-last.svalue), hregister);                      cg.a_jmp_flags(current_asmdata.CurrAsmList,F_E,blocklabel(t^.blockid));                      cg.a_reg_dealloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                    end;                  last:=t^._low;                  lastrange:=false;               end             else               begin                  range := aint(t^._high.svalue - t^._low.svalue);                  { it begins with the smallest label, if the value }                  { is even smaller then jump immediately to the    }                  { ELSE-label                                }                  cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                  if first then                    begin                       { have we to ajust the first value ? }                       if (t^._low>get_min_value(left.resultdef)) or (get_min_value(left.resultdef)<>0) then                         cg.a_op_const_reg(current_asmdata.CurrAsmList, OP_SUB, opcgsize, aint(t^._low.svalue), hregister);                    end                  else                    begin                      gap := aint(t^._low.svalue - last.svalue);                      { if there is no unused label between the last and the }                      { present label then the lower limit can be checked    }                      { immediately. else check the range in between:       }                      { we need to use A_SUB, if cond_lt uses the carry flags                        because A_DEC does not set the correct flags, therefor                        using a_op_const_reg(OP_SUB) is not possible }                      if (gap = 1) and (cond_lt in [F_C,F_NC,F_A,F_AE,F_B,F_BE]) then                        emit_const_reg(A_SUB, TCGSize2OpSize[opcgsize], gap, hregister)                      else                        cg.a_op_const_reg(current_asmdata.CurrAsmList, OP_SUB, opcgsize, gap, hregister);                      { no jump necessary here if the new range starts at                        at the value following the previous one           }                      if (gap <> 1) or                         (not lastrange) then                        cg.a_jmp_flags(current_asmdata.CurrAsmList,cond_lt,elselabel);                    end;                  { we need to use A_SUB, if cond_le uses the carry flags                    because A_DEC does not set the correct flags, therefor                    using a_op_const_reg(OP_SUB) is not possible }                  if (cond_le in [F_C,F_NC,F_A,F_AE,F_B,F_BE]) and (range = 1) then                    emit_const_reg(A_SUB,TCGSize2OpSize[opcgsize], range, hregister)                  else                    cg.a_op_const_reg(current_asmdata.CurrAsmList, OP_SUB, opcgsize, range, hregister);                  cg.a_jmp_flags(current_asmdata.CurrAsmList,cond_le,blocklabel(t^.blockid));                  cg.a_reg_dealloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                  last:=t^._high;                  lastrange:=true;               end;             first:=false;             if assigned(t^.greater) then               genitem(t^.greater);          end;        begin           opcgsize:=def_cgsize(opsize);           if with_sign then             begin                cond_lt:=F_L;                cond_le:=F_LE;             end           else              begin                cond_lt:=F_B;                cond_le:=F_BE;             end;           { do we need to generate cmps? }{$ifdef i8086}           if (with_sign and (min_label<0)) or (opcgsize in [OS_32, OS_S32]) then{$else i8086}           if (with_sign and (min_label<0)) then{$endif i8086}             genlinearcmplist(hp)           else             begin                if (labelcnt>1) or not(cs_opt_level1 in current_settings.optimizerswitches) then                  begin                    last:=0;                    lastrange:=false;                    first:=true;                    genitem(hp);                  end                else                  begin                    { If only one label exists, we can greatly simplify the checks to a simple comparison }                    if hp^._low=hp^._high then                      cg.a_cmp_const_reg_label(current_asmdata.CurrAsmList, opcgsize, OC_EQ, tcgint(hp^._low.svalue), hregister, blocklabel(hp^.blockid))                    else                      begin                        cg.a_op_const_reg(current_asmdata.CurrAsmList, OP_SUB, opcgsize, tcgint(hp^._low.svalue), hregister);                        cg.a_cmp_const_reg_label(current_asmdata.CurrAsmList, opcgsize, OC_BE, tcgint(hp^._high.svalue - hp^._low.svalue), hregister,blocklabel(hp^.blockid));                      end;                  end;                cg.a_jmp_always(current_asmdata.CurrAsmList,elselabel);             end;        end;      procedure tx86casenode.genjmptreeentry(p : pcaselabel;parentvalue : TConstExprInt);        var          lesslabel,greaterlabel : tasmlabel;          cond_gt: TResFlags;          cmplow : Boolean;        begin           if with_sign then             cond_gt:=F_G           else             cond_gt:=F_A;          current_asmdata.CurrAsmList.concat(cai_align.Create(current_settings.alignment.jumpalign));          cg.a_label(current_asmdata.CurrAsmList,p^.labellabel);          { calculate labels for left and right }          if p^.less=nil then            lesslabel:=elselabel          else            lesslabel:=p^.less^.labellabel;          if p^.greater=nil then            greaterlabel:=elselabel          else            greaterlabel:=p^.greater^.labellabel;          { calculate labels for left and right }          { no range label: }          if p^._low=p^._high then            begin              if greaterlabel=lesslabel then                hlcg.a_cmp_const_reg_label(current_asmdata.CurrAsmList,opsize,OC_NE,p^._low,hregister,lesslabel)              else                begin                  cmplow:=p^._low-1<>parentvalue;                  if cmplow then                    hlcg.a_cmp_const_reg_label(current_asmdata.CurrAsmList,opsize,jmp_lt,p^._low,hregister,lesslabel);                  if p^._high+1<>parentvalue then                    begin                      if cmplow then                        hlcg.a_jmp_flags(current_asmdata.CurrAsmList,cond_gt,greaterlabel)                      else                        hlcg.a_cmp_const_reg_label(current_asmdata.CurrAsmList,opsize,jmp_gt,p^._low,hregister,greaterlabel);                    end;                end;              hlcg.a_jmp_always(current_asmdata.CurrAsmList,blocklabel(p^.blockid));            end          else            begin              if p^._low-1<>parentvalue then                hlcg.a_cmp_const_reg_label(current_asmdata.CurrAsmList,opsize,jmp_lt,p^._low,hregister,lesslabel);              if p^._high+1<>parentvalue then                hlcg.a_cmp_const_reg_label(current_asmdata.CurrAsmList,opsize,jmp_gt,p^._high,hregister,greaterlabel);              hlcg.a_jmp_always(current_asmdata.CurrAsmList,blocklabel(p^.blockid));            end;           if assigned(p^.less) then             genjmptreeentry(p^.less,p^._low);           if assigned(p^.greater) then             genjmptreeentry(p^.greater,p^._high);        end;{*****************************************************************************                              TX86INNODE*****************************************************************************}    function tx86innode.pass_1 : tnode;      begin         result:=nil;         { this is the only difference from the generic version }         expectloc:=LOC_FLAGS;         firstpass(right);         firstpass(left);         if codegenerror then           exit;      end;    procedure tx86innode.pass_generate_code;       type         Tsetpart=record           range : boolean;      {Part is a range.}           start,stop : byte;    {Start/stop when range; Stop=element when an element.}         end;       var         hreg,{$ifndef i8086} hreg2, {$endif}         pleftreg   : tregister;         opsize     : tcgsize;         opdef      : torddef;         orgopsize  : tcgsize;         setparts   : array[1..8] of Tsetpart;         setbase    : aint;         adjustment : longint;         l,l2       : tasmlabel;         i,numparts : byte;         genjumps,         use_small,         ranges     : boolean;{$ifdef CORRECT_SET_IN_FPC}         AM         : tasmop;{$endif CORRECT_SET_IN_FPC}{$ifdef i8086}         extra_offset_reg: TRegister;{$endif i8086}         function analizeset(Aset:pconstset;is_small:boolean):boolean;           var             compares,maxcompares:word;             i:byte;           begin             if tnormalset(Aset^)=[] then                {The expression...                    if expr in []                 ...is allways false. It should be optimized away in the                 resultdef pass, and thus never occur here. Since we                 do generate wrong code for it, do internalerror.}                internalerror(2002072301);             analizeset:=false;             ranges:=false;             numparts:=0;             compares:=0;             { Lots of comparisions take a lot of time, so do not allow               too much comparisions. 8 comparisions are, however, still               smalller than emitting the set }             if cs_opt_size in current_settings.optimizerswitches then               maxcompares:=8             else               maxcompares:=5;             { when smallset is possible allow only 3 compares the smallset               code is for littlesize also smaller when more compares are used }             if is_small then               maxcompares:=3;             for i:=0 to 255 do              if i in tnormalset(Aset^) then               begin                 if (numparts=0) or (i<>setparts[numparts].stop+1) then                  begin                  {Set element is a separate element.}                    inc(compares);                    if compares>maxcompares then                         exit;                    inc(numparts);                    setparts[numparts].range:=false;                    setparts[numparts].stop:=i;                  end                 else                  {Set element is part of a range.}                  if not setparts[numparts].range then                   begin                     {Transform an element into a range.}                     setparts[numparts].range:=true;                     setparts[numparts].start:=setparts[numparts].stop;                     setparts[numparts].stop:=i;                     ranges := true;                   end                  else                   begin                    {Extend a range.}                    setparts[numparts].stop:=i;                   end;              end;             analizeset:=true;           end;{$ifdef i8086}         procedure add_extra_offset(offset_reg:TRegister;var ref:treference);           var             reg: TRegister;           begin             if ref.index=NR_NO then               ref.index:=offset_reg             else if ref.base=NR_NO then               ref.base:=offset_reg             else               begin                 reg:=cg.getaddressregister(current_asmdata.CurrAsmList);                 cg.a_load_reg_reg(current_asmdata.CurrAsmList,OS_ADDR,OS_ADDR,ref.index,reg);                 cg.a_op_reg_reg(current_asmdata.CurrAsmList,OP_ADD,OS_ADDR,offset_reg,reg);                 ref.index:=reg;               end;           end;{$endif i8086}       begin         ranges:=false;         numparts:=0;         fillchar(setparts,sizeof(setparts),0);         { We check first if we can generate jumps, this can be done           because the resultdef is already set in firstpass }         { check if we can use smallset operation using btl which is limited           to 32 bits, the left side may also not contain higher values or be signed !! }         use_small:=is_smallset(right.resultdef) and                    not is_signed(left.resultdef) and                    ((left.resultdef.typ=orddef) and (torddef(left.resultdef).high.svalue<{$ifdef i8086}16{$else}32{$endif}) or                     (left.resultdef.typ=enumdef) and (tenumdef(left.resultdef).max<{$ifdef i8086}16{$else}32{$endif}));         { Can we generate jumps? Possible for all types of sets }         genjumps:=(right.nodetype=setconstn) and                   analizeset(tsetconstnode(right).value_set,use_small);         { calculate both operators }         { the complex one first }         { not in case of genjumps, because then we don't secondpass    }         { right at all (so we have to make sure that "right" really is }         { "right" and not "swapped left" in that case)                 }         if not(genjumps) then           firstcomplex(self);         secondpass(left);         { Only process the right if we are not generating jumps }         if not genjumps then          begin            secondpass(right);          end;         if codegenerror then          exit;         { ofcourse not commutative }         if nf_swapped in flags then          swapleftright;         orgopsize := def_cgsize(left.resultdef);{$ifdef i8086}         opsize := OS_16;{$else i8086}         opsize := OS_32;{$endif i8086}         if is_signed(left.resultdef) then           opsize := tcgsize(ord(opsize)+(ord(OS_S8)-ord(OS_8)));         opdef:=cgsize_orddef(opsize);         if not(left.location.loc in [LOC_REGISTER,LOC_CREGISTER,LOC_REFERENCE,LOC_CREFERENCE,LOC_CONSTANT]) then           hlcg.location_force_reg(current_asmdata.CurrAsmList,left.location,left.resultdef,opdef,true);         if (right.location.loc in [LOC_SUBSETREG,LOC_CSUBSETREG]) then           hlcg.location_force_reg(current_asmdata.CurrAsmList,right.location,left.resultdef,opdef,true);         if genjumps then          begin            { It gives us advantage to check for the set elements              separately instead of using the SET_IN_BYTE procedure.              To do: Build in support for LOC_JUMP }            { load and zero or sign extend as necessary }            hlcg.location_force_reg(current_asmdata.CurrAsmList,left.location,left.resultdef,opdef,false);            pleftreg:=left.location.register;            { Get a label to jump to the end }            location_reset(location,LOC_FLAGS,OS_NO);            { It's better to use the zero flag when there are              no ranges }            if ranges then              location.resflags:=F_C            else              location.resflags:=F_E;            current_asmdata.getjumplabel(l);            { how much have we already substracted from the x in the }            { "x in [y..z]" expression                               }            adjustment := 0;            cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);            for i:=1 to numparts do             if setparts[i].range then              { use fact that a <= x <= b <=> cardinal(x-a) <= cardinal(b-a) }              begin                { is the range different from all legal values? }                if (setparts[i].stop-setparts[i].start <> 255) or not (orgopsize = OS_8) then                  begin                    { yes, is the lower bound <> 0? }                    if (setparts[i].start <> 0) then                      begin                        hlcg.location_force_reg(current_asmdata.CurrAsmList,left.location,left.resultdef,opdef,false);                        hreg:=left.location.register;                        pleftreg:=hreg;                        cg.a_op_const_reg(current_asmdata.CurrAsmList,OP_SUB,opsize,setparts[i].start-adjustment,pleftreg);                      end;                    { new total value substracted from x:           }                    { adjustment + (setparts[i].start - adjustment) }                    adjustment := setparts[i].start;                    { check if result < b-a+1 (not "result <= b-a", since }                    { we need a carry in case the element is in the range }                    { (this will never overflow since we check at the     }                    { beginning whether stop-start <> 255)                }                    cg.a_cmp_const_reg_label(current_asmdata.CurrAsmList,opsize,OC_B,setparts[i].stop-setparts[i].start+1,pleftreg,l);                    cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                  end                else                  { if setparts[i].start = 0 and setparts[i].stop = 255,  }                  { it's always true since "in" is only allowed for bytes }                  begin                    current_asmdata.CurrAsmList.concat(taicpu.op_none(A_STC,S_NO));                    cg.a_jmp_always(current_asmdata.CurrAsmList,l);                  end;              end             else              begin                { Emit code to check if left is an element }                current_asmdata.CurrAsmList.concat(taicpu.op_const_reg(A_CMP,TCGSize2OpSize[opsize],setparts[i].stop-adjustment,                  pleftreg));                { Result should be in carry flag when ranges are used }                if ranges then                  current_asmdata.CurrAsmList.concat(taicpu.op_none(A_STC,S_NO));                { If found, jump to end }                cg.a_jmp_flags(current_asmdata.CurrAsmList,F_E,l);              end;             if ranges and                { if the last one was a range, the carry flag is already }                { set appropriately                                      }                not(setparts[numparts].range) then                  current_asmdata.CurrAsmList.concat(taicpu.op_none(A_CLC,S_NO));             { To compensate for not doing a second pass }             right.location.reference.symbol:=nil;             { Now place the end label }             cg.a_label(current_asmdata.CurrAsmList,l);          end         else          begin            location_reset(location,LOC_FLAGS,OS_NO);            setbase:=tsetdef(right.resultdef).setbase;            { We will now generated code to check the set itself, no jmps,              handle smallsets separate, because it allows faster checks }            if use_small then             begin               if left.location.loc=LOC_CONSTANT then                begin                  cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                  location.resflags:=F_NE;                  case right.location.loc of                    LOC_REGISTER,                    LOC_CREGISTER:                      begin                         emit_const_reg(A_TEST,TCGSize2OpSize[right.location.size],                           1 shl ((left.location.value-setbase) and 31),right.location.register);                      end;                    LOC_REFERENCE,                    LOC_CREFERENCE :                      begin                        emit_const_ref(A_TEST,TCGSize2OpSize[right.location.size],1 shl ((left.location.value-setbase) and 31),                           right.location.reference);                      end;                    else                      internalerror(200203312);                  end;                end               else                begin{$ifdef i8086}                  register_maybe_adjust_setbase(current_asmdata.CurrAsmList,left.resultdef,left.location,setbase);                  cg.getcpuregister(current_asmdata.CurrAsmList,NR_CX);                  if TCGSize2Size[left.location.size] > 2 then                    left.location.size := OS_16;                  cg.a_load_loc_reg(current_asmdata.CurrAsmList,OS_16,left.location,NR_CX);                  if (tcgsize2size[right.location.size] < 2) or                     (right.location.loc = LOC_CONSTANT) then                    hlcg.location_force_reg(current_asmdata.CurrAsmList,right.location,right.resultdef,u16inttype,true);                  hreg:=cg.getintregister(current_asmdata.CurrAsmList,OS_16);                  emit_const_reg(A_MOV,S_W,1,hreg);                  emit_reg_reg(A_SHL,S_W,NR_CL,hreg);                  cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                  case right.location.loc of                    LOC_REGISTER,                    LOC_CREGISTER :                      begin                        emit_reg_reg(A_TEST,S_W,hreg,right.location.register);                      end;                     LOC_CREFERENCE,                     LOC_REFERENCE :                       begin                         emit_reg_ref(A_TEST,S_W,hreg,right.location.reference);                       end;                     else                       internalerror(2002032210);                  end;                  cg.ungetcpuregister(current_asmdata.CurrAsmList,NR_CX);                  location.resflags:=F_NE;{$else i8086}                  hlcg.location_force_reg(current_asmdata.CurrAsmList,left.location,left.resultdef,u32inttype,true);                  register_maybe_adjust_setbase(current_asmdata.CurrAsmList,u32inttype,left.location,setbase);                  if (tcgsize2size[right.location.size] < opdef.size) or                    (right.location.loc = LOC_CONSTANT) or                    { bt ...,[mem] is slow, see #40039, so try to use a register if we are not optimizing for size }                    ((right.resultdef.size<=u32inttype.size) and not(cs_opt_size in current_settings.optimizerswitches)) then                    hlcg.location_force_reg(current_asmdata.CurrAsmList,right.location,right.resultdef,u32inttype,true);                  hreg:=left.location.register;                  cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                  case right.location.loc of                    LOC_REGISTER,                    LOC_CREGISTER :                      begin                        emit_reg_reg(A_BT,S_L,hreg,right.location.register);                      end;                     LOC_CREFERENCE,                     LOC_REFERENCE :                       begin                         emit_reg_ref(A_BT,S_L,hreg,right.location.reference);                       end;                     else                       internalerror(2002032210);                  end;                  location.resflags:=F_C;{$endif i8086}                end;             end            else             begin               if right.location.loc=LOC_CONSTANT then                begin{$ifdef i8086}                  location.resflags:=F_NE;                  current_asmdata.getjumplabel(l);                  current_asmdata.getjumplabel(l2);                  { load constants to a register }                  if (left.location.loc=LOC_CONSTANT) or                     (setbase<>0) then                    begin                      hlcg.location_force_reg(current_asmdata.CurrAsmList,left.location,left.resultdef,opdef,true);                      register_maybe_adjust_setbase(current_asmdata.CurrAsmList,opdef,left.location,setbase);                    end;                  cg.getcpuregister(current_asmdata.CurrAsmList,NR_CX);                  if TCGSize2Size[left.location.size] > 2 then                    left.location.size := OS_16;                  cg.a_load_loc_reg(current_asmdata.CurrAsmList,OS_16,left.location,NR_CX);                  cg.a_cmp_const_reg_label(current_asmdata.CurrAsmList,opsize,OC_BE,15,NR_CX,l);                  cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                  { set the zero flag }                  current_asmdata.CurrAsmList.concat(taicpu.op_const_reg(A_TEST,S_B,0,NR_AL));                  cg.a_jmp_always(current_asmdata.CurrAsmList,l2);                  cg.a_reg_dealloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                  hreg:=cg.getintregister(current_asmdata.CurrAsmList,OS_16);                  cg.a_label(current_asmdata.CurrAsmList,l);                  emit_const_reg(A_MOV,S_W,1,hreg);                  emit_reg_reg(A_SHL,S_W,NR_CL,hreg);                  cg.ungetcpuregister(current_asmdata.CurrAsmList,NR_CX);                  cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                  emit_const_reg(A_TEST,S_W,right.location.value,hreg);                  cg.a_label(current_asmdata.CurrAsmList,l2);{$else i8086}                  location.resflags:=F_C;                  current_asmdata.getjumplabel(l);                  current_asmdata.getjumplabel(l2);                  { load constants to a register }                  if (left.location.loc=LOC_CONSTANT) or                     (setbase<>0) then                    begin                      hlcg.location_force_reg(current_asmdata.CurrAsmList,left.location,left.resultdef,opdef,true);                      register_maybe_adjust_setbase(current_asmdata.CurrAsmList,opdef,left.location,setbase);                    end;                  case left.location.loc of                     LOC_REGISTER,                     LOC_CREGISTER:                       begin                          hreg:=cg.makeregsize(current_asmdata.CurrAsmList,left.location.register,opsize);                          cg.a_load_reg_reg(current_asmdata.CurrAsmList,left.location.size,opsize,left.location.register,hreg);                          cg.a_cmp_const_reg_label(current_asmdata.CurrAsmList,opsize,OC_BE,31,hreg,l);                          cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                          { reset carry flag }                          current_asmdata.CurrAsmList.concat(taicpu.op_none(A_CLC,S_NO));                          cg.a_jmp_always(current_asmdata.CurrAsmList,l2);                          cg.a_label(current_asmdata.CurrAsmList,l);                          { We have to load the value into a register because                            btl does not accept values only refs or regs (PFV) }                          hreg2:=cg.getintregister(current_asmdata.CurrAsmList,OS_32);                          cg.a_load_const_reg(current_asmdata.CurrAsmList,OS_32,right.location.value,hreg2);                          emit_reg_reg(A_BT,S_L,hreg,hreg2);                       end;                     else                       begin                          cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                          emit_const_ref(A_CMP,TCGSize2OpSize[orgopsize],31,left.location.reference);                          cg.a_jmp_flags(current_asmdata.CurrAsmList,F_BE,l);                          { reset carry flag }                          current_asmdata.CurrAsmList.concat(taicpu.op_none(A_CLC,S_NO));                          cg.a_jmp_always(current_asmdata.CurrAsmList,l2);                          cg.a_label(current_asmdata.CurrAsmList,l);                          hreg:=cg.getintregister(current_asmdata.CurrAsmList,OS_32);                          cg.a_load_ref_reg(current_asmdata.CurrAsmList,OS_32,OS_32,left.location.reference,hreg);                          { We have to load the value into a register because                            btl does not accept values only refs or regs (PFV) }                          hreg2:=cg.getintregister(current_asmdata.CurrAsmList,OS_32);                          cg.a_load_const_reg(current_asmdata.CurrAsmList,OS_32,right.location.value,hreg2);                          emit_reg_reg(A_BT,S_L,hreg,hreg2);                       end;                  end;                  cg.a_label(current_asmdata.CurrAsmList,l2);{$endif i8086}                end { of right.location.loc=LOC_CONSTANT }               { do search in a normal set which could have >32 elementsm                 but also used if the left side contains values > 32 or < 0 }               else if left.location.loc=LOC_CONSTANT then                begin                  if (left.location.value<setbase) or (((left.location.value-setbase) shr 3) >= right.resultdef.size) then                    {should be caught earlier }                    internalerror(2007020201);                  location.resflags:=F_NE;                  case right.location.loc of                    LOC_REFERENCE,LOC_CREFERENCE:                      begin                        inc(right.location.reference.offset,(left.location.value-setbase) shr 3);                        cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                        emit_const_ref(A_TEST,S_B,1 shl ((left.location.value-setbase) and 7),right.location.reference);                      end;                    LOC_REGISTER,LOC_CREGISTER:                      begin                        cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                        emit_const_reg(A_TEST,TCGSize2OpSize[right.location.size],1 shl (left.location.value-setbase),right.location.register);                      end;                    else                      internalerror(2007051901);                  end;                end               else                begin{$ifdef i8086}                  hlcg.location_force_reg(current_asmdata.CurrAsmList,left.location,left.resultdef,opdef,false);                  register_maybe_adjust_setbase(current_asmdata.CurrAsmList,opdef,left.location,setbase);                  if TCGSize2Size[left.location.size] > 2 then                    left.location.size := OS_16;                  if not use_small then                    begin                      extra_offset_reg:=cg.getintregister(current_asmdata.CurrAsmList,OS_16);                      cg.a_load_loc_reg(current_asmdata.CurrAsmList,OS_16,left.location,extra_offset_reg);                      cg.a_op_const_reg(current_asmdata.CurrAsmList,OP_SHR,OS_16,4,extra_offset_reg);                      cg.a_op_const_reg(current_asmdata.CurrAsmList,OP_SHL,OS_16,1,extra_offset_reg);                    end                  else                    extra_offset_reg:=NR_NO;                  cg.getcpuregister(current_asmdata.CurrAsmList,NR_CX);                  cg.a_load_loc_reg(current_asmdata.CurrAsmList,OS_16,left.location,NR_CX);                  if not use_small then                    current_asmdata.CurrAsmList.concat(taicpu.op_const_reg(A_AND,S_B,15,NR_CL));                  pleftreg:=cg.getintregister(current_asmdata.CurrAsmList,OS_16);                  if (right.location.loc in [LOC_REGISTER,LOC_CREGISTER]) then                    hlcg.location_force_reg(current_asmdata.CurrAsmList,right.location,right.resultdef,opdef,true);                  if (opsize >= OS_S8) or { = if signed }                     ((left.resultdef.typ=orddef) and                      ((torddef(left.resultdef).low < int64(tsetdef(right.resultdef).setbase)) or                       (torddef(left.resultdef).high > int64(tsetdef(right.resultdef).setmax)))) or                     ((left.resultdef.typ=enumdef) and                      ((tenumdef(left.resultdef).min < aint(tsetdef(right.resultdef).setbase)) or                       (tenumdef(left.resultdef).max > aint(tsetdef(right.resultdef).setmax)))) then                   begin                    { we have to check if the value is < 0 or > setmax }                    current_asmdata.getjumplabel(l);                    current_asmdata.getjumplabel(l2);                    { BE will be false for negative values }                    cg.a_cmp_const_reg_label(current_asmdata.CurrAsmList,opsize,OC_BE,tsetdef(right.resultdef).setmax-tsetdef(right.resultdef).setbase,pleftreg,l);                    { set the zero flag }                    cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                    current_asmdata.CurrAsmList.concat(taicpu.op_const_reg(A_TEST,S_B,0,NR_AL));                    cg.a_jmp_always(current_asmdata.CurrAsmList,l2);                    cg.a_label(current_asmdata.CurrAsmList,l);                    cg.a_reg_dealloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                    emit_const_reg(A_MOV,S_W,1,pleftreg);                    emit_reg_reg(A_SHL,S_W,NR_CL,pleftreg);                    cg.ungetcpuregister(current_asmdata.CurrAsmList,NR_CX);                    case right.location.loc of                      LOC_REGISTER, LOC_CREGISTER :                        begin                          cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                          emit_reg_reg(A_TEST,S_W,pleftreg,right.location.register);                        end;                      LOC_CREFERENCE, LOC_REFERENCE :                        begin                          if not use_small then                            add_extra_offset(extra_offset_reg,right.location.reference);                          cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                          emit_reg_ref(A_TEST,S_W,pleftreg,right.location.reference);                        end;                    else                      internalerror(2007020301);                    end;                    cg.a_label(current_asmdata.CurrAsmList,l2);                    location.resflags:=F_NE;                   end                  else                   begin                      emit_const_reg(A_MOV,S_W,1,pleftreg);                      emit_reg_reg(A_SHL,S_W,NR_CL,pleftreg);                      cg.ungetcpuregister(current_asmdata.CurrAsmList,NR_CX);                      case right.location.loc of                        LOC_REGISTER, LOC_CREGISTER :                          begin                            cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                            emit_reg_reg(A_TEST,S_W,pleftreg,right.location.register);                          end;                        LOC_CREFERENCE, LOC_REFERENCE :                          begin                            if not use_small then                              add_extra_offset(extra_offset_reg,right.location.reference);                            cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                            emit_reg_ref(A_TEST,S_W,pleftreg,right.location.reference);                          end;                      else                        internalerror(2007020302);                      end;                      location.resflags:=F_NE;                   end;{$else i8086}                  hlcg.location_force_reg(current_asmdata.CurrAsmList,left.location,left.resultdef,opdef,false);                  register_maybe_adjust_setbase(current_asmdata.CurrAsmList,opdef,left.location,setbase);                  if (right.location.loc in [LOC_REGISTER,LOC_CREGISTER]) or                    { bt ...,[mem] is slow, see #40039, so try to use a register if we are not optimizing for size }                    ((right.resultdef.size<=opdef.size) and not(cs_opt_size in current_settings.optimizerswitches)) then                    hlcg.location_force_reg(current_asmdata.CurrAsmList,right.location,right.resultdef,opdef,true);                  pleftreg:=left.location.register;                  if (opsize >= OS_S8) or { = if signed }                     ((left.resultdef.typ=orddef) and                      ((torddef(left.resultdef).low < int64(tsetdef(right.resultdef).setbase)) or                       (torddef(left.resultdef).high > int64(tsetdef(right.resultdef).setmax)))) or                     ((left.resultdef.typ=enumdef) and                      ((tenumdef(left.resultdef).min < aint(tsetdef(right.resultdef).setbase)) or                       (tenumdef(left.resultdef).max > aint(tsetdef(right.resultdef).setmax)))) then                    begin                      { we have to check if the value is < 0 or > setmax }                      current_asmdata.getjumplabel(l);                      current_asmdata.getjumplabel(l2);                      { BE will be false for negative values }                      cg.a_cmp_const_reg_label(current_asmdata.CurrAsmList,opsize,OC_BE,tsetdef(right.resultdef).setmax-tsetdef(right.resultdef).setbase,pleftreg,l);                      cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                      { reset carry flag }                      current_asmdata.CurrAsmList.concat(taicpu.op_none(A_CLC,S_NO));                      cg.a_jmp_always(current_asmdata.CurrAsmList,l2);                      cg.a_label(current_asmdata.CurrAsmList,l);                      pleftreg:=left.location.register;                      case right.location.loc of                        LOC_REGISTER, LOC_CREGISTER :                          emit_reg_reg(A_BT,S_L,pleftreg,right.location.register);                        LOC_CREFERENCE, LOC_REFERENCE :                          emit_reg_ref(A_BT,S_L,pleftreg,right.location.reference);                      else                        internalerror(2007020301);                      end;                      cg.a_label(current_asmdata.CurrAsmList,l2);                      location.resflags:=F_C;                    end                  else                    begin                      cg.a_reg_alloc(current_asmdata.CurrAsmList, NR_DEFAULTFLAGS);                      case right.location.loc of                        LOC_REGISTER, LOC_CREGISTER :                          emit_reg_reg(A_BT,S_L,pleftreg,right.location.register);                        LOC_CREFERENCE, LOC_REFERENCE :                          emit_reg_ref(A_BT,S_L,pleftreg,right.location.reference);                      else                        internalerror(2007020302);                      end;                      location.resflags:=F_C;                    end;{$endif i8086}                end;             end;          end;          if not genjumps then            location_freetemp(current_asmdata.CurrAsmList,right.location);       end;begin   cinnode:=tx86innode;   ccasenode:=tx86casenode;end.
 |