diff options
author | Nick Ing-Simmons <nik@tiuk.ti.com> | 2000-09-03 21:54:46 +0000 |
---|---|---|
committer | Nick Ing-Simmons <nik@tiuk.ti.com> | 2000-09-03 21:54:46 +0000 |
commit | 1c846c1f6d96d2ca4dfccdcfc0ff050c1474993e (patch) | |
tree | 052cab67c23c5f42f2f3fbf0d595e76961d271d2 /sv.c | |
parent | 6570e624857a0fc90e8fa87d3479a32bd7482703 (diff) | |
download | perl-1c846c1f6d96d2ca4dfccdcfc0ff050c1474993e.tar.gz |
Hash lookup of constant strings optimization:
Introduce SvREADONLY && SvFAKE to flag an SV which has SvPVX pointing
to string table (as per sharepvn). Add newSV_pvn_share to create such
a thing. Make hv.c compare addresses of strings and skip string compare
if equal. Make method_named and helem ops use these shared-string SVs
when arg is constant. Make keys op return shared-string SVs (less clearly
a win).
p4raw-id: //depot/perl@7016
Diffstat (limited to 'sv.c')
-rw-r--r-- | sv.c | 156 |
1 files changed, 101 insertions, 55 deletions
@@ -834,7 +834,7 @@ S_more_xpvbm(pTHX) #define new_XPVHV() my_safemalloc(sizeof(XPVHV)) #define del_XPVHV(p) my_safefree(p) - + #define new_XPVMG() my_safemalloc(sizeof(XPVMG)) #define del_XPVMG(p) my_safefree(p) @@ -872,7 +872,7 @@ S_more_xpvbm(pTHX) #define new_XPVHV() (void*)new_xpvhv() #define del_XPVHV(p) del_xpvhv((XPVHV *)p) - + #define new_XPVMG() (void*)new_xpvmg() #define del_XPVMG(p) del_xpvmg((XPVMG *)p) @@ -886,10 +886,10 @@ S_more_xpvbm(pTHX) #define new_XPVGV() my_safemalloc(sizeof(XPVGV)) #define del_XPVGV(p) my_safefree(p) - + #define new_XPVFM() my_safemalloc(sizeof(XPVFM)) #define del_XPVFM(p) my_safefree(p) - + #define new_XPVIO() my_safemalloc(sizeof(XPVIO)) #define del_XPVIO(p) my_safefree(p) @@ -1523,7 +1523,7 @@ Perl_sv_2iv(pTHX_ register SV *sv) SvUVX(sv) = U_V(SvNVX(sv)); SvIsUV_on(sv); ret_iv_max: - DEBUG_c(PerlIO_printf(Perl_debug_log, + DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2iv(%"UVuf" => %"IVdf") (as unsigned)\n", PTR2UV(sv), SvUVX(sv), @@ -1537,7 +1537,7 @@ Perl_sv_2iv(pTHX_ register SV *sv) /* We want to avoid a possible problem when we cache an IV which may be later translated to an NV, and the resulting NV is not the translation of the initial data. - + This means that if we cache such an IV, we need to cache the NV as well. Moreover, we trade speed for space, and do not cache the NV if not needed. @@ -1652,7 +1652,7 @@ Perl_sv_2uv(pTHX_ register SV *sv) else { SvIVX(sv) = I_V(SvNVX(sv)); ret_zero: - DEBUG_c(PerlIO_printf(Perl_debug_log, + DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2uv(%"IVdf" => %"IVdf") (as signed)\n", PTR2UV(sv), SvIVX(sv), @@ -1666,7 +1666,7 @@ Perl_sv_2uv(pTHX_ register SV *sv) /* We want to avoid a possible problem when we cache a UV which may be later translated to an NV, and the resulting NV is not the translation of the initial data. - + This means that if we cache such a UV, we need to cache the NV as well. Moreover, we trade speed for space, and do not cache the NV if not needed. @@ -1768,7 +1768,7 @@ Perl_sv_2nv(pTHX_ register SV *sv) return Atof(SvPVX(sv)); } if (SvIOKp(sv)) { - if (SvIsUV(sv)) + if (SvIsUV(sv)) return (NV)SvUVX(sv); else return (NV)SvIVX(sv); @@ -1928,7 +1928,7 @@ Perl_looks_like_number(pTHX_ SV *sv) STRLEN len; if (SvPOK(sv)) { - sbegin = SvPVX(sv); + sbegin = SvPVX(sv); len = SvCUR(sv); } else if (SvPOKp(sv)) @@ -1966,7 +1966,7 @@ Perl_looks_like_number(pTHX_ SV *sv) numtype |= IS_NUMBER_TO_INT_BY_ATOL; if (*s == '.' -#ifdef USE_LOCALE_NUMERIC +#ifdef USE_LOCALE_NUMERIC || IS_NUMERIC_RADIX(*s) #endif ) { @@ -1977,7 +1977,7 @@ Perl_looks_like_number(pTHX_ SV *sv) } } else if (*s == '.' -#ifdef USE_LOCALE_NUMERIC +#ifdef USE_LOCALE_NUMERIC || IS_NUMERIC_RADIX(*s) #endif ) { @@ -2087,7 +2087,7 @@ Perl_sv_2pv(pTHX_ register SV *sv, STRLEN *lp) return SvPVX(sv); } if (SvIOKp(sv)) { - if (SvIsUV(sv)) + if (SvIsUV(sv)) (void)sprintf(tmpbuf,"%"UVuf, (UV)SvUVX(sv)); else (void)sprintf(tmpbuf,"%"IVdf, (IV)SvIVX(sv)); @@ -2123,7 +2123,7 @@ Perl_sv_2pv(pTHX_ register SV *sv, STRLEN *lp) switch (SvTYPE(sv)) { case SVt_PVMG: if ( ((SvFLAGS(sv) & - (SVs_OBJECT|SVf_OK|SVs_GMG|SVs_SMG|SVs_RMG)) + (SVs_OBJECT|SVf_OK|SVs_GMG|SVs_SMG|SVs_RMG)) == (SVs_OBJECT|SVs_RMG)) && strEQ(s=HvNAME(SvSTASH(sv)), "Regexp") && (mg = mg_find(sv, 'r'))) { @@ -2212,7 +2212,7 @@ Perl_sv_2pv(pTHX_ register SV *sv, STRLEN *lp) * --jhi Sep 1999 */ if (SvTYPE(sv) < SVt_PVNV) sv_upgrade(sv, SVt_PVNV); - /* The +20 is pure guesswork. Configure test needed. --jhi */ + /* The +20 is pure guesswork. Configure test needed. --jhi */ SvGROW(sv, NV_DIG + 20); s = SvPVX(sv); olderrno = errno; /* some Xenix systems wipe out errno here */ @@ -2346,7 +2346,7 @@ Perl_sv_2pvutf8(pTHX_ register SV *sv, STRLEN *lp) sv_utf8_upgrade(sv); return sv_2pv(sv,lp); } - + /* This function is only called on magical items */ bool Perl_sv_2bool(pTHX_ register SV *sv) @@ -2498,7 +2498,7 @@ Perl_sv_utf8_downgrade(pTHX_ register SV* sv, bool fail_ok) =for apidoc sv_utf8_encode Convert the PV of an SV to UTF8-encoded, but then turn off the C<SvUTF8> -flag so that it looks like bytes again. Nothing calls this. +flag so that it looks like bytes again. Nothing calls this. =cut */ @@ -2787,22 +2787,22 @@ Perl_sv_setsv(pTHX_ SV *dstr, register SV *sstr) (CvROOT(cv) || CvXSUB(cv))) { SV *const_sv = cv_const_sv(cv); - bool const_changed = TRUE; + bool const_changed = TRUE; if(const_sv) - const_changed = sv_cmp(const_sv, - op_const_sv(CvSTART((CV*)sref), + const_changed = sv_cmp(const_sv, + op_const_sv(CvSTART((CV*)sref), (CV*)sref)); /* ahem, death to those who redefine * active sort subs */ if (PL_curstackinfo->si_type == PERLSI_SORT && PL_sortcop == CvSTART(cv)) - Perl_croak(aTHX_ + Perl_croak(aTHX_ "Can't redefine active sort subroutine %s", GvENAME((GV*)dstr)); if ((const_changed && const_sv) || ckWARN(WARN_REDEFINE)) - Perl_warner(aTHX_ WARN_REDEFINE, const_sv ? + Perl_warner(aTHX_ WARN_REDEFINE, const_sv ? "Constant subroutine %s redefined" - : "Subroutine %s redefined", + : "Subroutine %s redefined", GvENAME((GV*)dstr)); } cv_ckproto(cv, (GV*)dstr, @@ -2888,7 +2888,8 @@ Perl_sv_setsv(pTHX_ SV *dstr, register SV *sstr) if (SvTEMP(sstr) && /* slated for free anyway? */ SvREFCNT(sstr) == 1 && /* and no other references to it? */ - !(sflags & SVf_OOK)) /* and not involved in OOK hack? */ + !(sflags & SVf_OOK) && /* and not involved in OOK hack? */ + SvLEN(sstr)) /* and really is a string */ { if (SvPVX(dstr)) { /* we know that dtype >= SVt_PV */ if (SvOOK(dstr)) { @@ -3070,7 +3071,7 @@ Perl_sv_setpv_mg(pTHX_ register SV *sv, register const char *ptr) =for apidoc sv_usepvn Tells an SV to use C<ptr> to find its string value. Normally the string is -stored inside the SV but sv_usepvn allows the SV to use an outside string. +stored inside the SV but sv_usepvn allows the SV to use an outside string. The C<ptr> should point to memory that was allocated by C<malloc>. The string length, C<len>, must be supplied. This function will realloc the memory pointed to by C<ptr>, so that pointer should not be freed or used by @@ -3121,7 +3122,18 @@ Perl_sv_force_normal(pTHX_ register SV *sv) { if (SvREADONLY(sv)) { dTHR; - if (PL_curcop != &PL_compiling) + if (SvFAKE(sv)) { + char *pvx = SvPVX(sv); + STRLEN len = SvCUR(sv); + U32 hash = SvUVX(sv); + SvGROW(sv, len + 1); + Move(pvx,SvPVX(sv),len,char); + *SvEND(sv) = '\0'; + SvFAKE_off(sv); + SvREADONLY_off(sv); + unsharepvn(pvx,len,hash); + } + else if (PL_curcop != &PL_compiling) Perl_croak(aTHX_ PL_no_modify); } if (SvROK(sv)) @@ -3129,11 +3141,11 @@ Perl_sv_force_normal(pTHX_ register SV *sv) else if (SvFAKE(sv) && SvTYPE(sv) == SVt_PVGV) sv_unglob(sv); } - + /* =for apidoc sv_chop -Efficient removal of characters from the beginning of the string buffer. +Efficient removal of characters from the beginning of the string buffer. SvPOK(sv) must be true and the C<ptr> must be a pointer to somewhere inside the string buffer. The C<ptr> becomes the first character of the adjusted string. @@ -3143,8 +3155,8 @@ string. void Perl_sv_chop(pTHX_ register SV *sv, register char *ptr) /* like set but assuming ptr is in sv */ - - + + { register STRLEN delta; @@ -3305,7 +3317,7 @@ SV * Perl_newSV(pTHX_ STRLEN len) { register SV *sv; - + new_SV(sv); if (len) { sv_upgrade(sv, SVt_PV); @@ -3328,7 +3340,7 @@ void Perl_sv_magic(pTHX_ register SV *sv, SV *obj, int how, const char *name, I32 namlen) { MAGIC* mg; - + if (SvREADONLY(sv)) { dTHR; if (PL_curcop != &PL_compiling && !strchr("gBf", how)) @@ -3362,7 +3374,7 @@ Perl_sv_magic(pTHX_ register SV *sv, SV *obj, int how, const char *name, I32 nam mg->mg_ptr = savepvn(name, namlen); else if (namlen == HEf_SVKEY) mg->mg_ptr = (char*)SvREFCNT_inc((SV*)name); - + switch (how) { case 0: mg->mg_virtual = &PL_vtbl_sv; @@ -3548,7 +3560,7 @@ Perl_sv_rvweaken(pTHX_ SV *sv) tsv = SvRV(sv); sv_add_backref(tsv, sv); SvWEAKREF_on(sv); - SvREFCNT_dec(tsv); + SvREFCNT_dec(tsv); return sv; } @@ -3567,7 +3579,7 @@ S_sv_add_backref(pTHX_ SV *tsv, SV *sv) av_push(av,sv); } -STATIC void +STATIC void S_sv_del_backref(pTHX_ SV *sv) { AV *av; @@ -3606,7 +3618,7 @@ Perl_sv_insert(pTHX_ SV *bigstr, STRLEN offset, STRLEN len, char *little, STRLEN register char *bigend; register I32 i; STRLEN curlen; - + if (!bigstr) Perl_croak(aTHX_ "Can't modify non-existent substring"); @@ -3843,6 +3855,10 @@ Perl_sv_clear(pTHX_ register SV *sv) } else if (SvPVX(sv) && SvLEN(sv)) Safefree(SvPVX(sv)); + else if (SvPVX(sv) && SvREADONLY(sv) && SvFAKE(sv)) { + unsharepvn(SvPVX(sv),SvCUR(sv),SvUVX(sv)); + SvFAKE_off(sv); + } break; /* case SVt_NV: @@ -4081,7 +4097,7 @@ Perl_sv_pos_b2u(pTHX_ register SV *sv, I32* offsetp) } if (s != send) { dTHR; - if (ckWARN_d(WARN_UTF8)) + if (ckWARN_d(WARN_UTF8)) Perl_warner(aTHX_ WARN_UTF8, "Malformed UTF-8 character"); --len; } @@ -4161,7 +4177,7 @@ Perl_sv_cmp(pTHX_ register SV *sv1, register SV *sv2) { STRLEN cur1, cur2; char *pv1, *pv2; - I32 cmp; + I32 cmp; bool pv1tmp = FALSE; bool pv2tmp = FALSE; @@ -4400,7 +4416,7 @@ Perl_sv_gets(pTHX_ register SV *sv, register PerlIO *fp, I32 append) /* See if we know enough about I/O mechanism to cheat it ! */ /* This used to be #ifdef test - it is made run-time test for ease - of abstracting out stdio interface. One call should be cheap + of abstracting out stdio interface. One call should be cheap enough here - and may even be a macro allowing compile time optimization. */ @@ -4448,7 +4464,7 @@ Perl_sv_gets(pTHX_ register SV *sv, register PerlIO *fp, I32 append) "Screamer: entering, ptr=%"UVuf", cnt=%ld\n",PTR2UV(ptr),(long)cnt)); DEBUG_P(PerlIO_printf(Perl_debug_log, "Screamer: entering: FILE * thinks ptr=%"UVuf", cnt=%ld, base=%"UVuf"\n", - PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp), + PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp), PTR2UV(PerlIO_has_base(fp) ? PerlIO_get_base(fp) : 0))); for (;;) { screamer: @@ -4461,8 +4477,8 @@ Perl_sv_gets(pTHX_ register SV *sv, register PerlIO *fp, I32 append) } } else { - Copy(ptr, bp, cnt, char); /* this | eat */ - bp += cnt; /* screams | dust */ + Copy(ptr, bp, cnt, char); /* this | eat */ + bp += cnt; /* screams | dust */ ptr += cnt; /* louder | sed :-) */ cnt = 0; } @@ -4484,15 +4500,15 @@ Perl_sv_gets(pTHX_ register SV *sv, register PerlIO *fp, I32 append) PerlIO_set_ptrcnt(fp, ptr, cnt); /* deregisterize cnt and ptr */ DEBUG_P(PerlIO_printf(Perl_debug_log, "Screamer: pre: FILE * thinks ptr=%"UVuf", cnt=%ld, base=%"UVuf"\n", - PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp), + PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp), PTR2UV(PerlIO_has_base (fp) ? PerlIO_get_base(fp) : 0))); - /* This used to call 'filbuf' in stdio form, but as that behaves like + /* This used to call 'filbuf' in stdio form, but as that behaves like getc when cnt <= 0 we use PerlIO_getc here to avoid introducing another abstraction. */ i = PerlIO_getc(fp); /* get more characters */ DEBUG_P(PerlIO_printf(Perl_debug_log, "Screamer: post: FILE * thinks ptr=%"UVuf", cnt=%ld, base=%"UVuf"\n", - PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp), + PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp), PTR2UV(PerlIO_has_base (fp) ? PerlIO_get_base(fp) : 0))); cnt = PerlIO_get_cnt(fp); ptr = (STDCHAR*)PerlIO_get_ptr(fp); /* reregisterize cnt and ptr */ @@ -4525,7 +4541,7 @@ thats_really_all_folks: PerlIO_set_ptrcnt(fp, ptr, cnt); /* put these back or we're in trouble */ DEBUG_P(PerlIO_printf(Perl_debug_log, "Screamer: end: FILE * thinks ptr=%"UVuf", cnt=%ld, base=%"UVuf"\n", - PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp), + PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp), PTR2UV(PerlIO_has_base (fp) ? PerlIO_get_base(fp) : 0))); *bp = '\0'; SvCUR_set(sv, bp - (STDCHAR*)SvPVX(sv)); /* set length */ @@ -4589,7 +4605,7 @@ screamer2: } } - if (RsPARA(PL_rs)) { /* have to do this both before and after */ + if (RsPARA(PL_rs)) { /* have to do this both before and after */ while (i != EOF) { /* to make sure file boundaries work right */ i = PerlIO_getc(fp); if (i != '\n') { @@ -4655,7 +4671,7 @@ Perl_sv_inc(pTHX_ register SV *sv) else { (void)SvIOK_only(sv); ++SvIVX(sv); - } + } } return; } @@ -4685,7 +4701,7 @@ Perl_sv_inc(pTHX_ register SV *sv) /* MKS: The original code here died if letters weren't consecutive. * at least it didn't have to worry about non-C locales. The * new code assumes that ('z'-'a')==('Z'-'A'), letters are - * arranged in order (although not consecutively) and that only + * arranged in order (although not consecutively) and that only * [A-Za-z] are accepted by isALPHA in the C locale. */ if (*d != 'z' && *d != 'Z') { @@ -4759,14 +4775,14 @@ Perl_sv_dec(pTHX_ register SV *sv) else { (void)SvIOK_only_UV(sv); --SvUVX(sv); - } + } } else { if (SvIVX(sv) == IV_MIN) sv_setnv(sv, (NV)IV_MIN - 1.0); else { (void)SvIOK_only(sv); --SvIVX(sv); - } + } } return; } @@ -4880,7 +4896,7 @@ Perl_newSVpv(pTHX_ const char *s, STRLEN len) =for apidoc newSVpvn Creates a new SV and copies a string into it. The reference count for the -SV is set to 1. Note that if C<len> is zero, Perl will create a zero length +SV is set to 1. Note that if C<len> is zero, Perl will create a zero length string. You are responsible for ensuring that the source string is at least C<len> bytes long. @@ -4897,6 +4913,36 @@ Perl_newSVpvn(pTHX_ const char *s, STRLEN len) return sv; } +/* +=for apidoc newSVpvn_share + +Creates a new SV and populates it with a string from +the string table. Turns on READONLY and FAKE. +The idea here is that as string table is used for shared hash +keys these strings will have SvPVX == HeKEY and hash lookup +will avoid string compare. + +=cut +*/ + +SV * +Perl_newSVpvn_share(pTHX_ const char *src, STRLEN len, U32 hash) +{ + register SV *sv; + if (!hash) + PERL_HASH(hash, src, len); + new_SV(sv); + sv_upgrade(sv, SVt_PVIV); + SvPVX(sv) = sharepvn(src, len, hash); + SvCUR(sv) = len; + SvUVX(sv) = hash; + SvLEN(sv) = 0; + SvREADONLY_on(sv); + SvFAKE_on(sv); + SvPOK_on(sv); + return sv; +} + #if defined(PERL_IMPLICIT_CONTEXT) SV * Perl_newSVpvf_nocontext(const char* pat, ...) @@ -5341,7 +5387,7 @@ Perl_sv_pvn_force(pTHX_ SV *sv, STRLEN *lp) if (SvTHINKFIRST(sv) && !SvROK(sv)) sv_force_normal(sv); - + if (SvPOK(sv)) { *lp = SvCUR(sv); } @@ -5355,7 +5401,7 @@ Perl_sv_pvn_force(pTHX_ SV *sv, STRLEN *lp) s = sv_2pv(sv, lp); if (s != SvPVX(sv)) { /* Almost, but not quite, sv_setpvn() */ STRLEN len = *lp; - + if (SvROK(sv)) sv_unref(sv); (void)SvUPGRADE(sv, SVt_PV); /* Never FALSE */ @@ -6622,7 +6668,7 @@ Perl_sv_vcatpvfn(pTHX_ SV *sv, const char *pat, STRLEN patlen, va_list *args, SV (PL_op->op_type == OP_PRTF) ? "printf" : "sprintf"); if (c) { if (isPRINT(c)) - Perl_sv_catpvf(aTHX_ msg, + Perl_sv_catpvf(aTHX_ msg, "\"%%%c\"", c & 0xFF); else Perl_sv_catpvf(aTHX_ msg, |