perl/universal.c
James E Keenan f430ad845a Fatalization of calling import/unimport method with argument
This commit is mostly a manual reversion of commit f1cf82e.  Return to
using a perl_croak in universal.c; adjust regen/warnings.pl as needed; run 'make
regen'; get t/op/universal.t passing.  No documentation changes yet.

Add test for undefined unimport method, then refactor repeated code into
a subroutine.  Perform a pattern match rather than a string equality
test because testing for exact line numbers inside a test program is too
fragile for maintenance purposes.

'mispelled' was misspelled in one location; correct.  Suppress 'used
only once' warning in one location.  POD formatting improvements as
suggested by Elvin Aslanov, with one other word change.

Correct case of one character in error message so that it's the same in
both universal.c and pod/perldiag.pod.  This enables us to preserve
status of universal.c in t/porting/diag.t.  Per: Tony Cook review.

Rebasing on blead in the wake of d306795336, meant that merge conflicts
appeared, which necessitated two rounds of running 'make regen'.
Simplify test_undefined_method(). Update entry in
pod/perldeprecation.pod.

For: GH #23623
2025-12-19 06:51:32 -05:00

1443 lines
40 KiB
C

#line 2 "universal.c"
/* universal.c
*
* Copyright (C) 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004,
* 2005, 2006, 2007, 2008 by Larry Wall and others
*
* You may distribute under the terms of either the GNU General Public
* License or the Artistic License, as specified in the README file.
*
*/
/*
* '"The roots of those mountains must be roots indeed; there must be
* great secrets buried there which have not been discovered since the
* beginning."' --Gandalf, relating Gollum's history
*
* [p.54 of _The Lord of the Rings_, I/ii: "The Shadow of the Past"]
*/
/* This file contains the code that implements the functions in Perl's
* UNIVERSAL package, such as UNIVERSAL->can().
*
* It is also used to store XS functions that need to be present in
* miniperl for a lack of a better place to put them. It might be
* clever to move them to separate XS files which would then be pulled
* in by some to-be-written build process.
*/
#include "EXTERN.h"
#define PERL_IN_UNIVERSAL_C
#include "perl.h"
#if defined(USE_PERLIO)
#include "perliol.h" /* For the PERLIO_F_XXX */
#endif
/*
* Contributed by Graham Barr <Graham.Barr@tiuk.ti.com>
* The main guts of traverse_isa was actually copied from gv_fetchmeth
*/
STATIC bool
S_isa_lookup(pTHX_ HV *stash, SV *namesv, const char * name, STRLEN len, U32 flags)
{
PERL_ARGS_ASSERT_ISA_LOOKUP;
const struct mro_meta *const meta = HvMROMETA(stash);
HV *isa = meta->isa;
const HV *our_stash;
if (!isa) {
(void)mro_get_linear_isa(stash);
isa = meta->isa;
}
if (hv_common(isa, namesv, name, len, ( flags & SVf_UTF8 ? HVhek_UTF8 : 0),
HV_FETCH_ISEXISTS, NULL, 0)) {
/* Direct name lookup worked. */
return TRUE;
}
/* A stash/class can go by many names (ie. User == main::User), so
we use the HvENAME in the stash itself, which is canonical, falling
back to HvNAME if necessary. */
our_stash = gv_stashsvpvn_cached(namesv, name, len, flags);
if (our_stash) {
HEK *canon_name = HvENAME_HEK(our_stash);
if (!canon_name) canon_name = HvNAME_HEK(our_stash);
assert(canon_name);
if (hv_common(isa, NULL, HEK_KEY(canon_name), HEK_LEN(canon_name),
HEK_FLAGS(canon_name),
HV_FETCH_ISEXISTS, NULL, HEK_HASH(canon_name))) {
return TRUE;
}
}
return FALSE;
}
STATIC bool
S_sv_derived_from_svpvn(pTHX_ SV *sv, SV *namesv, const char * name, const STRLEN len, U32 flags)
{
HV* stash;
PERL_ARGS_ASSERT_SV_DERIVED_FROM_SVPVN;
SvGETMAGIC(sv);
if (SvROK(sv)) {
const char *type;
sv = SvRV(sv);
type = sv_reftype(sv,0);
if (type) {
if (namesv)
name = SvPV_nolen(namesv);
if (strEQ(name, type))
return TRUE;
}
if (!SvOBJECT(sv))
return FALSE;
stash = SvSTASH(sv);
}
else {
stash = gv_stashsv(sv, 0);
}
if (stash && isa_lookup(stash, namesv, name, len, flags))
return TRUE;
stash = gv_stashpvs("UNIVERSAL", 0);
return stash && isa_lookup(stash, namesv, name, len, flags);
}
/*
=for apidoc_section $SV
=for apidoc sv_derived_from
=for apidoc_item sv_derived_from_hv
=for apidoc_item sv_derived_from_pv
=for apidoc_item sv_derived_from_pvn
=for apidoc_item sv_derived_from_sv
These each return a boolean indicating whether C<sv> is derived from the
specified class I<at the C level>. To check derivation at the Perl level, call
C<isa()> as a normal Perl method.
The differences between the forms is how the class is specified, and the
UTF-8ness of its name.
In C<sv_derived_from_sv>, the class name is extracted from C<namesv> using
some version of L</C<SvPV>>. This is the preferred form. The class name is
considered to be in UTF-8 iff C<namesv> is marked as such, hence C<flags> is
effectively currently ignored.
In C<sv_derived_from_hv>, the class name is C<HvNAME(hv)> (which would
presumably represent a stash). Its UTF8ness is C<HvNAMEUTF8(hv)>.
In the remaining forms, the class name is specified by the C<name> parameter.
In C<sv_derived_from> and C<sv_derived_from_pv>, it is a NUL-terminated C
string. In C<sv_derived_from_pvn>, C<name> points to the first byte of the
string specifying the class, and an additional parameter, C<len>, specifies
its length in bytes. Hence, C<name> may contain embedded-NUL characters.
C<name> is never considered to be encoded as UTF-8 in C<sv_derived_from>. The
remaining forms have a C<flags> parameter. If the C<SVf_UTF8> is set in it,
the class name is encoded as UTF-8; otherwise not. No other flags are
currently meaningful.
=cut
*/
bool
Perl_sv_derived_from_sv(pTHX_ SV *sv, SV *namesv, U32 flags)
{
PERL_ARGS_ASSERT_SV_DERIVED_FROM_SV;
return sv_derived_from_svpvn(sv, namesv, NULL, 0, flags);
}
bool
Perl_sv_derived_from(pTHX_ SV *sv, const char *const name)
{
PERL_ARGS_ASSERT_SV_DERIVED_FROM;
return sv_derived_from_svpvn(sv, NULL, name, strlen(name), 0);
}
bool
Perl_sv_derived_from_pv(pTHX_ SV *sv, const char *const name, U32 flags)
{
PERL_ARGS_ASSERT_SV_DERIVED_FROM_PV;
return sv_derived_from_svpvn(sv, NULL, name, strlen(name), flags);
}
bool
Perl_sv_derived_from_pvn(pTHX_ SV *sv, const char *const name, const STRLEN len, U32 flags)
{
PERL_ARGS_ASSERT_SV_DERIVED_FROM_PVN;
return sv_derived_from_svpvn(sv, NULL, name, len, flags);
}
bool
Perl_sv_derived_from_hv(pTHX_ SV *sv, HV *hv)
{
PERL_ARGS_ASSERT_SV_DERIVED_FROM_HV;
const char *hvname = HvNAME(hv);
if(!hvname)
return FALSE;
return sv_derived_from_svpvn(sv, NULL, hvname, HvNAMELEN(hv), HvNAMEUTF8(hv) ? SVf_UTF8 : 0);
}
/*
=for apidoc sv_isa_sv
Returns a boolean indicating whether the SV is an object reference and is
derived from the specified class, respecting any C<isa()> method overloading
it may have. Returns false if C<sv> is not a reference to an object, or is
not derived from the specified class.
This is the function used to implement the behaviour of the C<isa> operator.
Does not invoke magic on C<sv>.
Not to be confused with the older C<sv_isa> function, which does not use an
overloaded C<isa()> method, nor will check subclassing.
=cut
*/
bool
Perl_sv_isa_sv(pTHX_ SV *sv, SV *namesv)
{
GV *isagv;
PERL_ARGS_ASSERT_SV_ISA_SV;
if(!SvROK(sv) || !SvOBJECT(SvRV(sv)))
return FALSE;
isagv = gv_fetchmeth_pvn(SvSTASH(SvRV(sv)), "isa", 3, -1, GV_NOUNIVERSAL);
if(isagv) {
dSP;
CV *isacv = isGV(isagv) ? GvCV(isagv) : (CV *)isagv;
SV *retsv;
bool ret;
PUTBACK;
ENTER;
SAVETMPS;
EXTEND(SP, 2);
PUSHMARK(SP);
PUSHs(sv);
PUSHs(namesv);
PUTBACK;
call_sv((SV *)isacv, G_SCALAR);
SPAGAIN;
retsv = POPs;
ret = SvTRUE(retsv);
PUTBACK;
FREETMPS;
LEAVE;
return ret;
}
/* TODO: Support namesv being an HV ref to the stash directly? */
return sv_derived_from_sv(sv, namesv, 0);
}
/*
=for apidoc sv_does
=for apidoc_item sv_does_pv
=for apidoc_item sv_does_pvn
=for apidoc_item sv_does_sv
These each return a boolean indicating whether C<sv> performs a specific, named
role.
C<sv> can be a Perl object or the name of a Perl class.
The forms differ in how the role is specified.
In C<sv_does> and C<sv_does_pv>, the role is in C<name>, which is a
NUL-terminated string, which means that it may not contain embedded NUL
characters.
In C<sv_does_pvn>, the role is in C<name> whose length is given by C<len>.
Hence it may contain embedded NUL characters.
In C<sv_does_sv>, the role is extracted from C<namesv>. Its C<flags> argument
is currently ignored.
You can pass C<SVf_UTF8> to the other functions that have a C<flags> argument
to indicate that C<name> is encoded as UTF-8. C<sv_does> does not have a
C<flags> argument, so its role is never considered to be UTF-8.
=cut
The above is based on the behavior of newSVpvn_flags at the time of this
writing. It only recognizes SVs_TEMP and SVf_UTF8.
XXX extracted in sv_does_sv is more complicated than the hand waving above
*/
#include "XSUB.h"
bool
Perl_sv_does_sv(pTHX_ SV *sv, SV *namesv, U32 flags)
{
SV *classname;
bool does_it;
SV *methodname;
dSP;
PERL_ARGS_ASSERT_SV_DOES_SV;
PERL_UNUSED_ARG(flags);
ENTER;
SAVETMPS;
SvGETMAGIC(sv);
if (!SvOK(sv) || !(SvROK(sv) || (SvPOK(sv) && SvCUR(sv)))) {
LEAVE;
return FALSE;
}
if (SvROK(sv) && SvOBJECT(SvRV(sv))) {
classname = sv_ref(NULL,SvRV(sv),TRUE);
} else {
classname = sv;
}
if (sv_eq(classname, namesv)) {
LEAVE;
return TRUE;
}
PUSHMARK(SP);
EXTEND(SP, 2);
PUSHs(sv);
PUSHs(namesv);
PUTBACK;
/* create a PV with value "isa", but with a special address
* so that perl knows we're really doing "DOES" instead */
methodname = newSV_type_mortal(SVt_PV);
SvLEN_set(methodname, 0);
SvCUR_set(methodname, strlen(PL_isa_DOES));
SvPVX(methodname) = (char *)PL_isa_DOES; /* discard 'const' qualifier */
SvPOK_on(methodname);
call_sv(methodname, G_SCALAR | G_METHOD);
SPAGAIN;
does_it = SvTRUE_NN( TOPs );
FREETMPS;
LEAVE;
return does_it;
}
bool
Perl_sv_does(pTHX_ SV *sv, const char *const name)
{
PERL_ARGS_ASSERT_SV_DOES;
return sv_does_sv(sv, newSVpvn_flags(name, strlen(name), SVs_TEMP), 0);
}
bool
Perl_sv_does_pv(pTHX_ SV *sv, const char *const name, U32 flags)
{
PERL_ARGS_ASSERT_SV_DOES_PV;
return sv_does_sv(sv, newSVpvn_flags(name, strlen(name), SVs_TEMP | flags), flags);
}
bool
Perl_sv_does_pvn(pTHX_ SV *sv, const char *const name, const STRLEN len, U32 flags)
{
PERL_ARGS_ASSERT_SV_DOES_PVN;
return sv_does_sv(sv, newSVpvn_flags(name, len, flags | SVs_TEMP), flags);
}
/*
=for apidoc croak_xs_usage
A specialised variant of C<croak()> for emitting the usage message for xsubs
croak_xs_usage(cv, "eee_yow");
works out the package name and subroutine name from C<cv>, and then calls
C<croak()>. Hence if C<cv> is C<&ouch::awk>, it would call C<croak> as:
croak("Usage: %" SVf "::%" SVf "(%s)", "ouch", "awk",
"eee_yow");
=cut
*/
void
Perl_croak_xs_usage(const CV *const cv, const char *const params)
{
/* Avoid CvGV as it requires aTHX. */
const GV *gv = CvNAMED(cv) ? NULL : cv->sv_any->xcv_gv_u.xcv_gv;
PERL_ARGS_ASSERT_CROAK_XS_USAGE;
if (gv) got_gv: {
const HV *const stash = GvSTASH(gv);
if (HvNAME_get(stash))
/* diag_listed_as: SKIPME */
Perl_croak_nocontext("Usage: %" HEKf "::%" HEKf "(%s)",
HEKfARG(HvNAME_HEK(stash)),
HEKfARG(GvNAME_HEK(gv)),
params);
else
/* diag_listed_as: SKIPME */
Perl_croak_nocontext("Usage: %" HEKf "(%s)",
HEKfARG(GvNAME_HEK(gv)), params);
} else {
dTHX;
if ((gv = CvGV(cv))) goto got_gv;
/* Pants. I don't think that it should be possible to get here. */
/* diag_listed_as: SKIPME */
Perl_croak_nocontext("Usage: CODE(0x%" UVxf ")(%s)", PTR2UV(cv), params);
}
}
XS(XS_UNIVERSAL_isa); /* prototype to pass -Wmissing-prototypes */
XS(XS_UNIVERSAL_isa)
{
dXSARGS;
if (items != 2)
croak_xs_usage(cv, "reference, kind");
else {
SV * const sv = ST(0);
SvGETMAGIC(sv);
if (!SvOK(sv) || !(SvROK(sv) || (SvPOK(sv) && SvCUR(sv))))
XSRETURN_UNDEF;
ST(0) = boolSV(sv_derived_from_sv(sv, ST(1), 0));
XSRETURN(1);
}
}
XS(XS_UNIVERSAL_import_unimport); /* prototype to pass -Wmissing-prototypes */
XS(XS_UNIVERSAL_import_unimport)
{
dXSARGS;
dXSI32;
if (items > 1) {
char *class_pv= SvPV_nolen(ST(0));
if (strEQ(class_pv,"UNIVERSAL"))
croak("UNIVERSAL does not export anything");
/* _charnames is special - ignore it for now as the code that
* depends on it has its own "no import" logic that produces better
* warnings than this does. */
if (strNE(class_pv,"_charnames"))
Perl_croak(aTHX_
"Attempt to call undefined %s method with arguments via package "
"%" SVf_QUOTEDPREFIX " (Perhaps you forgot to load the package?)",
ix ? "unimport" : "import", SVfARG(ST(0)));
}
XSRETURN_EMPTY;
}
XS(XS_UNIVERSAL_can); /* prototype to pass -Wmissing-prototypes */
XS(XS_UNIVERSAL_can)
{
dXSARGS;
SV *sv;
SV *rv;
HV *pkg = NULL;
GV *iogv;
if (items != 2)
croak_xs_usage(cv, "object-ref, method");
sv = ST(0);
SvGETMAGIC(sv);
/* Reject undef and empty string. Note that the string form takes
precedence here over the numeric form, as (!1)->foo treats the
invocant as the empty string, though it is a dualvar. */
if (!SvOK(sv) || (SvPOK(sv) && !SvCUR(sv)))
XSRETURN_UNDEF;
rv = &PL_sv_undef;
if (SvROK(sv)) {
sv = MUTABLE_SV(SvRV(sv));
if (SvOBJECT(sv))
pkg = SvSTASH(sv);
else if (isGV_with_GP(sv) && GvIO(sv))
pkg = SvSTASH(GvIO(sv));
}
else if (isGV_with_GP(sv) && GvIO(sv))
pkg = SvSTASH(GvIO(sv));
else if ((iogv = gv_fetchsv_nomg(sv, 0, SVt_PVIO)) && GvIO(iogv))
pkg = SvSTASH(GvIO(iogv));
else {
pkg = gv_stashsv(sv, 0);
if (!pkg)
pkg = gv_stashpvs("UNIVERSAL", 0);
}
if (pkg) {
GV * const gv = gv_fetchmethod_sv_flags(pkg, ST(1), 0);
if (gv && isGV(gv))
rv = sv_2mortal(newRV(MUTABLE_SV(GvCV(gv))));
}
ST(0) = rv;
XSRETURN(1);
}
XS(XS_UNIVERSAL_DOES); /* prototype to pass -Wmissing-prototypes */
XS(XS_UNIVERSAL_DOES)
{
dXSARGS;
PERL_UNUSED_ARG(cv);
if (items != 2)
croak("Usage: invocant->DOES(kind)");
else {
SV * const sv = ST(0);
if (sv_does_sv( sv, ST(1), 0 ))
XSRETURN_YES;
XSRETURN_NO;
}
}
XS(XS_utf8_is_utf8); /* prototype to pass -Wmissing-prototypes */
XS(XS_utf8_is_utf8)
{
dXSARGS;
if (items != 1)
croak_xs_usage(cv, "sv");
else {
SV * const sv = ST(0);
SvGETMAGIC(sv);
if (SvUTF8(sv))
XSRETURN_YES;
else
XSRETURN_NO;
}
XSRETURN_EMPTY;
}
XS(XS_utf8_valid); /* prototype to pass -Wmissing-prototypes */
XS(XS_utf8_valid)
{
dXSARGS;
if (items != 1)
croak_xs_usage(cv, "sv");
else {
SV * const sv = ST(0);
STRLEN len;
const char * const s = SvPV_const(sv,len);
if (!SvUTF8(sv) || is_utf8_string((const U8*)s,len))
XSRETURN_YES;
else
XSRETURN_NO;
}
XSRETURN_EMPTY;
}
XS(XS_utf8_encode); /* prototype to pass -Wmissing-prototypes */
XS(XS_utf8_encode)
{
dXSARGS;
if (items != 1)
croak_xs_usage(cv, "sv");
sv_utf8_encode(ST(0));
SvSETMAGIC(ST(0));
XSRETURN_EMPTY;
}
XS(XS_utf8_decode); /* prototype to pass -Wmissing-prototypes */
XS(XS_utf8_decode)
{
dXSARGS;
if (items != 1)
croak_xs_usage(cv, "sv");
else {
SV * const sv = ST(0);
bool RETVAL;
SvPV_force_nolen(sv);
RETVAL = sv_utf8_decode(sv);
SvSETMAGIC(sv);
ST(0) = boolSV(RETVAL);
}
XSRETURN(1);
}
XS(XS_utf8_upgrade); /* prototype to pass -Wmissing-prototypes */
XS(XS_utf8_upgrade)
{
dXSARGS;
if (items != 1)
croak_xs_usage(cv, "sv");
else {
SV * const sv = ST(0);
STRLEN RETVAL = 0;
dXSTARG;
XSprePUSH;
if (UNLIKELY(! sv)) {
XSRETURN_UNDEF;
}
SvGETMAGIC(sv);
if (UNLIKELY(! SvOK(sv))) {
XSRETURN_UNDEF;
}
RETVAL = sv_utf8_upgrade_nomg(sv);
PUSHi( (IV) RETVAL);
}
XSRETURN(1);
}
XS(XS_utf8_downgrade); /* prototype to pass -Wmissing-prototypes */
XS(XS_utf8_downgrade)
{
dXSARGS;
if (items < 1 || items > 2)
croak_xs_usage(cv, "sv, failok=0");
else {
SV * const sv0 = ST(0);
SV * const sv1 = ST(1);
const bool failok = (items < 2) ? 0 : SvTRUE_NN(sv1) ? 1 : 0;
const bool RETVAL = sv_utf8_downgrade(sv0, failok);
ST(0) = boolSV(RETVAL);
}
XSRETURN(1);
}
XS(XS_utf8_native_to_unicode); /* prototype to pass -Wmissing-prototypes */
XS(XS_utf8_native_to_unicode)
{
dXSARGS;
const UV uv = SvUV(ST(0));
if (items > 1)
croak_xs_usage(cv, "sv");
ST(0) = sv_2mortal(newSVuv(NATIVE_TO_UNI(uv)));
XSRETURN(1);
}
XS(XS_utf8_unicode_to_native); /* prototype to pass -Wmissing-prototypes */
XS(XS_utf8_unicode_to_native)
{
dXSARGS;
const UV uv = SvUV(ST(0));
if (items > 1)
croak_xs_usage(cv, "sv");
ST(0) = sv_2mortal(newSVuv(UNI_TO_NATIVE(uv)));
XSRETURN(1);
}
XS(XS_Internals_SvREADONLY); /* prototype to pass -Wmissing-prototypes */
XS(XS_Internals_SvREADONLY) /* This is dangerous stuff. */
{
dXSARGS;
SV * const svz = ST(0);
SV * sv;
/* [perl #77776] - called as &foo() not foo() */
if (!SvROK(svz))
croak_xs_usage(cv, "SCALAR[, ON]");
sv = SvRV(svz);
if (items == 1) {
if (SvREADONLY(sv))
XSRETURN_YES;
else
XSRETURN_NO;
}
else if (items == 2) {
SV *sv1 = ST(1);
if (SvTRUE_NN(sv1)) {
SvFLAGS(sv) |= SVf_READONLY;
XSRETURN_YES;
}
else {
/* I hope you really know what you are doing. */
SvFLAGS(sv) &=~ SVf_READONLY;
XSRETURN_NO;
}
}
XSRETURN_UNDEF; /* Can't happen. */
}
XS(XS_constant__make_const); /* prototype to pass -Wmissing-prototypes */
XS(XS_constant__make_const) /* This is dangerous stuff. */
{
dXSARGS;
SV * const svz = ST(0);
SV * sv;
/* [perl #77776] - called as &foo() not foo() */
if (!SvROK(svz) || items != 1)
croak_xs_usage(cv, "SCALAR");
sv = SvRV(svz);
SvREADONLY_on(sv);
if (SvTYPE(sv) == SVt_PVAV && AvFILLp(sv) != -1) {
/* for constant.pm; nobody else should be calling this
on arrays anyway. */
SV **svp;
for (svp = AvARRAY(sv) + AvFILLp(sv)
; svp >= AvARRAY(sv)
; --svp)
if (*svp) SvPADTMP_on(*svp);
}
XSRETURN(0);
}
XS(XS_Internals_SvREFCNT); /* prototype to pass -Wmissing-prototypes */
XS(XS_Internals_SvREFCNT) /* This is dangerous stuff. */
{
dXSARGS;
SV * const svz = ST(0);
SV * sv;
U32 refcnt;
/* [perl #77776] - called as &foo() not foo() */
if ((items != 1 && items != 2) || !SvROK(svz))
croak_xs_usage(cv, "SCALAR[, REFCOUNT]");
sv = SvRV(svz);
/* I hope you really know what you are doing. */
/* idea is for SvREFCNT(sv) to be accessed only once */
refcnt = items == 2 ?
/* we free one ref on exit */
(SvREFCNT(sv) = SvUV(ST(1)) + 1)
: SvREFCNT(sv);
XSRETURN_UV(refcnt - 1); /* Minus the ref created for us. */
}
XS(XS_Internals_hv_clear_placehold); /* prototype to pass -Wmissing-prototypes */
XS(XS_Internals_hv_clear_placehold)
{
dXSARGS;
if (items != 1 || !SvROK(ST(0)))
croak_xs_usage(cv, "hv");
else {
HV * const hv = HV_FROM_REF(ST(0));
hv_clear_placeholders(hv);
XSRETURN(0);
}
}
XS(XS_Internals_stack_refcounted); /* prototype to pass -Wmissing-prototypes */
XS(XS_Internals_stack_refcounted)
{
dXSARGS;
UV val = 0;
if (items != 0)
croak_xs_usage(cv, "");
#ifdef PERL_RC_STACK
val |= 1;
#endif
XSRETURN_UV(val);
}
XS(XS_PerlIO_get_layers); /* prototype to pass -Wmissing-prototypes */
XS(XS_PerlIO_get_layers)
{
dXSARGS;
if (items < 1 || items % 2 == 0)
croak_xs_usage(cv, "filehandle[,args]");
#if defined(USE_PERLIO)
{
SV * sv;
GV * gv;
IO * io = NULL;
bool input = TRUE;
bool details = FALSE;
if (items > 1) {
SV * const *svp;
for (svp = MARK + 2; svp <= SP; svp += 2) {
SV * const * const varp = svp;
SV * const * const valp = svp + 1;
STRLEN klen;
const char * const key = SvPV_const(*varp, klen);
switch (*key) {
case 'i':
if (memEQs(key, klen, "input")) {
input = SvTRUE(*valp);
break;
}
goto fail;
case 'o':
if (memEQs(key, klen, "output")) {
input = !SvTRUE(*valp);
break;
}
goto fail;
case 'd':
if (memEQs(key, klen, "details")) {
details = SvTRUE(*valp);
break;
}
goto fail;
default:
fail:
croak(
"get_layers: unknown argument '%s'",
key);
}
}
SP -= (items - 1);
}
sv = POPs;
/* MAYBE_DEREF_GV will call get magic */
if ((gv = MAYBE_DEREF_GV(sv)))
io = GvIO(gv);
else if (SvROK(sv) && SvTYPE(SvRV(sv)) == SVt_PVIO)
io = (IO*)SvRV(sv);
else if (!SvROK(sv) && (gv = gv_fetchsv_nomg(sv, 0, SVt_PVIO)))
io = GvIO(gv);
if (io) {
AV* const av = PerlIO_get_layers(aTHX_ input ?
IoIFP(io) : IoOFP(io));
SSize_t i;
const SSize_t last = av_top_index(av);
SSize_t nitem = 0;
for (i = last; i >= 0; i -= 3) {
SV * const * const namsvp = av_fetch(av, i - 2, FALSE);
SV * const * const argsvp = av_fetch(av, i - 1, FALSE);
SV * const * const flgsvp = av_fetch(av, i, FALSE);
const bool namok = namsvp && *namsvp && SvPOK(*namsvp);
const bool argok = argsvp && *argsvp && SvPOK(*argsvp);
const bool flgok = flgsvp && *flgsvp && SvIOK(*flgsvp);
EXTEND(SP, 3); /* Three is the max in all branches: better check just once */
if (details) {
/* Indents of 5? Yuck. */
/* We know that PerlIO_get_layers creates a new SV for
the name and flags, so we can just take a reference
and "steal" it when we free the AV below. */
PUSHs(namok
? sv_2mortal(SvREFCNT_inc_simple_NN(*namsvp))
: &PL_sv_undef);
PUSHs(argok
? newSVpvn_flags(SvPVX_const(*argsvp),
SvCUR(*argsvp),
(SvUTF8(*argsvp) ? SVf_UTF8 : 0)
| SVs_TEMP)
: &PL_sv_undef);
PUSHs(flgok
? sv_2mortal(SvREFCNT_inc_simple_NN(*flgsvp))
: &PL_sv_undef);
nitem += 3;
}
else {
if (namok && argok)
PUSHs(sv_2mortal(Perl_newSVpvf(aTHX_ "%" SVf "(%" SVf ")",
SVfARG(*namsvp),
SVfARG(*argsvp))));
else if (namok)
PUSHs(sv_2mortal(SvREFCNT_inc_simple_NN(*namsvp)));
else
PUSHs(&PL_sv_undef);
nitem++;
if (flgok) {
const IV flags = SvIVX(*flgsvp);
if (flags & PERLIO_F_UTF8) {
PUSHs(newSVpvs_flags("utf8", SVs_TEMP));
nitem++;
}
}
}
}
SvREFCNT_dec(av);
XSRETURN(nitem);
}
}
#endif
XSRETURN(0);
}
XS(XS_re_is_regexp); /* prototype to pass -Wmissing-prototypes */
XS(XS_re_is_regexp)
{
dXSARGS;
if (items != 1)
croak_xs_usage(cv, "sv");
if (SvRXOK(ST(0))) {
XSRETURN_YES;
} else {
XSRETURN_NO;
}
}
XS(XS_re_regnames_count); /* prototype to pass -Wmissing-prototypes */
XS(XS_re_regnames_count)
{
REGEXP *rx = PL_curpm ? PM_GETRE(PL_curpm) : NULL;
SV * ret;
dXSARGS;
if (items != 0)
croak_xs_usage(cv, "");
if (!rx)
XSRETURN_UNDEF;
ret = CALLREG_NAMED_BUFF_COUNT(rx);
SPAGAIN;
PUSHs(ret ? sv_2mortal(ret) : &PL_sv_undef);
XSRETURN(1);
}
XS(XS_re_regname); /* prototype to pass -Wmissing-prototypes */
XS(XS_re_regname)
{
dXSARGS;
REGEXP * rx;
U32 flags;
SV * ret;
if (items < 1 || items > 2)
croak_xs_usage(cv, "name[, all ]");
SP -= items;
PUTBACK;
rx = PL_curpm ? PM_GETRE(PL_curpm) : NULL;
if (!rx)
XSRETURN_UNDEF;
if (items == 2 && SvTRUE_NN(ST(1))) {
flags = RXapif_ALL;
} else {
flags = RXapif_ONE;
}
ret = CALLREG_NAMED_BUFF_FETCH(rx, ST(0), (flags | RXapif_REGNAME));
SPAGAIN;
PUSHs(ret ? sv_2mortal(ret) : &PL_sv_undef);
XSRETURN(1);
}
XS(XS_re_regnames); /* prototype to pass -Wmissing-prototypes */
XS(XS_re_regnames)
{
dXSARGS;
REGEXP * rx;
U32 flags;
SV *ret;
AV *av;
SSize_t length;
SSize_t i;
SV **entry;
if (items > 1)
croak_xs_usage(cv, "[all]");
rx = PL_curpm ? PM_GETRE(PL_curpm) : NULL;
if (!rx)
XSRETURN_UNDEF;
if (items == 1 && SvTRUE_NN(ST(0))) {
flags = RXapif_ALL;
} else {
flags = RXapif_ONE;
}
SP -= items;
PUTBACK;
ret = CALLREG_NAMED_BUFF_ALL(rx, (flags | RXapif_REGNAMES));
SPAGAIN;
if (!ret)
XSRETURN_UNDEF;
av = AV_FROM_REF(ret);
length = av_count(av);
EXTEND(SP, length); /* better extend stack just once */
for (i = 0; i < length; i++) {
entry = av_fetch(av, i, FALSE);
if (!entry)
/* diag_listed_as: SKIPME */
croak("NULL array element in re::regnames()");
mPUSHs(SvREFCNT_inc_simple_NN(*entry));
}
SvREFCNT_dec(ret);
PUTBACK;
return;
}
XS(XS_re_regexp_pattern); /* prototype to pass -Wmissing-prototypes */
XS(XS_re_regexp_pattern)
{
dXSARGS;
REGEXP *re;
U8 const gimme = GIMME_V;
EXTEND(SP, 2);
SP -= items;
if (items != 1)
croak_xs_usage(cv, "sv");
/*
Checks if a reference is a regex or not. If the parameter is
not a ref, or is not the result of a qr// then returns false
in scalar context and an empty list in list context.
Otherwise in list context it returns the pattern and the
modifiers, in scalar context it returns the pattern just as it
would if the qr// was stringified normally, regardless as
to the class of the variable and any stringification overloads
on the object.
*/
if ((re = SvRX(ST(0)))) /* assign deliberate */
{
/* Houston, we have a regex! */
SV *pattern;
if ( gimme == G_LIST ) {
STRLEN left = 0;
char reflags[sizeof(INT_PAT_MODS) + MAX_CHARSET_NAME_LENGTH];
const char *fptr;
char ch;
U16 match_flags;
/*
we are in list context so stringify
the modifiers that apply. We ignore "negative
modifiers" in this scenario, and the default character set
*/
if (get_regex_charset(RX_EXTFLAGS(re)) != REGEX_DEPENDS_CHARSET) {
STRLEN len;
const char* const name = get_regex_charset_name(RX_EXTFLAGS(re),
&len);
Copy(name, reflags + left, len, char);
left += len;
}
fptr = INT_PAT_MODS;
match_flags = (U16)((RX_EXTFLAGS(re) & RXf_PMf_COMPILETIME)
>> RXf_PMf_STD_PMMOD_SHIFT);
while((ch = *fptr++)) {
if(match_flags & 1) {
reflags[left++] = ch;
}
match_flags >>= 1;
}
pattern = newSVpvn_flags(RX_PRECOMP(re),RX_PRELEN(re),
(RX_UTF8(re) ? SVf_UTF8 : 0) | SVs_TEMP);
/* return the pattern and the modifiers */
PUSHs(pattern);
PUSHs(newSVpvn_flags(reflags, left, SVs_TEMP));
XSRETURN(2);
} else {
/* Scalar, so use the string that Perl would return */
/* return the pattern in (?msixn:..) format */
pattern = sv_mortalcopy_flags(MUTABLE_SV(re), SV_GMAGIC|SV_NOSTEAL);
PUSHs(pattern);
XSRETURN(1);
}
} else {
/* It ain't a regexp folks */
if ( gimme == G_LIST ) {
/* return the empty list */
XSRETURN_EMPTY;
} else {
/* Because of the (?:..) wrapping involved in a
stringified pattern it is impossible to get a
result for a real regexp that would evaluate to
false. Therefore we can return PL_sv_no to signify
that the object is not a regex, this means that one
can say
if (regex($might_be_a_regex) eq '(?:foo)') { }
and not worry about undefined values.
*/
XSRETURN_NO;
}
}
NOT_REACHED; /* NOTREACHED */
}
#if defined(HAS_GETCWD) && defined(PERL_IS_MINIPERL)
XS(XS_Internals_getcwd)
{
dXSARGS;
SV *sv = sv_newmortal();
if (items != 0)
croak_xs_usage(cv, "");
(void)getcwd_sv(sv);
SvTAINTED_on(sv);
PUSHs(sv);
XSRETURN(1);
}
#endif
XS(XS_NamedCapture_tie_it)
{
dXSARGS;
if (items != 1)
croak_xs_usage(cv, "sv");
{
SV *sv = ST(0);
GV * const gv = (GV *)sv;
HV * const hv = GvHVn(gv);
SV *rv = newSV_type(SVt_IV);
const char *gv_name = GvNAME(gv);
sv_setrv_noinc(rv, newSVuv(
strEQ(gv_name, "-") || strEQ(gv_name, "\003APTURE_ALL")
? RXapif_ALL : RXapif_ONE));
sv_bless(rv, GvSTASH(CvGV(cv)));
sv_unmagic((SV *)hv, PERL_MAGIC_tied);
sv_magic((SV *)hv, rv, PERL_MAGIC_tied, NULL, 0);
SvREFCNT_dec(rv); /* As sv_magic increased it by one. */
}
XSRETURN_EMPTY;
}
XS(XS_NamedCapture_TIEHASH)
{
dXSARGS;
if (items < 1)
croak_xs_usage(cv, "package, ...");
{
const char * package = (const char *)SvPV_nolen(ST(0));
UV flag = RXapif_ONE;
mark += 2;
while(mark < sp) {
STRLEN len;
const char *p = SvPV_const(*mark, len);
if(memEQs(p, len, "all"))
flag = SvTRUE(mark[1]) ? RXapif_ALL : RXapif_ONE;
mark += 2;
}
ST(0) = newSV_type_mortal(SVt_IV);
sv_setuv(newSVrv(ST(0), package), flag);
}
XSRETURN(1);
}
/* These are tightly coupled to the RXapif_* flags defined in regexp.h */
#define UNDEF_FATAL 0x80000
#define DISCARD 0x40000
#define EXPECT_SHIFT 24
#define ACTION_MASK 0x000FF
#define FETCH_ALIAS (RXapif_FETCH | (2 << EXPECT_SHIFT))
#define STORE_ALIAS (RXapif_STORE | (3 << EXPECT_SHIFT) | UNDEF_FATAL | DISCARD)
#define DELETE_ALIAS (RXapif_DELETE | (2 << EXPECT_SHIFT) | UNDEF_FATAL)
#define CLEAR_ALIAS (RXapif_CLEAR | (1 << EXPECT_SHIFT) | UNDEF_FATAL | DISCARD)
#define EXISTS_ALIAS (RXapif_EXISTS | (2 << EXPECT_SHIFT))
#define SCALAR_ALIAS (RXapif_SCALAR | (1 << EXPECT_SHIFT))
XS(XS_NamedCapture_FETCH)
{
dXSARGS;
dXSI32;
PERL_UNUSED_VAR(cv); /* -W */
PERL_UNUSED_VAR(ax); /* -Wall */
SP -= items;
{
REGEXP *const rx = PL_curpm ? PM_GETRE(PL_curpm) : NULL;
U32 flags;
SV *ret;
const U32 action = ix & ACTION_MASK;
const int expect = ix >> EXPECT_SHIFT;
if (items != expect)
croak_xs_usage(cv, expect == 2 ? "$key"
: (expect == 3 ? "$key, $value"
: ""));
if (!rx || !SvROK(ST(0))) {
if (ix & UNDEF_FATAL)
croak_no_modify();
else
XSRETURN_UNDEF;
}
flags = (U32)SvUV(SvRV(MUTABLE_SV(ST(0))));
PUTBACK;
ret = RX_ENGINE(rx)->named_buff(aTHX_ (rx), expect >= 2 ? ST(1) : NULL,
expect >= 3 ? ST(2) : NULL, flags | action);
SPAGAIN;
if (ix & DISCARD) {
/* Called with G_DISCARD, so our return stack state is thrown away.
Hence if we were returned anything, free it immediately. */
SvREFCNT_dec(ret);
} else {
PUSHs(ret ? sv_2mortal(ret) : &PL_sv_undef);
}
PUTBACK;
return;
}
}
XS(XS_NamedCapture_FIRSTKEY)
{
dXSARGS;
dXSI32;
PERL_UNUSED_VAR(cv); /* -W */
PERL_UNUSED_VAR(ax); /* -Wall */
SP -= items;
{
REGEXP *const rx = PL_curpm ? PM_GETRE(PL_curpm) : NULL;
U32 flags;
SV *ret;
const int expect = ix ? 2 : 1;
const U32 action = ix ? RXapif_NEXTKEY : RXapif_FIRSTKEY;
if (items != expect)
croak_xs_usage(cv, expect == 2 ? "$lastkey" : "");
if (!rx || !SvROK(ST(0)))
XSRETURN_UNDEF;
flags = (U32)SvUV(SvRV(MUTABLE_SV(ST(0))));
PUTBACK;
ret = RX_ENGINE(rx)->named_buff_iter(aTHX_ (rx),
expect >= 2 ? ST(1) : NULL,
flags | action);
SPAGAIN;
PUSHs(ret ? sv_2mortal(ret) : &PL_sv_undef);
PUTBACK;
return;
}
}
/* is this still needed? */
XS(XS_NamedCapture_flags)
{
dXSARGS;
PERL_UNUSED_VAR(cv); /* -W */
PERL_UNUSED_VAR(ax); /* -Wall */
SP -= items;
{
EXTEND(SP, 2);
mPUSHu(RXapif_ONE);
mPUSHu(RXapif_ALL);
PUTBACK;
return;
}
}
#include "vutil.h"
#include "vxs.inc"
struct xsub_details {
const char *name;
XSUBADDR_t xsub;
const char *proto;
int ix;
};
static const struct xsub_details these_details[] = {
{"UNIVERSAL::isa", XS_UNIVERSAL_isa, NULL, 0 },
{"UNIVERSAL::can", XS_UNIVERSAL_can, NULL, 0 },
{"UNIVERSAL::DOES", XS_UNIVERSAL_DOES, NULL, 0 },
{"UNIVERSAL::import", XS_UNIVERSAL_import_unimport, NULL, 0},
{"UNIVERSAL::unimport", XS_UNIVERSAL_import_unimport, NULL, 1},
#define VXS_XSUB_DETAILS
#include "vxs.inc"
#undef VXS_XSUB_DETAILS
{"utf8::is_utf8", XS_utf8_is_utf8, NULL, 0 },
{"utf8::valid", XS_utf8_valid, NULL, 0 },
{"utf8::encode", XS_utf8_encode, NULL, 0 },
{"utf8::decode", XS_utf8_decode, NULL, 0 },
{"utf8::upgrade", XS_utf8_upgrade, NULL, 0 },
{"utf8::downgrade", XS_utf8_downgrade, NULL, 0 },
{"utf8::native_to_unicode", XS_utf8_native_to_unicode, NULL, 0 },
{"utf8::unicode_to_native", XS_utf8_unicode_to_native, NULL, 0 },
{"Internals::SvREADONLY", XS_Internals_SvREADONLY, "\\[$%@];$", 0 },
{"Internals::SvREFCNT", XS_Internals_SvREFCNT, "\\[$%@];$", 0 },
{"Internals::hv_clear_placeholders", XS_Internals_hv_clear_placehold, "\\%", 0 },
{"Internals::stack_refcounted", XS_Internals_stack_refcounted, NULL, 0 },
{"constant::_make_const", XS_constant__make_const, "\\[$@]", 0 },
{"PerlIO::get_layers", XS_PerlIO_get_layers, "*;@", 0 },
{"re::is_regexp", XS_re_is_regexp, "$", 0 },
{"re::regname", XS_re_regname, ";$$", 0 },
{"re::regnames", XS_re_regnames, ";$", 0 },
{"re::regnames_count", XS_re_regnames_count, "", 0 },
{"re::regexp_pattern", XS_re_regexp_pattern, "$", 0 },
#if defined(HAS_GETCWD) && defined(PERL_IS_MINIPERL)
{"Internals::getcwd", XS_Internals_getcwd, "", 0 },
#endif
{"Tie::Hash::NamedCapture::_tie_it", XS_NamedCapture_tie_it, NULL, 0 },
{"Tie::Hash::NamedCapture::TIEHASH", XS_NamedCapture_TIEHASH, NULL, 0 },
{"Tie::Hash::NamedCapture::FETCH", XS_NamedCapture_FETCH, NULL, FETCH_ALIAS },
{"Tie::Hash::NamedCapture::STORE", XS_NamedCapture_FETCH, NULL, STORE_ALIAS },
{"Tie::Hash::NamedCapture::DELETE", XS_NamedCapture_FETCH, NULL, DELETE_ALIAS },
{"Tie::Hash::NamedCapture::CLEAR", XS_NamedCapture_FETCH, NULL, CLEAR_ALIAS },
{"Tie::Hash::NamedCapture::EXISTS", XS_NamedCapture_FETCH, NULL, EXISTS_ALIAS },
{"Tie::Hash::NamedCapture::SCALAR", XS_NamedCapture_FETCH, NULL, SCALAR_ALIAS },
{"Tie::Hash::NamedCapture::FIRSTKEY", XS_NamedCapture_FIRSTKEY, NULL, 0 },
{"Tie::Hash::NamedCapture::NEXTKEY", XS_NamedCapture_FIRSTKEY, NULL, 1 },
{"Tie::Hash::NamedCapture::flags", XS_NamedCapture_flags, NULL, 0 },
};
STATIC OP*
optimize_out_native_convert_function(pTHX_ OP* entersubop,
GV* namegv,
SV* protosv)
{
/* Optimizes out an identity function, i.e., one that just returns its
* argument. The passed in function is assumed to be an identity function,
* with no checking. This is designed to be called for utf8_to_native()
* and native_to_utf8() on ASCII platforms, as they just return their
* arguments, but it could work on any such function.
*
* The code is mostly just cargo-culted from Memoize::Lift */
OP *pushop, *argop;
OP *parent;
SV* prototype = newSVpvs("$");
PERL_UNUSED_ARG(protosv);
assert(entersubop->op_type == OP_ENTERSUB);
entersubop = ck_entersub_args_proto(entersubop, namegv, prototype);
parent = entersubop;
SvREFCNT_dec(prototype);
pushop = cUNOPx(entersubop)->op_first;
if (! OpHAS_SIBLING(pushop)) {
parent = pushop;
pushop = cUNOPx(pushop)->op_first;
}
argop = OpSIBLING(pushop);
/* Carry on without doing the optimization if it is not something we're
* expecting, so continues to work */
if ( ! argop
|| ! OpHAS_SIBLING(argop)
|| OpHAS_SIBLING(OpSIBLING(argop))
) {
return entersubop;
}
/* cut argop from the subtree */
(void)op_sibling_splice(parent, pushop, 1, NULL);
op_free(entersubop);
return argop;
}
void
Perl_boot_core_UNIVERSAL(pTHX)
{
static const char file[] = __FILE__;
const struct xsub_details *xsub = these_details;
const struct xsub_details *end = C_ARRAY_END(these_details);
do {
CV *cv = newXS_flags(xsub->name, xsub->xsub, file, xsub->proto, 0);
XSANY.any_i32 = xsub->ix;
} while (++xsub < end);
#ifndef EBCDIC
{ /* On ASCII platforms these functions just return their argument, so can
be optimized away */
CV* to_native_cv = get_cv("utf8::unicode_to_native", 0);
CV* to_unicode_cv = get_cv("utf8::native_to_unicode", 0);
cv_set_call_checker_flags(to_native_cv,
optimize_out_native_convert_function,
(SV*) to_native_cv, 0);
cv_set_call_checker_flags(to_unicode_cv,
optimize_out_native_convert_function,
(SV*) to_unicode_cv, 0);
}
#endif
/* Providing a Regexp::DESTROY fixes #21347. See test in t/op/ref.t */
{
CV * const cv =
newCONSTSUB(get_hv("Regexp::", GV_ADD), "DESTROY", NULL);
char ** cvfile = &CvFILE(cv);
char * oldfile = *cvfile;
CvDYNFILE_off(cv);
*cvfile = (char *)file;
Safefree(oldfile);
}
}
/*
* ex: set ts=8 sts=4 sw=4 et:
*/