Clarifying that the PerlIO technical note applies only to older Perl.

[perl5.git] / pod / perlfunc.pod
diff --git a/pod/perlfunc.pod b/pod/perlfunc.pod

index c5e599b..8978a51 100644 (file)
--- a/pod/perlfunc.pod
+++ b/pod/perlfunc.pod
@@ -242,7 +242,7 @@ L<C<chroot>|/chroot FILENAME>,
  L<C<fcntl>|/fcntl FILEHANDLE,FUNCTION,SCALAR>, L<C<glob>|/glob EXPR>,
  L<C<ioctl>|/ioctl FILEHANDLE,FUNCTION,SCALAR>,
  L<C<link>|/link OLDFILE,NEWFILE>, L<C<lstat>|/lstat FILEHANDLE>,
-L<C<mkdir>|/mkdir FILENAME,MODE>, L<C<open>|/open FILEHANDLE,EXPR>,
+L<C<mkdir>|/mkdir FILENAME,MODE>, L<C<open>|/open FILEHANDLE,MODE,EXPR>,
  L<C<opendir>|/opendir DIRHANDLE,EXPR>, L<C<readlink>|/readlink EXPR>,
  L<C<rename>|/rename OLDNAME,NEWNAME>, L<C<rmdir>|/rmdir FILENAME>,
  L<C<select>|/select FILEHANDLE>, L<C<stat>|/stat FILEHANDLE>,
@@ -256,7 +256,7 @@ X<control flow>
  
  =for Pod::Functions =Flow
  
-L<C<caller>|/caller EXPR>,
+L<C<break>|/break>, L<C<caller>|/caller EXPR>,
  L<C<continue>|/continue BLOCK>, L<C<die>|/die LIST>, L<C<do>|/do BLOCK>,
  L<C<dump>|/dump LABEL>, L<C<eval>|/eval EXPR>,
  L<C<evalbytes>|/evalbytes EXPR>, L<C<exit>|/exit EXPR>,
@@ -267,9 +267,16 @@ L<C<redo>|/redo LABEL>, L<C<return>|/return EXPR>,
  L<C<sub>|/sub NAME BLOCK>, L<C<__SUB__>|/__SUB__>,
  L<C<wantarray>|/wantarray>
  
-In Perl v5.14 and earlier, L<C<continue>|/continue BLOCK>
-required the L<C<"switch"> feature|feature/The 'switch' feature> to
-be enabled.
+L<C<break>|/break> is available only if you enable the experimental
+L<C<"switch"> feature|feature/The 'switch' feature> or use the C<CORE::>
+prefix.  The L<C<"switch"> feature|feature/The 'switch' feature> also
+enables the C<default>, C<given> and C<when> statements, which are
+documented in L<perlsyn/"Switch Statements">.
+The L<C<"switch"> feature|feature/The 'switch' feature> is enabled
+automatically with a C<use v5.10> (or higher) declaration in the current
+scope.  In Perl v5.14 and earlier, L<C<continue>|/continue BLOCK>
+required the L<C<"switch"> feature|feature/The 'switch' feature>, like
+the other keywords.
  
  L<C<evalbytes>|/evalbytes EXPR> is only available with the
  L<C<"evalbytes"> feature|feature/The 'unicode_eval' and 'evalbytes' features>
@@ -420,10 +427,10 @@ L<C<time>|/time>, L<C<times>|/times>
  =for Pod::Functions =!Non-functions
  
  C<and>, C<AUTOLOAD>, C<BEGIN>, C<CHECK>, C<cmp>, C<CORE>, C<__DATA__>,
-C<DESTROY>, C<else>, C<elseif>, C<elsif>, C<END>, C<__END__>,
+C<default>, C<DESTROY>, C<else>, C<elseif>, C<elsif>, C<END>, C<__END__>,
  C<eq>, C<for>, C<foreach>, C<ge>, C<given>, C<gt>, C<if>, C<INIT>, C<le>,
-C<lt>, C<ne>, C<not>, C<or>, C<UNITCHECK>, C<unless>, C<until>,
-C<whereis>, C<whereso>, C<while>, C<x>, C<xor>
+C<lt>, C<ne>, C<not>, C<or>, C<UNITCHECK>, C<unless>, C<until>, C<when>,
+C<while>, C<x>, C<xor>
  
  =back
  
@@ -464,7 +471,7 @@ L<C<kill>|/kill SIGNAL, LIST>, L<C<link>|/link OLDFILE,NEWFILE>,
  L<C<lstat>|/lstat FILEHANDLE>, L<C<msgctl>|/msgctl ID,CMD,ARG>,
  L<C<msgget>|/msgget KEY,FLAGS>,
  L<C<msgrcv>|/msgrcv ID,VAR,SIZE,TYPE,FLAGS>,
-L<C<msgsnd>|/msgsnd ID,MSG,FLAGS>, L<C<open>|/open FILEHANDLE,EXPR>,
+L<C<msgsnd>|/msgsnd ID,MSG,FLAGS>, L<C<open>|/open FILEHANDLE,MODE,EXPR>,
  L<C<pipe>|/pipe READHANDLE,WRITEHANDLE>, L<C<readlink>|/readlink EXPR>,
  L<C<rename>|/rename OLDNAME,NEWNAME>,
  L<C<select>|/select RBITS,WBITS,EBITS,TIMEOUT>,
@@ -515,6 +522,10 @@ argument is omitted, tests L<C<$_>|perlvar/$_>, except for C<-t>, which
  tests STDIN.  Unless otherwise documented, it returns C<1> for true and
  C<''> for false.  If the file doesn't exist or can't be examined, it
  returns L<C<undef>|/undef EXPR> and sets L<C<$!>|perlvar/$!> (errno).
+With the exception of the C<-l> test they all follow symbolic links
+because they use C<stat()> and not C<lstat()> (so dangling symlinks can't
+be examined and will therefore report failure).
+
  Despite the funny names, precedence is the same as any other named unary
  operator.  The operator may be any of:
  
@@ -807,8 +818,8 @@ translation and marking it as bytes (as opposed to Unicode characters).
  Note that, despite what may be implied in I<"Programming Perl"> (the
  Camel, 3rd edition) or elsewhere, C<:raw> is I<not> simply the inverse of C<:crlf>.
  Other layers that would affect the binary nature of the stream are
-I<also> disabled.  See L<PerlIO>, L<perlrun>, and the discussion about the
-PERLIO environment variable.
+I<also> disabled.  See L<PerlIO>, and the discussion about the PERLIO
+environment variable in L<perlrun|perlrun/PERLIO>.
  
  The C<:bytes>, C<:crlf>, C<:utf8>, and any other directives of the
  form C<:...>, are called I/O I<layers>.  The L<open> pragma can be used to
@@ -828,7 +839,7 @@ while C<:encoding(UTF-8)> checks the data for actually being valid
  UTF-8.  More details can be found in L<PerlIO::encoding>.
  
  In general, L<C<binmode>|/binmode FILEHANDLE, LAYER> should be called
-after L<C<open>|/open FILEHANDLE,EXPR> but before any I/O is done on the
+after L<C<open>|/open FILEHANDLE,MODE,EXPR> but before any I/O is done on the
  filehandle.  Calling L<C<binmode>|/binmode FILEHANDLE, LAYER> normally
  flushes any pending buffered output data (and perhaps pending input
  data) on the handle.  An exception to this is the C<:encoding> layer
@@ -905,6 +916,19 @@ uses the result of L<C<ref>|/ref EXPR> as a truth value.
  
  See L<perlmod/"Perl Modules">.
  
+=item break
+
+=for Pod::Functions +switch break out of a C<given> block
+
+Break out of a C<given> block.
+
+L<C<break>|/break> is available only if the
+L<C<"switch"> feature|feature/The 'switch' feature> is enabled or if it
+is prefixed with C<CORE::>. The
+L<C<"switch"> feature|feature/The 'switch' feature> is enabled
+automatically with a C<use v5.10> (or higher) declaration in the current
+scope.
+
  =item caller EXPR
  X<caller> X<call stack> X<stack> X<stack trace>
  
@@ -923,6 +947,10 @@ list context, caller returns
         # 0         1          2
      my ($package, $filename, $line) = caller;
  
+Like L<C<__FILE__>|/__FILE__> and L<C<__LINE__>|/__LINE__>, the filename and
+line number returned here may be altered by the mechanism described at
+L<perlsyn/"Plain Old Comments (Not!)">.
+
  With EXPR, it returns some extra information that the debugger uses to
  print a stack trace.  The value of EXPR indicates how many call frames
  to go back before the current one.
@@ -1204,9 +1232,10 @@ change your current working directory, which is unaffected.)  For security
  reasons, this call is restricted to the superuser.  If FILENAME is
  omitted, does a L<C<chroot>|/chroot FILENAME> to L<C<$_>|perlvar/$_>.
  
-B<NOTE:>  It is good security practice to do C<chdir("/")>
+B<NOTE:>  It is mandatory for security to C<chdir("/")>
  (L<C<chdir>|/chdir EXPR> to the root directory) immediately after a
-L<C<chroot>|/chroot FILENAME>.
+L<C<chroot>|/chroot FILENAME>, otherwise the current working directory
+may be outside of the new root.
  
  Portability issues: L<perlport/chroot>.
  
@@ -1224,12 +1253,12 @@ layer.  Closes the currently selected filehandle if the argument is
  omitted.
  
  You don't have to close FILEHANDLE if you are immediately going to do
-another L<C<open>|/open FILEHANDLE,EXPR> on it, because
-L<C<open>|/open FILEHANDLE,EXPR> closes it for you.  (See
-L<C<open>|/open FILEHANDLE,EXPR>.) However, an explicit
+another L<C<open>|/open FILEHANDLE,MODE,EXPR> on it, because
+L<C<open>|/open FILEHANDLE,MODE,EXPR> closes it for you.  (See
+L<C<open>|/open FILEHANDLE,MODE,EXPR>.) However, an explicit
  L<C<close>|/close FILEHANDLE> on an input file resets the line counter
  (L<C<$.>|perlvar/$.>), while the implicit close done by
-L<C<open>|/open FILEHANDLE,EXPR> does not.
+L<C<open>|/open FILEHANDLE,MODE,EXPR> does not.
  
  If the filehandle came from a piped open, L<C<close>|/close FILEHANDLE>
  returns false if one of the other syscalls involved fails or if its
@@ -1322,10 +1351,9 @@ using an empty one, logically enough, so L<C<next>|/next LABEL> goes
  directly back to check the condition at the top of the loop.
  
  When there is no BLOCK, L<C<continue>|/continue BLOCK> is a function
-that exits the current C<whereis> or C<whereso> block,
-avoiding the implicit C<next>
-that happens when execution reaches the end of such a block.
-In Perl 5.14 and earlier, this form of
+that falls through the current C<when> or C<default> block instead of
+iterating a dynamically enclosing C<foreach> or exiting a lexically
+enclosing C<given>.  In Perl 5.14 and earlier, this form of
  L<C<continue>|/continue BLOCK> was only available when the
  L<C<"switch"> feature|feature/The 'switch' feature> was enabled.  See
  L<feature> and L<perlsyn/"Switch Statements"> for more information.
@@ -1453,7 +1481,7 @@ L<C<tie>|/tie VARIABLE,CLASSNAME,LIST> function.]
  
  This binds a L<dbm(3)>, L<ndbm(3)>, L<sdbm(3)>, L<gdbm(3)>, or Berkeley
  DB file to a hash.  HASH is the name of the hash.  (Unlike normal
-L<C<open>|/open FILEHANDLE,EXPR>, the first argument is I<not> a
+L<C<open>|/open FILEHANDLE,MODE,EXPR>, the first argument is I<not> a
  filehandle, even though it looks like one).  DBNAME is the name of the
  database (without the F<.dir> or F<.pag> extension if any).  If the
  database does not exist, it is created with protection specified by MASK
@@ -1576,10 +1604,13 @@ so that L<C<exists>|/exists EXPR> on that element no longer returns
  true.  Setting a hash element to the undefined value does not remove its
  key, but deleting it does; see L<C<exists>|/exists EXPR>.
  
-In list context, returns the value or values deleted, or the last such
-element in scalar context.  The return list's length always matches that of
+In list context, usually returns the value or values deleted, or the last such
+element in scalar context.  The return list's length corresponds to that of
  the argument list: deleting non-existent elements returns the undefined value
-in their corresponding positions.
+in their corresponding positions. When a
+L<keyE<sol>value hash slice|perldata/KeyE<sol>Value Hash Slices> is passed to
+C<delete>, the return value is a list of key/value pairs (two elements for each
+item deleted from the hash).
  
  L<C<delete>|/delete EXPR> may also be used on arrays and array slices,
  but its behavior is less straightforward.  Although
@@ -1882,7 +1913,7 @@ X<dump> X<core> X<undump>
  =for Pod::Functions create an immediate core dump
  
  This function causes an immediate core dump.  See also the B<-u>
-command-line switch in L<perlrun>, which does the same thing.
+command-line switch in L<perlrun|perlrun/-u>, which does the same thing.
  Primarily this is so that you can use the B<undump> program (not
  supplied) to turn your core dump into an executable binary after
  having initialized all your variables at the beginning of the
@@ -1899,9 +1930,8 @@ be open any more when the program is reincarnated, with possible
  resulting confusion by Perl.
  
  This function is now largely obsolete, mostly because it's very hard to
-convert a core file into an executable.  That's why you should now invoke
-it as C<CORE::dump()> if you don't want to be warned against a possible
-typo.
+convert a core file into an executable.  As of Perl 5.30, it must be invoked
+as C<CORE::dump()>.
  
  Unlike most named operators, this has the same precedence as assignment.
  It is also exempt from the looks-like-a-function rule, so
@@ -1947,7 +1977,8 @@ its own internal iterator, accessed by L<C<each>|/each HASH>,
  L<C<keys>|/keys HASH>, and L<C<values>|/values HASH>.  The iterator is
  implicitly reset when L<C<each>|/each HASH> has reached the end as just
  described; it can be explicitly reset by calling L<C<keys>|/keys HASH>
-or L<C<values>|/values HASH> on the hash or array.  If you add or delete
+or L<C<values>|/values HASH> on the hash or array, or by referencing
+the hash (but not array) in list context.  If you add or delete
  a hash's elements while iterating over it, the effect on the iterator is
  unspecified; for example, entries may be skipped or duplicated--so don't
  do that.  Exception: It is always safe to delete the item most recently
@@ -1961,6 +1992,21 @@ returned by L<C<each>|/each HASH>, so the following code works properly:
  Tied hashes may have a different ordering behaviour to perl's hash
  implementation.
  
+The iterator used by C<each> is attached to the hash or array, and is
+shared between all iteration operations applied to the same hash or array.
+Thus all uses of C<each> on a single hash or array advance the same
+iterator location.  All uses of C<each> are also subject to having the
+iterator reset by any use of C<keys> or C<values> on the same hash or
+array, or by the hash (but not array) being referenced in list context.
+This makes C<each>-based loops quite fragile: it is easy to arrive at
+such a loop with the iterator already part way through the object, or to
+accidentally clobber the iterator state during execution of the loop body.
+It's easy enough to explicitly reset the iterator before starting a loop,
+but there is no way to insulate the iterator state used by a loop from
+the iterator state used by anything else that might execute during the
+loop body.  To avoid these problems, use a C<foreach> loop rather than
+C<while>-C<each>.
+
  This prints out your environment like the L<printenv(1)> program,
  but in a different order:
  
@@ -1974,6 +2020,10 @@ been deemed unsuccessful, and was removed as of Perl 5.24.
  
  As of Perl 5.18 you can use a bare L<C<each>|/each HASH> in a C<while>
  loop, which will set L<C<$_>|perlvar/$_> on every iteration.
+If either an C<each> expression or an explicit assignment of an C<each>
+expression to a scalar is used as a C<while>/C<for> condition, then
+the condition actually tests for definedness of the expression's value,
+not for its regular truth value.
  
      while (each %ENV) {
         print "$_=$ENV{$_}\n";
@@ -2261,7 +2311,7 @@ Examples:
  If you want to trap errors when loading an XS module, some problems with
  the binary interface (such as Perl version skew) may be fatal even with
  C<eval> unless C<$ENV{PERL_DL_NONLAZY}> is set.  See
-L<perlrun>.
+L<perlrun|perlrun/PERL_DL_NONLAZY>.
  
  Using the C<eval {}> form as an exception trap in libraries does have some
  issues.  Due to the current arguably broken state of C<__DIE__> hooks, you
@@ -2575,8 +2625,8 @@ L<Unicode::UCD/B<prop_invmap()>>.
  For further information on casefolding, refer to
  the Unicode Standard, specifically sections 3.13 C<Default Case Operations>,
  4.2 C<Case-Normative>, and 5.18 C<Case Mappings>,
-available at L<http://www.unicode.org/versions/latest/>, as well as the
-Case Charts available at L<http://www.unicode.org/charts/case/>.
+available at L<https://www.unicode.org/versions/latest/>, as well as the
+Case Charts available at L<https://www.unicode.org/charts/case/>.
  
  If EXPR is omitted, uses L<C<$_>|perlvar/$_>.
  
@@ -2655,6 +2705,8 @@ X<__FILE__>
  =for Pod::Functions the name of the current source file
  
  A special token that returns the name of the file in which it occurs.
+It can be altered by the mechanism described at
+L<perlsyn/"Plain Old Comments (Not!)">.
  
  =item fileno FILEHANDLE
  X<fileno>
@@ -2667,7 +2719,7 @@ Returns the file descriptor for a filehandle or directory handle,
  or undefined if the
  filehandle is not open.  If there is no real file descriptor at the OS
  level, as can happen with filehandles connected to memory objects via
-L<C<open>|/open FILEHANDLE,EXPR> with a reference for the third
+L<C<open>|/open FILEHANDLE,MODE,EXPR> with a reference for the third
  argument, -1 is returned.
  
  This is mainly useful for constructing bitmaps for
@@ -3351,6 +3403,13 @@ See L<File::Glob> for details, including
  L<C<bsd_glob>|File::Glob/C<bsd_glob>>, which does not treat whitespace
  as a pattern separator.
  
+If a C<glob> expression is used as the condition of a C<while> or C<for>
+loop, then it will be implicitly assigned to C<$_>.  If either a C<glob>
+expression or an explicit assignment of a C<glob> expression to a scalar
+is used as a C<while>/C<for> condition, then the condition actually
+tests for definedness of the expression's value, not for its regular
+truth value.
+
  Portability issues: L<perlport/glob>.
  
  =item gmtime EXPR
@@ -3411,7 +3470,11 @@ Use of C<goto LABEL> or C<goto EXPR> to jump into a construct is
  deprecated and will issue a warning.  Even then, it may not be used to
  go into any construct that requires initialization, such as a
  subroutine, a C<foreach> loop, or a C<given>
-block.  It also can't be used to go into a
+block.  In general, it may not be used to jump into the parameter
+of a binary or list operator, but it may be used to jump into the
+I<first> parameter of a binary operator.  (The C<=>
+assignment operator's "first" operand is its right-hand
+operand.)  It also can't be used to go into a
  construct that is optimized away.
  
  The C<goto &NAME> form is quite different from the other forms of
@@ -3630,7 +3693,8 @@ may behave differently to Perl's hashes with respect to changes in order on
  insertion and deletion of items.
  
  As a side effect, calling L<C<keys>|/keys HASH> resets the internal
-iterator of the HASH or ARRAY (see L<C<each>|/each HASH>).  In
+iterator of the HASH or ARRAY (see L<C<each>|/each HASH>) before
+yielding the keys.  In
  particular, calling L<C<keys>|/keys HASH> in void context resets the
  iterator with no other overhead.
  
@@ -3778,13 +3842,13 @@ L<C<continue>|/continue BLOCK> block, if any, is not executed:
          #...
      }
  
-L<C<last>|/last LABEL> cannot be used to exit a block that returns a
-value such as C<eval {}>, C<sub {}>, or C<do {}>, and should not be used
-to exit a L<C<grep>|/grep BLOCK LIST> or L<C<map>|/map BLOCK LIST>
+L<C<last>|/last LABEL> cannot return a value from a block that typically
+returns a value, such as C<eval {}>, C<sub {}>, or C<do {}>. It will perform
+its flow control behavior, which precludes any return value. It should not be
+used to exit a L<C<grep>|/grep BLOCK LIST> or L<C<map>|/map BLOCK LIST>
  operation.
  
-Note that a block by itself or a C<given> construct
-is semantically identical to a loop
+Note that a block by itself is semantically identical to a loop
  that executes once.  Thus L<C<last>|/last LABEL> can be used to effect
  an early exit out of such a block.
  
@@ -3897,6 +3961,8 @@ X<__LINE__>
  =for Pod::Functions the current source line number
  
  A special token that compiles to the current line number.
+It can be altered by the mechanism described at
+L<perlsyn/"Plain Old Comments (Not!)">.
  
  =item link OLDFILE,NEWFILE
  X<link>
@@ -4309,13 +4375,13 @@ refers to the innermost enclosing loop.  The C<next EXPR> form, available
  as of Perl 5.18.0, allows a label name to be computed at run time, being
  otherwise identical to C<next LABEL>.
  
-L<C<next>|/next LABEL> cannot be used to exit a block which returns a
-value such as C<eval {}>, C<sub {}>, or C<do {}>, and should not be used
-to exit a L<C<grep>|/grep BLOCK LIST> or L<C<map>|/map BLOCK LIST>
+L<C<next>|/next LABEL> cannot return a value from a block that typically
+returns a value, such as C<eval {}>, C<sub {}>, or C<do {}>. It will perform
+its flow control behavior, which precludes any return value. It should not be
+used to exit a L<C<grep>|/grep BLOCK LIST> or L<C<map>|/map BLOCK LIST>
  operation.
  
-Note that a block by itself or a C<given> construct
-is semantically identical to a loop
+Note that a block by itself is semantically identical to a loop
  that executes once.  Thus L<C<next>|/next LABEL> will exit such a block
  early.
  
@@ -4378,46 +4444,84 @@ Leading white space is ignored without warning, as too are any trailing
  non-digits, such as a decimal point (L<C<oct>|/oct EXPR> only handles
  non-negative integers, not negative integers or floating point).
  
-=item open FILEHANDLE,EXPR
-X<open> X<pipe> X<file, open> X<fopen>
-
  =item open FILEHANDLE,MODE,EXPR
+X<open> X<pipe> X<file, open> X<fopen>
  
  =item open FILEHANDLE,MODE,EXPR,LIST
  
  =item open FILEHANDLE,MODE,REFERENCE
  
+=item open FILEHANDLE,EXPR
+
  =item open FILEHANDLE
  
  =for Pod::Functions open a file, pipe, or descriptor
  
-Opens the file whose filename is given by EXPR, and associates it with
-FILEHANDLE.
+Associates an internal FILEHANDLE with the external file specified by
+EXPR. That filehandle will subsequently allow you to perform
+I/O operations on that file, such as reading from it or writing to it.
+
+Instead of a filename, you may specify an external command
+(plus an optional argument list) or a scalar reference, in order to open
+filehandles on commands or in-memory scalars, respectively.
  
-Simple examples to open a file for reading:
+A thorough reference to C<open> follows. For a gentler introduction to
+the basics of C<open>, see also the L<perlopentut> manual page.
+
+=over
+ 
+=item Common usage: working with files
+
+Most often, C<open> gets invoked with three arguments: the required
+FILEHANDLE (usually an empty scalar variable), followed by MODE (usually
+a literal describing the I/O mode the filehandle will use), and then the
+filename that the new filehandle will refer to.
+
+=over
+
+=item Simple examples
+
+Reading from a file:
  
      open(my $fh, "<", "input.txt")
-       or die "Can't open < input.txt: $!";
+       or die "Can't open < input.txt: $!";
+       
+    # Process every line in input.txt
+    while (my $line = <$fh>) {
+        #
+        # ... do something interesting with $line here ...
+        #
+    }
  
-and for writing:
+or writing to one:
  
      open(my $fh, ">", "output.txt")
-       or die "Can't open > output.txt: $!";
-
-(The following is a comprehensive reference to
-L<C<open>|/open FILEHANDLE,EXPR>: for a gentler introduction you may
-consider L<perlopentut>.)
-
-If FILEHANDLE is an undefined scalar variable (or array or hash element), a
-new filehandle is autovivified, meaning that the variable is assigned a
-reference to a newly allocated anonymous filehandle.  Otherwise if
-FILEHANDLE is an expression, its value is the real filehandle.  (This is
-considered a symbolic reference, so C<use strict "refs"> should I<not> be
-in effect.)
-
-If three (or more) arguments are specified, the open mode (including
-optional encoding) in the second argument are distinct from the filename in
-the third.  If MODE is C<< < >> or nothing, the file is opened for input.
+        or die "Can't open > output.txt: $!";
+       
+    print $fh "This line gets printed directly into output.txt.\n";
+
+For a summary of common filehandle operations such as these, see
+L<perlintro/Files and I/O>.
+
+=item About filehandles
+
+The first argument to C<open>, labeled FILEHANDLE in this reference, is
+usually a scalar variable. (Exceptions exist, described in "Other
+considerations", below.) If the call to C<open> succeeds, then the
+expression provided as FILEHANDLE will get assigned an open
+I<filehandle>. That filehandle provides an internal reference to the
+specified external file, conveniently stored in a Perl variable, and
+ready for I/O operations such as reading and writing.
+
+=item About modes
+
+When calling C<open> with three or more arguments, the second argument
+-- labeled MODE here -- defines the I<open mode>. MODE is usually a
+literal string comprising special characters that define the intended
+I/O role of the filehandle being created: whether it's read-only, or
+read-and-write, and so on.
+
+If MODE is C<< < >>, the file is opened for input (read-only).
  If MODE is C<< > >>, the file is opened for output, with existing files
  first being truncated ("clobbered") and nonexisting files newly created.
  If MODE is C<<< >> >>>, the file is opened for appending, again being
@@ -4428,60 +4532,59 @@ indicate that you want both read and write access to the file; thus
  C<< +< >> is almost always preferred for read/write updates--the
  C<< +> >> mode would clobber the file first.  You can't usually use
  either read-write mode for updating textfiles, since they have
-variable-length records.  See the B<-i> switch in L<perlrun> for a
-better approach.  The file is created with permissions of C<0666>
-modified by the process's L<C<umask>|/umask EXPR> value.
+variable-length records.  See the B<-i> switch in
+L<perlrun|perlrun/-i[extension]> for a better approach.  The file is
+created with permissions of C<0666> modified by the process's
+L<C<umask>|/umask EXPR> value.
  
  These various prefixes correspond to the L<fopen(3)> modes of C<r>,
  C<r+>, C<w>, C<w+>, C<a>, and C<a+>.
  
-In the one- and two-argument forms of the call, the mode and filename
-should be concatenated (in that order), preferably separated by white
-space.  You can--but shouldn't--omit the mode in these forms when that mode
-is C<< < >>.  It is safe to use the two-argument form of
-L<C<open>|/open FILEHANDLE,EXPR> if the filename argument is a known literal.
+More examples of different modes in action:
  
-For three or more arguments if MODE is C<|->, the filename is
-interpreted as a command to which output is to be piped, and if MODE
-is C<-|>, the filename is interpreted as a command that pipes
-output to us.  In the two-argument (and one-argument) form, one should
-replace dash (C<->) with the command.
-See L<perlipc/"Using open() for IPC"> for more examples of this.
-(You are not allowed to L<C<open>|/open FILEHANDLE,EXPR> to a command
-that pipes both in I<and> out, but see L<IPC::Open2>, L<IPC::Open3>, and
-L<perlipc/"Bidirectional Communication with Another Process"> for
-alternatives.)
+ # Open a file for appending
+ open(my $log, ">>", "/usr/spool/news/twitlog")
+     or warn "Couldn't open log file; input will be discarded";
  
-In the form of pipe opens taking three or more arguments, if LIST is specified
-(extra arguments after the command name) then LIST becomes arguments
-to the command invoked if the platform supports it.  The meaning of
-L<C<open>|/open FILEHANDLE,EXPR> with more than three arguments for
-non-pipe modes is not yet defined, but experimental "layers" may give
-extra LIST arguments meaning.
+ # Open a file for reading and writing
+ open(my $dbase, "+<", "dbase.mine")
+     or die "Can't open 'dbase.mine' for update: $!";
  
-In the two-argument (and one-argument) form, opening C<< <- >>
-or C<-> opens STDIN and opening C<< >- >> opens STDOUT.
+=item Checking the return value
+
+Open returns nonzero on success, the undefined value otherwise.  If
+the L<C<open>|/open FILEHANDLE,MODE,EXPR> involved a pipe, the return value
+happens to be the pid of the subprocess.
  
-You may (and usually should) use the three-argument form of open to specify
-I/O layers (sometimes referred to as "disciplines") to apply to the handle
-that affect how the input and output are processed (see L<open> and
+When opening a file, it's seldom a good idea to continue
+if the request failed, so L<C<open>|/open FILEHANDLE,MODE,EXPR> is frequently
+used with L<C<die>|/die LIST>. Even if you want your code to do
+something other than C<die> on a failed open, you should still always
+check
+the return value from opening a file.
+
+=back
+
+=item Specifying I/O layers in MODE
+
+You can use the three-argument form of open to specify
+I/O layers (sometimes referred to as "disciplines") to apply to the new
+filehandle. These affect how the input and output are processed (see
+L<open> and
  L<PerlIO> for more details).  For example:
  
    open(my $fh, "<:encoding(UTF-8)", $filename)
      || die "Can't open UTF-8 encoded $filename: $!";
  
-opens the UTF8-encoded file containing Unicode characters;
+This opens the UTF8-encoded file containing Unicode characters;
  see L<perluniintro>.  Note that if layers are specified in the
-three-argument form, then default layers stored in ${^OPEN} (see L<perlvar>;
-usually set by the L<open> pragma or the switch C<-CioD>) are ignored.
+three-argument form, then default layers stored in
+L<C<${^OPEN}>|perlvar/${^OPEN}>
+(usually set by the L<open> pragma or the switch C<-CioD>) are ignored.
  Those layers will also be ignored if you specify a colon with no name
  following it.  In that case the default layer for the operating system
  (:raw on Unix, :crlf on Windows) is used.
  
-Open returns nonzero on success, the undefined value otherwise.  If
-the L<C<open>|/open FILEHANDLE,EXPR> involved a pipe, the return value
-happens to be the pid of the subprocess.
-
  On some systems (in general, DOS- and Windows-based systems)
  L<C<binmode>|/binmode FILEHANDLE, LAYER> is necessary when you're not
  working with a text file.  For the sake of portability it is a good idea
@@ -4489,41 +4592,7 @@ always to use it when appropriate, and never to use it when it isn't
  appropriate.  Also, people can set their I/O to be by default
  UTF8-encoded Unicode, not bytes.
  
-When opening a file, it's seldom a good idea to continue
-if the request failed, so L<C<open>|/open FILEHANDLE,EXPR> is frequently
-used with L<C<die>|/die LIST>.  Even if L<C<die>|/die LIST> won't do
-what you want (say, in a CGI script,
-where you want to format a suitable error message (but there are
-modules that can help with that problem)) always check
-the return value from opening a file.
-
-The filehandle will be closed when its reference count reaches zero.
-If it is a lexically scoped variable declared with L<C<my>|/my VARLIST>,
-that usually
-means the end of the enclosing scope.  However, this automatic close
-does not check for errors, so it is better to explicitly close
-filehandles, especially those used for writing:
-
-    close($handle)
-       || warn "close failed: $!";
-
-An older style is to use a bareword as the filehandle, as
-
-    open(FH, "<", "input.txt")
-       or die "Can't open < input.txt: $!";
-
-Then you can use C<FH> as the filehandle, in C<< close FH >> and C<<
-<FH> >> and so on.  Note that it's a global variable, so this form is
-not recommended in new code.
-
-As a shortcut a one-argument call takes the filename from the global
-scalar variable of the same name as the filehandle:
-
-    $ARTICLE = 100;
-    open(ARTICLE) or die "Can't find article $ARTICLE: $!\n";
-
-Here C<$ARTICLE> must be a global (package) scalar variable - not one
-declared with L<C<my>|/my VARLIST> or L<C<state>|/state VARLIST>.
+=item Using C<undef> for temporary files
  
  As a special case the three-argument form with a read/write mode and the third
  argument being L<C<undef>|/undef EXPR>:
@@ -4535,11 +4604,16 @@ opens a filehandle to a newly created empty anonymous temporary file.
  sensible mode to use.)  You will need to
  L<C<seek>|/seek FILEHANDLE,POSITION,WHENCE> to do the reading.
  
-Perl is built using PerlIO by default.  Unless you've
-changed this (such as building Perl with C<Configure -Uuseperlio>), you can
-open filehandles directly to Perl scalars via:
  
-    open(my $fh, ">", \$variable) || ..
+=item Opening a filehandle into an in-memory scalar
+
+You can open filehandles directly to Perl scalars instead of a file or
+other resource external to the program. Accomplish this by providing a
+reference to that scalar as the third argument to C<open>, like so:
+
+ open(my $memory, ">", \$var)
+     or die "Can't open memory file: $!";
+ print $memory "foo!\n";              # output will appear in $var
  
  To (re)open C<STDOUT> or C<STDERR> as an in-memory file, close it first:
  
@@ -4554,33 +4628,111 @@ any code points over 0xFF.
  Opening in-memory files I<can> fail for a variety of reasons.  As with
  any other C<open>, check the return value for success.
  
+I<Technical note>: This feature works only when Perl is built with
+PerlIO -- the default, except with older (pre-5.16) Perl installations
+specifically built without it (e.g. via C<Configure -Uuseperlio>). You
+can see whether your Perl was built with PerlIO by running C<perl
+-V:useperlio>.  If it says C<'define'>, you have PerlIO; otherwise you
+don't.
+
  See L<perliol> for detailed info on PerlIO.
  
-General examples:
+=item Opening a filehandle into a command
  
- open(my $log, ">>", "/usr/spool/news/twitlog");
- # if the open fails, output is discarded
+If MODE is C<|->, then the filename is
+interpreted as a command to which output is to be piped, and if MODE
+is C<-|>, the filename is interpreted as a command that pipes
+output to us.  In the two-argument (and one-argument) form, one should
+replace dash (C<->) with the command.
+See L<perlipc/"Using open() for IPC"> for more examples of this.
+(You are not allowed to L<C<open>|/open FILEHANDLE,MODE,EXPR> to a command
+that pipes both in I<and> out, but see L<IPC::Open2>, L<IPC::Open3>, and
+L<perlipc/"Bidirectional Communication with Another Process"> for
+alternatives.)
  
- open(my $dbase, "+<", "dbase.mine")      # open for update
-     or die "Can't open 'dbase.mine' for update: $!";
-
- open(my $dbase, "+<dbase.mine")          # ditto
-     or die "Can't open 'dbase.mine' for update: $!";
  
   open(my $article_fh, "-|", "caesar <$article")  # decrypt
                                                   # article
       or die "Can't start caesar: $!";
-
+     
   open(my $article_fh, "caesar <$article |")      # ditto
       or die "Can't start caesar: $!";
  
   open(my $out_fh, "|-", "sort >Tmp$$")    # $$ is our process id
       or die "Can't start sort: $!";
  
- # in-memory files
- open(my $memory, ">", \$var)
-     or die "Can't open memory file: $!";
- print $memory "foo!\n";              # output will appear in $var
+
+In the form of pipe opens taking three or more arguments, if LIST is specified
+(extra arguments after the command name) then LIST becomes arguments
+to the command invoked if the platform supports it.  The meaning of
+L<C<open>|/open FILEHANDLE,MODE,EXPR> with more than three arguments for
+non-pipe modes is not yet defined, but experimental "layers" may give
+extra LIST arguments meaning.
+
+If you open a pipe on the command C<-> (that is, specify either C<|-> or C<-|>
+with the one- or two-argument forms of
+L<C<open>|/open FILEHANDLE,MODE,EXPR>), an implicit L<C<fork>|/fork> is done,
+so L<C<open>|/open FILEHANDLE,MODE,EXPR> returns twice: in the parent process
+it returns the pid
+of the child process, and in the child process it returns (a defined) C<0>.
+Use C<defined($pid)> or C<//> to determine whether the open was successful.
+
+For example, use either
+
+   my $child_pid = open(my $from_kid, "-|") // die "Can't fork: $!";
+
+or
+
+   my $child_pid = open(my $to_kid,   "|-") // die "Can't fork: $!";
+
+followed by
+
+    if ($child_pid) {
+       # am the parent:
+       # either write $to_kid or else read $from_kid
+       ...
+       waitpid $child_pid, 0;
+    } else {
+       # am the child; use STDIN/STDOUT normally
+       ...
+       exit;
+    }
+
+The filehandle behaves normally for the parent, but I/O to that
+filehandle is piped from/to the STDOUT/STDIN of the child process.
+In the child process, the filehandle isn't opened--I/O happens from/to
+the new STDOUT/STDIN.  Typically this is used like the normal
+piped open when you want to exercise more control over just how the
+pipe command gets executed, such as when running setuid and
+you don't want to have to scan shell commands for metacharacters.
+
+The following blocks are more or less equivalent:
+
+    open(my $fh, "|tr '[a-z]' '[A-Z]'");
+    open(my $fh, "|-", "tr '[a-z]' '[A-Z]'");
+    open(my $fh, "|-") || exec 'tr', '[a-z]', '[A-Z]';
+    open(my $fh, "|-", "tr", '[a-z]', '[A-Z]');
+
+    open(my $fh, "cat -n '$file'|");
+    open(my $fh, "-|", "cat -n '$file'");
+    open(my $fh, "-|") || exec "cat", "-n", $file;
+    open(my $fh, "-|", "cat", "-n", $file);
+
+The last two examples in each block show the pipe as "list form", which is
+not yet supported on all platforms.  A good rule of thumb is that if
+your platform has a real L<C<fork>|/fork> (in other words, if your platform is
+Unix, including Linux and MacOS X), you can use the list form.  You would
+want to use the list form of the pipe so you can pass literal arguments
+to the command without risk of the shell interpreting any shell metacharacters
+in them.  However, this also bars you from opening pipes to commands
+that intentionally contain shell metacharacters, such as:
+
+    open(my $fh, "|cat -n | expand -4 | lpr")
+       || die "Can't open pipeline to lpr: $!";
+
+See L<perlipc/"Safe Pipe Opens"> for more examples of this.
+
+=item Duping filehandles
  
  You may also, in the Bourne shell tradition, specify an EXPR beginning
  with C<< >& >>, in which case the rest of the string is interpreted
@@ -4646,72 +4798,74 @@ L<fdopen(3)> to implement the C<=> functionality.  On many Unix systems,
  L<fdopen(3)> fails when file descriptors exceed a certain value, typically 255.
  For Perls 5.8.0 and later, PerlIO is (most often) the default.
  
-You can see whether your Perl was built with PerlIO by running
-C<perl -V:useperlio>.  If it says C<'define'>, you have PerlIO;
-otherwise you don't.
+=item Legacy usage
  
-If you open a pipe on the command C<-> (that is, specify either C<|-> or C<-|>
-with the one- or two-argument forms of
-L<C<open>|/open FILEHANDLE,EXPR>), an implicit L<C<fork>|/fork> is done,
-so L<C<open>|/open FILEHANDLE,EXPR> returns twice: in the parent process
-it returns the pid
-of the child process, and in the child process it returns (a defined) C<0>.
-Use C<defined($pid)> or C<//> to determine whether the open was successful.
+This section describes ways to call C<open> outside of best practices;
+you may encounter these uses in older code. Perl does not consider their
+use deprecated, exactly, but neither is it recommended in new code, for
+the sake of clarity and readability.
  
-For example, use either
+=over
  
-   my $child_pid = open(my $from_kid, "-|") // die "Can't fork: $!";
+=item Specifying mode and filename as a single argument
  
-or
+In the one- and two-argument forms of the call, the mode and filename
+should be concatenated (in that order), preferably separated by white
+space.  You can--but shouldn't--omit the mode in these forms when that mode
+is C<< < >>.  It is safe to use the two-argument form of
+L<C<open>|/open FILEHANDLE,MODE,EXPR> if the filename argument is a known literal.
  
-   my $child_pid = open(my $to_kid,   "|-") // die "Can't fork: $!";
+ open(my $dbase, "+<dbase.mine")          # open for update
+     or die "Can't open 'dbase.mine' for update: $!";
  
-followed by
+In the two-argument (and one-argument) form, opening C<< <- >>
+or C<-> opens STDIN and opening C<< >- >> opens STDOUT.
  
-    if ($child_pid) {
-       # am the parent:
-       # either write $to_kid or else read $from_kid
-       ...
-       waitpid $child_pid, 0;
-    } else {
-       # am the child; use STDIN/STDOUT normally
-       ...
-       exit;
-    }
+New code should favor the three-argument form of C<open> over this older
+form. Declaring the mode and the filename as two distinct arguments
+avoids any confusion between the two.
  
-The filehandle behaves normally for the parent, but I/O to that
-filehandle is piped from/to the STDOUT/STDIN of the child process.
-In the child process, the filehandle isn't opened--I/O happens from/to
-the new STDOUT/STDIN.  Typically this is used like the normal
-piped open when you want to exercise more control over just how the
-pipe command gets executed, such as when running setuid and
-you don't want to have to scan shell commands for metacharacters.
+=item Calling C<open> with one argument via global variables
  
-The following blocks are more or less equivalent:
+As a shortcut, a one-argument call takes the filename from the global
+scalar variable of the same name as the filehandle:
  
-    open(my $fh, "|tr '[a-z]' '[A-Z]'");
-    open(my $fh, "|-", "tr '[a-z]' '[A-Z]'");
-    open(my $fh, "|-") || exec 'tr', '[a-z]', '[A-Z]';
-    open(my $fh, "|-", "tr", '[a-z]', '[A-Z]');
+    $ARTICLE = 100;
+    open(ARTICLE) or die "Can't find article $ARTICLE: $!\n";
  
-    open(my $fh, "cat -n '$file'|");
-    open(my $fh, "-|", "cat -n '$file'");
-    open(my $fh, "-|") || exec "cat", "-n", $file;
-    open(my $fh, "-|", "cat", "-n", $file);
+Here C<$ARTICLE> must be a global (package) scalar variable - not one
+declared with L<C<my>|/my VARLIST> or L<C<state>|/state VARLIST>.
  
-The last two examples in each block show the pipe as "list form", which is
-not yet supported on all platforms.  A good rule of thumb is that if
-your platform has a real L<C<fork>|/fork> (in other words, if your platform is
-Unix, including Linux and MacOS X), you can use the list form.  You would
-want to use the list form of the pipe so you can pass literal arguments
-to the command without risk of the shell interpreting any shell metacharacters
-in them.  However, this also bars you from opening pipes to commands
-that intentionally contain shell metacharacters, such as:
+=item Assigning a filehandle to a bareword
  
-    open(my $fh, "|cat -n | expand -4 | lpr")
-       || die "Can't open pipeline to lpr: $!";
+An older style is to use a bareword as the filehandle, as
  
-See L<perlipc/"Safe Pipe Opens"> for more examples of this.
+    open(FH, "<", "input.txt")
+       or die "Can't open < input.txt: $!";
+
+Then you can use C<FH> as the filehandle, in C<< close FH >> and C<<
+<FH> >> and so on.  Note that it's a global variable, so this form is
+not recommended in new code.
+
+=back
+
+=item Other considerations
+
+=over
+
+=item Automatic filehandle closure
+
+The filehandle will be closed when its reference count reaches zero.
+If it is a lexically scoped variable declared with L<C<my>|/my VARLIST>,
+that usually
+means the end of the enclosing scope.  However, this automatic close
+does not check for errors, so it is better to explicitly close
+filehandles, especially those used for writing:
+
+    close($handle)
+       || warn "close failed: $!";
+
+=item Automatic pipe flushing
  
  Perl will attempt to flush all files opened for
  output before any operation that may do a fork, but this may not be
@@ -4728,8 +4882,19 @@ Closing any piped filehandle causes the parent process to wait for the
  child to finish, then returns the status value in L<C<$?>|perlvar/$?> and
  L<C<${^CHILD_ERROR_NATIVE}>|perlvar/${^CHILD_ERROR_NATIVE}>.
  
+=item Direct versus by-reference assignment of filehandles
+
+If FILEHANDLE -- the first argument in a call to C<open> -- is an
+undefined scalar variable (or array or hash element), a new filehandle
+is autovivified, meaning that the variable is assigned a reference to a
+newly allocated anonymous filehandle.  Otherwise if FILEHANDLE is an
+expression, its value is the real filehandle.  (This is considered a
+symbolic reference, so C<use strict "refs"> should I<not> be in effect.)
+
+=item Whitespace and special characters in the filename argument
+
  The filename passed to the one- and two-argument forms of
-L<C<open>|/open FILEHANDLE,EXPR> will
+L<C<open>|/open FILEHANDLE,MODE,EXPR> will
  have leading and trailing whitespace deleted and normal
  redirection characters honored.  This property, known as "magic open",
  can often be used to good effect.  A user could specify a filename of
@@ -4751,7 +4916,7 @@ otherwise it's necessary to protect any leading and trailing whitespace:
  
  (this may not work on some bizarre filesystems).  One should
  conscientiously choose between the I<magic> and I<three-argument> form
-of L<C<open>|/open FILEHANDLE,EXPR>:
+of L<C<open>|/open FILEHANDLE,MODE,EXPR>:
  
      open(my $in, $ARGV[0]) || die "Can't open $ARGV[0]: $!";
  
@@ -4765,10 +4930,12 @@ will have exactly the opposite restrictions. (However, some shells
  support the syntax C<< perl your_program.pl <( rsh cat file ) >>, which
  produces a filename that can be opened normally.)
  
+=item Invoking C-style C<open>
+
  If you want a "real" C L<open(2)>, then you should use the
  L<C<sysopen>|/sysopen FILEHANDLE,FILENAME,MODE> function, which involves
  no such magic (but uses different filemodes than Perl
-L<C<open>|/open FILEHANDLE,EXPR>, which corresponds to C L<fopen(3)>).
+L<C<open>|/open FILEHANDLE,MODE,EXPR>, which corresponds to C L<fopen(3)>).
  This is another way to protect your filenames from interpretation.  For
  example:
  
@@ -4783,7 +4950,14 @@ example:
  See L<C<seek>|/seek FILEHANDLE,POSITION,WHENCE> for some details about
  mixing reading and writing.
  
-Portability issues: L<perlport/open>.
+=item Portability issues
+
+See L<perlport/open>.
+
+=back
+
+=back
+
  
  =item opendir DIRHANDLE,EXPR
  X<opendir>
@@ -5979,7 +6153,7 @@ This protects against those locales where characters such as C<"|"> are
  considered to be word characters.
  
  Otherwise, Perl quotes non-ASCII characters using an adaptation from
-Unicode (see L<http://www.unicode.org/reports/tr31/>).
+Unicode (see L<https://www.unicode.org/reports/tr31/>).
  The only code points that are quoted are those that have any of the
  Unicode properties:  Pattern_Syntax, Pattern_White_Space, White_Space,
  Default_Ignorable_Code_Point, or General_Category=Control.
@@ -6070,14 +6244,15 @@ results in the string being padded to the required size with C<"\0">
  bytes before the result of the read is appended.
  
  The call is implemented in terms of either Perl's or your system's native
-L<fread(3)> library function.  To get a true L<read(2)> system call, see
+L<fread(3)> library function, via the L<PerlIO> layers applied to the
+handle.  To get a true L<read(2)> system call, see
  L<sysread|/sysread FILEHANDLE,SCALAR,LENGTH,OFFSET>.
  
  Note the I<characters>: depending on the status of the filehandle,
  either (8-bit) bytes or characters are read.  By default, all
  filehandles operate on bytes, but for example if the filehandle has
  been opened with the C<:utf8> I/O layer (see
-L<C<open>|/open FILEHANDLE,EXPR>, and the L<open>
+L<C<open>|/open FILEHANDLE,MODE,EXPR>, and the L<open>
  pragma), the I/O will operate on UTF8-encoded Unicode
  characters, not bytes.  Similarly for the C<:encoding> layer:
  in that case pretty much any characters can be read.
@@ -6104,6 +6279,10 @@ it would have been testing the wrong file.
  
  As of Perl 5.12 you can use a bare L<C<readdir>|/readdir DIRHANDLE> in a
  C<while> loop, which will set L<C<$_>|perlvar/$_> on every iteration.
+If either a C<readdir> expression or an explicit assignment of a
+C<readdir> expression to a scalar is used as a C<while>/C<for> condition,
+then the condition actually tests for definedness of the expression's
+value, not for its regular truth value.
  
      opendir(my $dh, $some_dir) || die "Can't open $some_dir: $!";
      while (readdir $dh) {
@@ -6173,6 +6352,13 @@ L<C<eof>|/eof FILEHANDLE> handles C<ARGV> differently.
          }
      }
  
+Like the C<< <EXPR> >> operator, if a C<readline> expression is
+used as the condition of a C<while> or C<for> loop, then it will be
+implicitly assigned to C<$_>.  If either a C<readline> expression or
+an explicit assignment of a C<readline> expression to a scalar is used
+as a C<while>/C<for> condition, then the condition actually tests for
+definedness of the expression's value, not for its regular truth value.
+
  =item readlink EXPR
  X<readlink>
  
@@ -6202,7 +6388,7 @@ multi-line) string.  In list context, returns a list of lines
  C<$INPUT_RECORD_SEPARATOR> in L<English>)).
  This is the internal function implementing the C<qx/EXPR/>
  operator, but you can use it directly.  The C<qx/EXPR/>
-operator is discussed in more detail in L<perlop/"I/O Operators">.
+operator is discussed in more detail in L<perlop/"C<qx/I<STRING>/>">.
  If EXPR is omitted, uses L<C<$_>|perlvar/$_>.
  
  =item recv SOCKET,SCALAR,LENGTH,FLAGS
@@ -6219,14 +6405,9 @@ string otherwise.  If there's an error, returns the undefined value.
  This call is actually implemented in terms of the L<recvfrom(2)> system call.
  See L<perlipc/"UDP: Message Passing"> for examples.
  
-Note the I<characters>: depending on the status of the socket, either
-(8-bit) bytes or characters are received.  By default all sockets
-operate on bytes, but for example if the socket has been changed using
-L<C<binmode>|/binmode FILEHANDLE, LAYER> to operate with the
-C<:encoding(UTF-8)> I/O layer (see the L<open> pragma), the I/O will
-operate on UTF8-encoded Unicode
-characters, not bytes.  Similarly for the C<:encoding> layer: in that
-case pretty much any characters can be read.
+Note that if the socket has been marked as C<:utf8>, C<recv> will
+throw an exception.  The C<:encoding(...)> layer implicitly introduces
+the C<:utf8> layer.  See L<C<binmode>|/binmode FILEHANDLE, LAYER>.
  
  =item redo LABEL
  X<redo>
@@ -6263,13 +6444,13 @@ normally use this command:
          print;
      }
  
-L<C<redo>|/redo LABEL> cannot be used to retry a block that returns a
-value such as C<eval {}>, C<sub {}>, or C<do {}>, and should not be used
-to exit a L<C<grep>|/grep BLOCK LIST> or L<C<map>|/map BLOCK LIST>
+L<C<redo>|/redo LABEL> cannot return a value from a block that typically
+returns a value, such as C<eval {}>, C<sub {}>, or C<do {}>. It will perform
+its flow control behavior, which precludes any return value. It should not be
+used to exit a L<C<grep>|/grep BLOCK LIST> or L<C<map>|/map BLOCK LIST>
  operation.
  
-Note that a block by itself or a C<given> construct
-is semantically identical to a loop
+Note that a block by itself is semantically identical to a loop
  that executes once.  Thus L<C<redo>|/redo LABEL> inside such a block
  will effectively turn it into a looping construct.
  
@@ -6316,7 +6497,9 @@ C<HASH>, C<CODE>, C<FORMAT>, or C<IO>, indicating only which kind of
  object it is.  If the unblessed referent is a scalar, then the return
  value will be one of the strings C<SCALAR>, C<VSTRING>, C<REF>, C<GLOB>,
  C<LVALUE>, or C<REGEXP>, depending on the kind of value the scalar
-currently has.  Beware that these built-in type names can also be used as
+currently has.   But note that C<qr//> scalars are created already
+blessed, so C<ref qr/.../> will likely return C<Regexp>.  Beware that
+these built-in type names can also be used as
  class names, so C<ref> returning one of these names doesn't unambiguously
  indicate that the referent is of the kind to which the name refers.
  
@@ -6372,7 +6555,7 @@ compile time.
  
  Specifying VERSION as a numeric argument of the form 5.024001 should
  generally be avoided as older less readable syntax compared to
-v5.24.1. Before perl 5.8.0 released in 2002 the more verbose numeric
+v5.24.1. Before perl 5.8.0 (released in 2002), the more verbose numeric
  form was the only supported syntax, which is why you might see it in
  older code.
  
@@ -6446,14 +6629,16 @@ statements.
  If EXPR is a bareword, L<C<require>|/require VERSION> assumes a F<.pm>
  extension and replaces C<::> with C</> in the filename for you,
  to make it easy to load standard modules.  This form of loading of
-modules does not risk altering your namespace.
+modules does not risk altering your namespace; however, it will autovivify
+the stash for the required module.
  
  In other words, if you try this:
  
          require Foo::Bar;     # a splendid bareword
  
  The require function will actually look for the F<Foo/Bar.pm> file in the
-directories specified in the L<C<@INC>|perlvar/@INC> array.
+directories specified in the L<C<@INC>|perlvar/@INC> array, and it will
+autovivify the C<Foo::Bar::> stash at compile time.
  
  But if you try this:
  
@@ -6468,12 +6653,20 @@ will complain about not finding F<Foo::Bar> there.  In this case you can do:
  
          eval "require $class";
  
+or you could do
+
+        require "Foo/Bar.pm";
+
+Neither of these forms will autovivify any stashes at compile time; both
+have only run-time effects.
+
  Now that you understand how L<C<require>|/require VERSION> looks for
  files with a bareword argument, there is a little extra functionality
  going on behind the scenes.  Before L<C<require>|/require VERSION> looks
  for a F<.pm> extension, it will first look for a similar filename with a
  F<.pmc> extension.  If this file is found, it will be loaded in place of
-any file ending in a F<.pm> extension.
+any file ending in a F<.pm> extension. This applies to both the explicit
+C<require "Foo/Bar.pm";> form and the C<require Foo::Bar;> form.
  
  You can also insert hooks into the import facility by putting Perl code
  directly into the L<C<@INC>|perlvar/@INC> array.  There are three forms
@@ -6579,7 +6772,8 @@ Generally used in a L<C<continue>|/continue BLOCK> block at the end of a
  loop to clear variables and reset C<m?pattern?> searches so that they
  work again.  The
  expression is interpreted as a list of single characters (hyphens
-allowed for ranges).  All variables and arrays beginning with one of
+allowed for ranges).  All variables (scalars, arrays, and hashes)
+in the current package beginning with one of
  those letters are reset to their pristine state.  If the expression is
  omitted, one-match searches (C<m?pattern?>) are reset to match again.
  Only resets variables or searches in the current package.  Always returns
@@ -6592,6 +6786,7 @@ Only resets variables or searches in the current package.  Always returns
  Resetting C<"A-Z"> is not recommended because you'll wipe out your
  L<C<@ARGV>|perlvar/@ARGV> and L<C<@INC>|perlvar/@INC> arrays and your
  L<C<%ENV>|perlvar/%ENV> hash.
+
  Resets only package variables; lexical variables are unaffected, but
  they clean themselves up on scope exit anyway, so you'll probably want
  to use them instead.  See L<C<my>|/my VARLIST>.
@@ -6605,8 +6800,8 @@ X<return>
  
  Returns from a subroutine, L<C<eval>|/eval EXPR>,
  L<C<do FILE>|/do EXPR>, L<C<sort>|/sort SUBNAME LIST> block or regex
-eval block (but not a L<C<grep>|/grep BLOCK LIST> or
-L<C<map>|/map BLOCK LIST> block) with the value
+eval block (but not a L<C<grep>|/grep BLOCK LIST>,
+L<C<map>|/map BLOCK LIST>, or L<C<do BLOCK>|/do BLOCK> block) with the value
  given in EXPR.  Evaluation of EXPR may be in list, scalar, or void
  context, depending on how the return value will be used, and the context
  may vary from one execution to the next (see
@@ -6712,8 +6907,8 @@ X<say>
  =for Pod::Functions +say output a list to a filehandle, appending a newline
  
  Just like L<C<print>|/print FILEHANDLE LIST>, but implicitly appends a
-newline.  C<say LIST> is simply an abbreviation for
-C<{ local $\ = "\n"; print LIST }>.  To use FILEHANDLE without a LIST to
+newline at the end of the LIST instead of any value L<C<$\>|perlvar/$\>
+might have.  To use FILEHANDLE without a LIST to
  print the contents of L<C<$_>|perlvar/$_> to it, you must use a bareword
  filehandle like C<FH>, not an indirect one like C<$fh>.
  
@@ -7008,14 +7203,9 @@ case it does a L<sendto(2)> syscall.  Returns the number of characters sent,
  or the undefined value on error.  The L<sendmsg(2)> syscall is currently
  unimplemented.  See L<perlipc/"UDP: Message Passing"> for examples.
  
-Note the I<characters>: depending on the status of the socket, either
-(8-bit) bytes or characters are sent.  By default all sockets operate
-on bytes, but for example if the socket has been changed using
-L<C<binmode>|/binmode FILEHANDLE, LAYER> to operate with the
-C<:encoding(UTF-8)> I/O layer (see L<C<open>|/open FILEHANDLE,EXPR>, or
-the L<open> pragma), the I/O will operate on UTF-8
-encoded Unicode characters, not bytes.  Similarly for the C<:encoding>
-layer: in that case pretty much any characters can be sent.
+Note that if the socket has been marked as C<:utf8>, C<send> will
+throw an exception.  The C<:encoding(...)> layer implicitly introduces
+the C<:utf8> layer.  See L<C<binmode>|/binmode FILEHANDLE, LAYER>.
  
  =item setpgrp PID,PGRP
  X<setpgrp> X<group>
@@ -7467,7 +7657,7 @@ With proper care you may mix package and my (or state) C<$a> and/or C<$b>:
  
     # prints tinysmallnormalbighuge
  
-C<$a> and C<$b> are implicitely local to the sort() execution and regain their
+C<$a> and C<$b> are implicitly local to the sort() execution and regain their
  former values upon completing the sort.
  
  Sort subroutines written using C<$a> and C<$b> are bound to their calling
@@ -7993,8 +8183,8 @@ as supported by the compiler used to build Perl:
     h           interpret integer as C type "short" or
                 "unsigned short"
     j           interpret integer as C type "intmax_t" on Perl
-               5.14 or later; and only with a C99 compiler
-               prior to Perl 5.30 (unportable)
+               5.14 or later; and prior to Perl 5.30, only with
+               a C99 compiler (unportable)
     l           interpret integer as C type "long" or
                 "unsigned long"
     q, L, or ll interpret integer as C type "long long",
@@ -8002,8 +8192,8 @@ as supported by the compiler used to build Perl:
                 64-bit integers)
     t           interpret integer as C type "ptrdiff_t" on Perl
                 5.14 or later
-   z           interpret integer as C type "size_t" on Perl 5.14
-               or later
+   z           interpret integer as C types "size_t" or
+               "ssize_t" on Perl 5.14 or later
  
  As of 5.14, none of these raises an exception if they are not supported on
  your platform.  However, if warnings are enabled, a warning of the
@@ -8554,6 +8744,15 @@ parameters FILENAME, MODE, and PERMS.
  
  Returns true on success and L<C<undef>|/undef EXPR> otherwise.
  
+L<PerlIO> layers will be applied to the handle the same way they would in an
+L<C<open>|/open FILEHANDLE,MODE,EXPR> call that does not specify layers. That is,
+they use the current value of L<C<${^OPEN}>|perlvar/${^OPEN}> as set by the L<open>
+pragma in a lexical scope, or the C<-C> commandline option or C<PERL_UNICODE>
+environment variable in the main program scope, falling back to the platform
+defaults as described in L<PerlIO/Defaults and how to override them>. If you
+want to remove any layers that may transform the byte stream, use
+L<C<binmode>|/binmode FILEHANDLE, LAYER> after opening it.
+
  The possible values and flag bits of the MODE parameter are
  system-dependent; they are available via the standard module
  L<C<Fcntl>|Fcntl>.  See the documentation of your operating system's
@@ -8573,7 +8772,7 @@ OS/390 and on the Macintosh; you probably don't want to
  use them in new code.
  
  If the file named by FILENAME does not exist and the
-L<C<open>|/open FILEHANDLE,EXPR> call creates
+L<C<open>|/open FILEHANDLE,MODE,EXPR> call creates
  it (typically because MODE includes the C<O_CREAT> flag), then the value of
  PERMS specifies the permissions of the newly created file.  If you omit
  the PERMS argument to L<C<sysopen>|/sysopen FILEHANDLE,FILENAME,MODE>,
@@ -8603,6 +8802,13 @@ L<C<sysopen>|/sysopen FILEHANDLE,FILENAME,MODE>, because
  that takes away the user's option to have a more permissive umask.
  Better to omit it.  See L<C<umask>|/umask EXPR> for more on this.
  
+This function has no direct relation to the usage of
+L<C<sysread>|/sysread FILEHANDLE,SCALAR,LENGTH,OFFSET>,
+L<C<syswrite>|/syswrite FILEHANDLE,SCALAR,LENGTH,OFFSET>,
+or L<C<sysseek>|/sysseek FILEHANDLE,POSITION,WHENCE>.  A handle opened with
+this function can be used with buffered IO just as one opened with
+L<C<open>|/open FILEHANDLE,MODE,EXPR> can be used with unbuffered IO.
+
  Note that under Perls older than 5.8.0,
  L<C<sysopen>|/sysopen FILEHANDLE,FILENAME,MODE> depends on the
  L<fdopen(3)> C library function.  On many Unix systems, L<fdopen(3)> is known
@@ -8623,13 +8829,14 @@ X<sysread>
  =for Pod::Functions fixed-length unbuffered input from a filehandle
  
  Attempts to read LENGTH bytes of data into variable SCALAR from the
-specified FILEHANDLE, using L<read(2)>.  It bypasses
-buffered IO, so mixing this with other kinds of reads,
+specified FILEHANDLE, using L<read(2)>.  It bypasses any L<PerlIO> layers
+including buffered IO (but is affected by the presence of the C<:utf8>
+layer as described later), so mixing this with other kinds of reads,
  L<C<print>|/print FILEHANDLE LIST>, L<C<write>|/write FILEHANDLE>,
  L<C<seek>|/seek FILEHANDLE,POSITION,WHENCE>,
  L<C<tell>|/tell FILEHANDLE>, or L<C<eof>|/eof FILEHANDLE> can cause
  confusion because the
-perlio or stdio layers usually buffer data.  Returns the number of
+C<:perlio> or C<:crlf> layers usually buffer data.  Returns the number of
  bytes actually read, C<0> at end of file, or undef if there was an
  error (in the latter case L<C<$!>|perlvar/$!> is also set).  SCALAR will
  be grown or
@@ -8646,15 +8853,13 @@ bytes before the result of the read is appended.
  There is no syseof() function, which is ok, since
  L<C<eof>|/eof FILEHANDLE> doesn't work well on device files (like ttys)
  anyway.  Use L<C<sysread>|/sysread FILEHANDLE,SCALAR,LENGTH,OFFSET> and
-check for a return value for 0 to decide whether you're done.
+check for a return value of 0 to decide whether you're done.
  
-Note that if the filehandle has been marked as C<:utf8>, Unicode
-characters are read instead of bytes (the LENGTH, OFFSET, and the
-return value of L<C<sysread>|/sysread FILEHANDLE,SCALAR,LENGTH,OFFSET>
-are in Unicode characters).  The C<:encoding(...)> layer implicitly
+Note that if the filehandle has been marked as C<:utf8>, C<sysread> will
+throw an exception.  The C<:encoding(...)> layer implicitly
  introduces the C<:utf8> layer.  See
  L<C<binmode>|/binmode FILEHANDLE, LAYER>,
-L<C<open>|/open FILEHANDLE,EXPR>, and the L<open> pragma.
+L<C<open>|/open FILEHANDLE,MODE,EXPR>, and the L<open> pragma.
  
  =item sysseek FILEHANDLE,POSITION,WHENCE
  X<sysseek> X<lseek>
@@ -8663,7 +8868,7 @@ X<sysseek> X<lseek>
  
  Sets FILEHANDLE's system position I<in bytes> using L<lseek(2)>.  FILEHANDLE may
  be an expression whose value gives the name of the filehandle.  The values
-for WHENCE are C<0> to set the new position to POSITION; C<1> to set the it
+for WHENCE are C<0> to set the new position to POSITION; C<1> to set it
  to the current position plus POSITION; and C<2> to set it to EOF plus
  POSITION, typically negative.
  
@@ -8795,12 +9000,14 @@ X<syswrite>
  
  Attempts to write LENGTH bytes of data from variable SCALAR to the
  specified FILEHANDLE, using L<write(2)>.  If LENGTH is
-not specified, writes whole SCALAR.  It bypasses buffered IO, so
+not specified, writes whole SCALAR.  It bypasses any L<PerlIO> layers
+including buffered IO (but is affected by the presence of the C<:utf8>
+layer as described later), so
  mixing this with reads (other than C<sysread>),
  L<C<print>|/print FILEHANDLE LIST>, L<C<write>|/write FILEHANDLE>,
  L<C<seek>|/seek FILEHANDLE,POSITION,WHENCE>,
  L<C<tell>|/tell FILEHANDLE>, or L<C<eof>|/eof FILEHANDLE> may cause
-confusion because the perlio and stdio layers usually buffer data.
+confusion because the C<:perlio> and C<:crlf> layers usually buffer data.
  Returns the number of bytes actually written, or L<C<undef>|/undef EXPR>
  if there was an error (in this case the errno variable
  L<C<$!>|perlvar/$!> is also set).  If the LENGTH is greater than the
@@ -8812,15 +9019,12 @@ string other than the beginning.  A negative OFFSET specifies writing
  that many characters counting backwards from the end of the string.
  If SCALAR is of length zero, you can only use an OFFSET of 0.
  
-B<WARNING>: If the filehandle is marked C<:utf8>, Unicode characters
-encoded in UTF-8 are written instead of bytes, and the LENGTH, OFFSET, and
-return value of L<C<syswrite>|/syswrite FILEHANDLE,SCALAR,LENGTH,OFFSET>
-are in (UTF8-encoded Unicode) characters.
+B<WARNING>: If the filehandle is marked C<:utf8>, C<syswrite> will raise an exception.
  The C<:encoding(...)> layer implicitly introduces the C<:utf8> layer.
  Alternately, if the handle is not marked with an encoding but you
  attempt to write characters with code points over 255, C<syswrite> raises an exception.
  See L<C<binmode>|/binmode FILEHANDLE, LAYER>,
-L<C<open>|/open FILEHANDLE,EXPR>, and the L<open> pragma.
+L<C<open>|/open FILEHANDLE,MODE,EXPR>, and the L<open> pragma.
  
  =item tell FILEHANDLE
  X<tell>
@@ -9326,7 +9530,7 @@ want a version of Perl older than the specified one.
  Specifying VERSION as a numeric argument of the form 5.024001 should
  generally be avoided as an older, less readable syntax compared to
  v5.24.1.  Before perl 5.8.0, released in 2002, the more verbose numeric
-orm was the only supported syntax, which is why you might see it in
+form was the only supported syntax, which is why you might see it in older code.
  
      use v5.24.1;    # compile time version check
      use 5.24.1;     # ditto
@@ -9448,9 +9652,10 @@ I<only> meant to be used to assert that the running Perl is of an earlier
  version than its argument and I<not> to undo the feature-enabling side effects
  of C<use VERSION>.
  
-See L<perlmodlib> for a list of standard modules and pragmas.  See L<perlrun>
-for the C<-M> and C<-m> command-line options to Perl that give
-L<C<use>|/use Module VERSION LIST> functionality from the command-line.
+See L<perlmodlib> for a list of standard modules and pragmas.  See
+L<perlrun|perlrun/-m[-]module> for the C<-M> and C<-m> command-line
+options to Perl that give L<C<use>|/use Module VERSION LIST>
+functionality from the command-line.
  
  =item utime LIST
  X<utime>
@@ -9529,9 +9734,12 @@ may behave differently to Perl's hashes with respect to changes in order on
  insertion and deletion of items.
  
  As a side effect, calling L<C<values>|/values HASH> resets the HASH or
-ARRAY's internal iterator, see L<C<each>|/each HASH>.  (In particular,
+ARRAY's internal iterator (see L<C<each>|/each HASH>) before yielding the
+values.  In particular,
  calling L<C<values>|/values HASH> in void context resets the iterator
-with no other overhead.  Apart from resetting the iterator,
+with no other overhead.
+
+Apart from resetting the iterator,
  C<values @array> in list context is the same as plain C<@array>.
  (We recommend that you use void context C<keys @array> for this, but
  reasoned that taking C<values @array> out would require more
@@ -9599,10 +9807,8 @@ to try to write off the beginning of the string (i.e., negative OFFSET).
  If the string happens to be encoded as UTF-8 internally (and thus has
  the UTF8 flag set), L<C<vec>|/vec EXPR,OFFSET,BITS> tries to convert it
  to use a one-byte-per-character internal representation. However, if the
-string contains characters with values of 256 or higher, that conversion
-will fail, and a deprecation message will be raised.  In that situation,
-C<vec> will operate on the underlying buffer regardless, in its internal
-UTF-8 representation.  In Perl 5.32, this will be a fatal error.
+string contains characters with values of 256 or higher, a fatal error
+will occur.
  
  Strings created with L<C<vec>|/vec EXPR,OFFSET,BITS> can also be
  manipulated with the logical
@@ -10108,11 +10314,11 @@ Statements">.
  
  =over
  
-=item given
+=item default
  
-=item whereis
+=item given
  
-=item whereso
+=item when
  
  These flow-control keywords related to the experimental switch feature are
  documented in L<perlsyn/"Switch Statements">.