package CGI::Simple::Util; use strict; use warnings; use vars qw( $VERSION @EXPORT_OK @ISA $UTIL ); $VERSION = '1.281'; require Exporter; @ISA = qw( Exporter ); @EXPORT_OK = qw( rearrange make_attributes expires escapeHTML unescapeHTML escape unescape ); sub rearrange { my ( $order, @params ) = @_; my ( %pos, @result, %leftover ); return () unless @params; if ( ref $params[0] eq 'HASH' ) { @params = %{ $params[0] }; } else { return @params unless $params[0] =~ m/^-/; } # map parameters into positional indices my $i = 0; for ( @$order ) { for ( ref( $_ ) eq 'ARRAY' ? @$_ : $_ ) { $pos{ lc( $_ ) } = $i; } $i++; } $#result = $#$order; # preextend while ( @params ) { my $key = lc( shift( @params ) ); $key =~ s/^\-//; if ( exists $pos{$key} ) { $result[ $pos{$key} ] = shift( @params ); } else { $leftover{$key} = shift( @params ); } } push @result, make_attributes( \%leftover, 1 ) if %leftover; return @result; } sub make_attributes { my $attref = shift; my $escape = shift || 0; return () unless $attref && ref $attref eq 'HASH'; my @attrib; for my $key ( keys %{$attref} ) { ( my $mod_key = $key ) =~ s/^-//; # get rid of initial - if present $mod_key = lc $mod_key; # parameters are lower case $mod_key =~ tr/_/-/; # use dashes my $value = $escape ? escapeHTML( $attref->{$key} ) : $attref->{$key}; push @attrib, defined $value ? qq/$mod_key="$value"/ : $mod_key; } return @attrib; } # This internal routine creates date strings suitable for use in # cookies and HTTP headers. (They differ, unfortunately.) # Thanks to Mark Fisher for this. sub expires { my ( $time, $format ) = @_; $format ||= 'http'; my @MON = qw( Jan Feb Mar Apr May Jun Jul Aug Sep Oct Nov Dec); my @WDAY = qw( Sun Mon Tue Wed Thu Fri Sat ); # pass through preformatted dates for the sake of expire_calc() $time = _expire_calc( $time ); return $time unless $time =~ /^\d+$/; # make HTTP/cookie date string from GMT'ed time # (cookies use '-' as date separator, HTTP uses ' ') my $sc = $format eq 'cookie' ? '-' : ' '; my ( $sec, $min, $hour, $mday, $mon, $year, $wday ) = gmtime( $time ); $year += 1900; return sprintf( "%s, %02d$sc%s$sc%04d %02d:%02d:%02d GMT", $WDAY[$wday], $mday, $MON[$mon], $year, $hour, $min, $sec ); } # This internal routine creates an expires time exactly some number of # hours from the current time. It incorporates modifications from Mark Fisher. # format for time can be in any of the forms... # "now" -- expire immediately # "+180s" -- in 180 seconds # "+2m" -- in 2 minutes # "+12h" -- in 12 hours # "+1d" -- in 1 day # "+3M" -- in 3 months # "+2y" -- in 2 years # "-3m" -- 3 minutes ago(!) # If you don't supply one of these forms, we assume you are specifying # the date yourself sub _expire_calc { my ( $time ) = @_; my %mult = ( 's' => 1, 'm' => 60, 'h' => 60 * 60, 'd' => 60 * 60 * 24, 'M' => 60 * 60 * 24 * 30, 'y' => 60 * 60 * 24 * 365 ); my $offset; if ( !$time or lc $time eq 'now' ) { $offset = 0; } elsif ( $time =~ /^\d+/ ) { return $time; } elsif ( $time =~ /^([+-]?(?:\d+|\d*\.\d*))([mhdMy]?)/ ) { $offset = ( $mult{$2} || 1 ) * $1; } else { return $time; } my $cur_time = time; return ( $cur_time + $offset ); } sub escapeHTML { my ( $escape, $text ) = @_; return undef unless defined $escape; $escape =~ s/&/&/g; $escape =~ s/"/"/g; $escape =~ s//>/g; # these next optional escapes make text look the same when rendered in HTML if ( $text ) { $escape =~ s/\t/ /g; # tabs to 4 spaces $escape =~ s/( {2,})/" " x length $1/eg; # whitespace escapes $escape =~ s/\n/
\n/g; # newlines to
} return $escape; } sub unescapeHTML { my ( $unescape ) = @_; return undef unless defined( $unescape ); my $latin = $UTIL->{'charset'} =~ /^(?:ISO-8859-1|WINDOWS-1252)$/i; my $ebcdic = $UTIL->{'ebcdic'}; # credit to Randal Schwartz for original version of this $unescape =~ s[&(.*?);]{ local $_ = $1; /^amp$/i ? "&" : /^quot$/i ? '"' : /^gt$/i ? ">" : /^lt$/i ? "<" : /^#(\d+)$/ && $latin ? chr($1) : /^#(\d+)$/ && $ebcdic ? chr($UTIL->{'a2e'}->[$1]) : /^#x([0-9a-f]+)$/i && $latin ? chr(hex($1)) : /^#x([0-9a-f]+)$/i && $ebcdic ? chr($UTIL->{'a2e'}->[hex $1]) : "\&$_;" }gex; return $unescape; } # URL-encode data sub escape { my ( $toencode ) = @_; return undef unless defined $toencode; if ( $UTIL->{'ebcdic'} ) { $toencode =~ s/([^a-zA-Z0-9_.-])/uc sprintf "%%%02x", $UTIL->{'e2a'}->[ord $1]/eg; } else { $toencode =~ s/([^a-zA-Z0-9_.-])/uc sprintf "%%%02x", ord $1 /eg; } return $toencode; } # unescape URL-encoded data sub unescape { my ( $todecode ) = @_; return undef unless defined $todecode; $todecode =~ tr/+/ /; if ( $UTIL->{'ebcdic'} ) { $todecode =~ s/%([0-9a-fA-F]{2})/chr $UTIL->{'a2e'}->[hex $1]/ge; } else { $todecode =~ s/%(?:([0-9a-fA-F]{2})|u([0-9a-fA-F]{4}))/ defined($1)? chr hex($1) : utf8_chr(hex($2))/ge; } return $todecode; } sub utf8_chr ($) { my $c = shift; if ( $c < 0x80 ) { return sprintf( "%c", $c ); } elsif ( $c < 0x800 ) { return sprintf( "%c%c", 0xc0 | ( $c >> 6 ), 0x80 | ( $c & 0x3f ) ); } elsif ( $c < 0x10000 ) { return sprintf( "%c%c%c", 0xe0 | ( $c >> 12 ), 0x80 | ( ( $c >> 6 ) & 0x3f ), 0x80 | ( $c & 0x3f ) ); } elsif ( $c < 0x200000 ) { return sprintf( "%c%c%c%c", 0xf0 | ( $c >> 18 ), 0x80 | ( ( $c >> 12 ) & 0x3f ), 0x80 | ( ( $c >> 6 ) & 0x3f ), 0x80 | ( $c & 0x3f ) ); } elsif ( $c < 0x4000000 ) { return sprintf( "%c%c%c%c%c", 0xf8 | ( $c >> 24 ), 0x80 | ( ( $c >> 18 ) & 0x3f ), 0x80 | ( ( $c >> 12 ) & 0x3f ), 0x80 | ( ( $c >> 6 ) & 0x3f ), 0x80 | ( $c & 0x3f ) ); } elsif ( $c < 0x80000000 ) { return sprintf( "%c%c%c%c%c%c", 0xfc | ( $c >> 30 ), # was 0xfe patch Thomas L. Shinnick 0x80 | ( ( $c >> 24 ) & 0x3f ), 0x80 | ( ( $c >> 18 ) & 0x3f ), 0x80 | ( ( $c >> 12 ) & 0x3f ), 0x80 | ( ( $c >> 6 ) & 0x3f ), 0x80 | ( $c & 0x3f ) ); } else { return utf8( 0xfffd ); } } # We need to define a number of things about the operating environment so # we do this on first initialization and store the results in in an object BEGIN { $UTIL = CGI::Simple::Util->new; # initialize our $UTIL object sub new { my $class = shift; $class = ref( $class ) || $class; my $self = {}; bless $self, $class; $self->init; return $self; } sub init { my $self = shift; $self->charset; $self->os; $self->ebcdic; } sub charset { my ( $self, $charset ) = @_; $self->{'charset'} = $charset if $charset; $self->{'charset'} ||= 'ISO-8859-1'; # set to the safe ISO-8859-1 if not defined return $self->{'charset'}; } sub os { my ( $self, $OS ) = @_; $self->{'os'} = $OS if $OS; # allow value to be set manually $OS = $self->{'os'}; unless ( $OS ) { unless ( $OS = $^O ) { require Config; $OS = $Config::Config{'osname'}; } if ( $OS =~ /Win/i ) { $OS = 'WINDOWS'; } elsif ( $OS =~ /vms/i ) { $OS = 'VMS'; } elsif ( $OS =~ /bsdos/i ) { $OS = 'UNIX'; } elsif ( $OS =~ /dos/i ) { $OS = 'DOS'; } elsif ( $OS =~ /^MacOS$/i ) { $OS = 'MACINTOSH'; } elsif ( $OS =~ /os2/i ) { $OS = 'OS2'; } else { $OS = 'UNIX'; } } return $self->{'os'} = $OS; } sub ebcdic { my $self = shift; return $self->{'ebcdic'} if exists $self->{'ebcdic'}; $self->{'ebcdic'} = "\t" ne "\011" ? 1 : 0; if ( $self->{'ebcdic'} ) { # (ord('^') == 95) for codepage 1047 as on os390, vmesa my @A2E = ( 0, 1, 2, 3, 55, 45, 46, 47, 22, 5, 21, 11, 12, 13, 14, 15, 16, 17, 18, 19, 60, 61, 50, 38, 24, 25, 63, 39, 28, 29, 30, 31, 64, 90, 127, 123, 91, 108, 80, 125, 77, 93, 92, 78, 107, 96, 75, 97, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 122, 94, 76, 126, 110, 111, 124, 193, 194, 195, 196, 197, 198, 199, 200, 201, 209, 210, 211, 212, 213, 214, 215, 216, 217, 226, 227, 228, 229, 230, 231, 232, 233, 173, 224, 189, 95, 109, 121, 129, 130, 131, 132, 133, 134, 135, 136, 137, 145, 146, 147, 148, 149, 150, 151, 152, 153, 162, 163, 164, 165, 166, 167, 168, 169, 192, 79, 208, 161, 7, 32, 33, 34, 35, 36, 37, 6, 23, 40, 41, 42, 43, 44, 9, 10, 27, 48, 49, 26, 51, 52, 53, 54, 8, 56, 57, 58, 59, 4, 20, 62, 255, 65, 170, 74, 177, 159, 178, 106, 181, 187, 180, 154, 138, 176, 202, 175, 188, 144, 143, 234, 250, 190, 160, 182, 179, 157, 218, 155, 139, 183, 184, 185, 171, 100, 101, 98, 102, 99, 103, 158, 104, 116, 113, 114, 115, 120, 117, 118, 119, 172, 105, 237, 238, 235, 239, 236, 191, 128, 253, 254, 251, 252, 186, 174, 89, 68, 69, 66, 70, 67, 71, 156, 72, 84, 81, 82, 83, 88, 85, 86, 87, 140, 73, 205, 206, 203, 207, 204, 225, 112, 221, 222, 219, 220, 141, 142, 223 ); my @E2A = ( 0, 1, 2, 3, 156, 9, 134, 127, 151, 141, 142, 11, 12, 13, 14, 15, 16, 17, 18, 19, 157, 10, 8, 135, 24, 25, 146, 143, 28, 29, 30, 31, 128, 129, 130, 131, 132, 133, 23, 27, 136, 137, 138, 139, 140, 5, 6, 7, 144, 145, 22, 147, 148, 149, 150, 4, 152, 153, 154, 155, 20, 21, 158, 26, 32, 160, 226, 228, 224, 225, 227, 229, 231, 241, 162, 46, 60, 40, 43, 124, 38, 233, 234, 235, 232, 237, 238, 239, 236, 223, 33, 36, 42, 41, 59, 94, 45, 47, 194, 196, 192, 193, 195, 197, 199, 209, 166, 44, 37, 95, 62, 63, 248, 201, 202, 203, 200, 205, 206, 207, 204, 96, 58, 35, 64, 39, 61, 34, 216, 97, 98, 99, 100, 101, 102, 103, 104, 105, 171, 187, 240, 253, 254, 177, 176, 106, 107, 108, 109, 110, 111, 112, 113, 114, 170, 186, 230, 184, 198, 164, 181, 126, 115, 116, 117, 118, 119, 120, 121, 122, 161, 191, 208, 91, 222, 174, 172, 163, 165, 183, 169, 167, 182, 188, 189, 190, 221, 168, 175, 93, 180, 215, 123, 65, 66, 67, 68, 69, 70, 71, 72, 73, 173, 244, 246, 242, 243, 245, 125, 74, 75, 76, 77, 78, 79, 80, 81, 82, 185, 251, 252, 249, 250, 255, 92, 247, 83, 84, 85, 86, 87, 88, 89, 90, 178, 212, 214, 210, 211, 213, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 179, 219, 220, 217, 218, 159 ); if ( ord( '^' ) == 106 ) { # as in the BS2000 posix-bc coded character set $A2E[91] = 187; $A2E[92] = 188; $A2E[94] = 106; $A2E[96] = 74; $A2E[123] = 251; $A2E[125] = 253; $A2E[126] = 255; $A2E[159] = 95; $A2E[162] = 176; $A2E[166] = 208; $A2E[168] = 121; $A2E[172] = 186; $A2E[175] = 161; $A2E[217] = 224; $A2E[219] = 221; $A2E[221] = 173; $A2E[249] = 192; $E2A[74] = 96; $E2A[95] = 159; $E2A[106] = 94; $E2A[121] = 168; $E2A[161] = 175; $E2A[173] = 221; $E2A[176] = 162; $E2A[186] = 172; $E2A[187] = 91; $E2A[188] = 92; $E2A[192] = 249; $E2A[208] = 166; $E2A[221] = 219; $E2A[224] = 217; $E2A[251] = 123; $E2A[253] = 125; $E2A[255] = 126; } elsif ( ord( '^' ) == 176 ) { # as in codepage 037 on os400 $A2E[10] = 37; $A2E[91] = 186; $A2E[93] = 187; $A2E[94] = 176; $A2E[133] = 21; $A2E[168] = 189; $A2E[172] = 95; $A2E[221] = 173; $E2A[21] = 133; $E2A[37] = 10; $E2A[95] = 172; $E2A[173] = 221; $E2A[176] = 94; $E2A[186] = 91; $E2A[187] = 93; $E2A[189] = 168; } $self->{'a2e'} = \@A2E; $self->{'e2a'} = \@E2A; } } } 1; __END__ =head1 NAME CGI::Simple::Util - Internal utilities used by CGI::Simple module =head1 SYNOPSIS $escaped = escapeHTML('In HTML you need to escape < > " and & chars'); $unescaped = unescapeHTML('<>"&'); $url_encoded = escape($string); $decoded = unescape($url_encoded); =head1 DESCRIPTION CGI::Simple::Util contains essentially non public subroutines used by CGI::Simple. There are HTML and URL escape and unescape routines that may be of some use. An internal object is used to store a number of system specific details to enable the escape routines to be accurate. =head1 AUTHOR INFORMATION Original version copyright 1995-1998, Lincoln D. Stein. All rights reserved. Originally copyright 2001 Dr James Freeman Ejfreeman@tassie.net.auE This release by Andy Armstrong This library is free software; you can redistribute it and/or modify it under the same terms as Perl itself. Address bug reports and comments to: andy@hexten.net =head1 SEE ALSO L =cut