|
#!/usr/bin/env perl |
|
# Taken from "There are too many ways to do it" presentation |
|
# http://www.shlomifish.org/lecture/Perl/Lightning/Too-Many-Ways/slides/ |
|
# |
|
# The problem |
|
# |
|
# <sniperd> looking to write a regex that strips out all periods, except for |
|
# the last one. ie, i have a string named perl.is.the.best.txt and I just |
|
# want perlisthebest.txt |
|
# |
|
# - Freenode's #perl. |
|
# |
|
use strict; |
|
use warnings; |
|
use Benchmark 'cmpthese'; |
|
|
|
sub test { |
|
$_[0]->('hello.world.txt'); |
|
$_[0]->('hello-there'); |
|
$_[0]->('hello..too.pl'); |
|
$_[0]->('magna..carta'); |
|
$_[0]->('the-more-the-merrier.jpg'); |
|
$_[0]->('hello.'); |
|
$_[0]->('perl.txt.'); |
|
$_[0]->('.yes'); |
|
$_[0]->('.yes.txt'); |
|
} |
|
|
|
sub via_split { |
|
my $s = shift; |
|
my @components = split /\./, $s, -1; |
|
|
|
return $s if @components == 1; |
|
|
|
my $last = pop @components; |
|
return join( '', @components ) . '.' . $last; |
|
} |
|
|
|
sub sexeger { |
|
my $s = shift; |
|
$s = reverse $s; |
|
|
|
my $c = 0; |
|
$s =~ s!\.!($c++)?'':'.'!ge; |
|
|
|
return reverse $s; |
|
} |
|
|
|
sub two_parts { |
|
my $s = shift; |
|
if ( $s =~ /^(.*)\.([^\.]*)$/ ) { |
|
my ( $l, $r ) = ( $1, $2 ); |
|
$l =~ tr/.//d; |
|
return "$l.$r"; |
|
} |
|
else { |
|
return $s; |
|
} |
|
} |
|
|
|
sub look_ahead { |
|
my $s = shift; |
|
$s =~ s/\.(?=.*\.)//g; |
|
return $s; |
|
} |
|
|
|
sub count_and_replace { |
|
my $s = shift; |
|
my $count = ( my @a = ($s =~ /\./g) ); |
|
$s =~ s/\./(--$count)?'':'.'/ge; |
|
return $s; |
|
} |
|
|
|
sub elim_last { |
|
my $s = shift; |
|
my $non_occur = "\x{1}" . ( "\0" x length $s ) . "\x{1}"; |
|
$s =~ s/\.([^\.]*)$/$non_occur$1/; |
|
$s =~ tr/.//d; |
|
$s =~ s!$non_occur!.!; |
|
return $s; |
|
} |
|
|
|
sub rindex01 { |
|
my $s = shift; |
|
substr( $s, 0, rindex( $s, '.' ) ) =~ tr/.//d; |
|
return $s; |
|
} |
|
|
|
sub recursive_perl { |
|
my @chars = split //, shift; |
|
|
|
my $recurse; |
|
$recurse = sub { |
|
return '', 0 unless scalar @_; |
|
|
|
my $head = shift @_; |
|
my ( $processed_string, $was_period_found ) = $recurse->( @_ ); |
|
if ( $was_period_found ) { |
|
return ( $head eq '.' ? '' : $head ) . $processed_string, 1; |
|
} |
|
else { |
|
return $head . $processed_string, $head eq '.'; |
|
} |
|
}; |
|
|
|
return ( $recurse->( @chars ) )[0]; |
|
} |
|
|
|
sub delpoint1 { |
|
local $_ = shift; |
|
|
|
my $old = $_; |
|
while ( /\./ ) { |
|
$old = $_; |
|
s/\.//; |
|
} |
|
|
|
return $old; |
|
} |
|
|
|
sub delpoint2 { |
|
local $_ = shift; |
|
while ( s/\.(.*\.)/$1/ ) {} |
|
return $_; |
|
} |
|
|
|
sub delpoint8 { |
|
local $_ = shift; |
|
|
|
my @parts = split /(\.)/; |
|
my %hash; |
|
for my $i ( 0..$#parts ) { |
|
push @{ $hash{$parts[$i]} }, $i; |
|
} |
|
|
|
if ( exists $hash{'.'} ) { |
|
$hash{'.'} = [ @{ $hash{'.'} }[-1] ]; |
|
} |
|
|
|
my %sort; |
|
for my $key ( %hash ) { |
|
for my $number ( @{$hash{$key}} ) { |
|
$sort{$number} = $key; |
|
} |
|
} |
|
|
|
$_ = ''; |
|
for my $number ( sort { $a <=> $b } keys %sort ) { |
|
$_ .= $sort{$number}; |
|
} |
|
|
|
return $_; |
|
} |
|
|
|
sub pack01 { |
|
my @c = unpack 'c*', $_[0]; |
|
my @p = grep( $c[$_] == 46, 0..$#c ); |
|
pop @p; |
|
while ( defined ( my $c = pop @p ) ) { |
|
splice @c, $c, 1; |
|
} |
|
return pack 'c*', @c; |
|
} |
|
|
|
cmpthese( 1000000, { |
|
'via_split' => sub { test( \&via_split ) }, |
|
'sexeger' => sub { test( \&sexeger ) }, |
|
'two_parts' => sub { test( \&two_parts ) }, |
|
'look_ahead' => sub { test( \&look_ahead ) }, |
|
'count_and_replace' => sub { test( \&count_and_replace ) }, |
|
'elim_last' => sub { test( \&elim_last ) }, |
|
'rindex01' => sub { test( \&rindex01 ) }, |
|
# Recursive would eat all the memory and would be the slowest one anyway. |
|
# Trust me on this ;) |
|
#'recursive_perl' => sub { test( \&recursive_perl ) }, |
|
'delpoint1' => sub { test( \&delpoint1 ) }, |
|
'delpoint2' => sub { test( \&delpoint2 ) }, |
|
'delpoint8' => sub { test( \&delpoint8 ) }, |
|
'pack01' => sub { test( \&pack01 ) }, |
|
}); |