Perl,Code片段,代码实例,代码示例,代码片段库 - IT屋

Perl 疯狂的Perl代码

# A collection of independent Perl curiosities; each snippet between the
# separator lines is meant to be read (and run) on its own.

# Snippet 1: take the first command-line argument, turn every backslash
# into a forward slash, and print the result.
$_ = shift;
s/\\/\//g;
print;

################

# Snippet 2: echo every input line followed by a comma.  The match result
# (and its capture) is never used, so the whole line -- including its
# newline -- is what gets printed.
while(<>) {
   /^(\w+)/;
   print $_.',';
}

#############

# Snippet 3: an assignment is an expression, so this stores 5 in $_,
# compares the result with 5, and then prints $_.
if(($_ = 5)==5) {print;}

##############

# Snippet 4: ($x <=> 0) is 1 for a positive $x, while ($x=$x) evaluates to
# 7, so the comparison is false and 'false' is printed.
$x = 7;
if (($x <=> 0)==($x=$x)) {print 'true';}
else{print 'false';}

#######################

# Snippet 5: "or" binds more loosely than print's argument list, so die
# only runs when print itself reports failure.
print "Hello World" or die "trying";

######################

# Snippet 6: qw() accepts nested balanced parentheses, so the outer qw
# yields the single word 'qw(qw())', which is then handed to eval.
# NOTE(review): expected output is "qw()" -- confirm on the target perl.
print eval qw(qw(qw()));

Perl 计算给定目录中的目录条目

#!/usr/bin/perl
# Count the entries in the directories named on the command line (default:
# the current directory) and print the grand total.  Entries whose name
# starts with a dot -- including "." and ".." -- are not counted.
use strict;
use warnings;

my @dirs  = @ARGV ? @ARGV : ('.');
my $count = 0;    # start at 0 so that "nothing found" prints 0, not a blank line

for my $dir (@dirs) {
    opendir my $dh, $dir or die "$dir: $!\n";
    # defined() keeps an entry literally named "0" from ending the loop.
    while (defined(my $file = readdir $dh)) {
        ++$count unless $file =~ m:^\.:;
    }
    closedir $dh;
}
print "$count\n";
exit 0;

Perl 备份您自己的snipplr.com片段

#!/usr/bin/perl
# Back up your own snipplr.com snippets: fetch a session cookie, log in, then
# download the zip export into $backupdir/snipplr_backup.zip.
use strict;
use warnings;
use LWP::UserAgent;
my $silent = 0; # set to 1 for no output on stdout
my $logindata = {
    'username' => 'fill in your username',
    'password' => 'fill in your password',
};
my $loginurl = 'http://snipplr.com/login/';
my $backupurl = 'http://snipplr.com/zipbackup.php';
my $backupdir = '.';

my $ua = LWP::UserAgent->new;
$ua->cookie_jar({ file => "cookies.txt" });

print qq{get cookie from frontpage...} unless $silent;
my $frontpage = $ua->get('http://snipplr.com/'); #get cookie
die "could not fetch front page: " . $frontpage->status_line . "\n"
    unless $frontpage->is_success;
print qq{done.\n} unless $silent;

print qq{login as $$logindata{'username'}...} unless $silent;
my $loginresponse = $ua->post($loginurl, $logindata);
# A login form may legitimately answer with a redirect, so only 4xx/5xx
# responses are treated as fatal here.
die "login failed: " . $loginresponse->status_line . "\n"
    if $loginresponse->is_error;
print qq{done.\n} unless $silent;

print qq{exporting snipplr_backup.zip...} unless $silent;
my $backupfile = $ua->get($backupurl);
die "could not download backup: " . $backupfile->status_line . "\n"
    unless $backupfile->is_success;

# Write the archive only after a successful download, so an earlier backup
# is not replaced by an error page.
my $zipfile = "$backupdir/snipplr_backup.zip";
open my $out, '>', $zipfile or die "cannot open $zipfile for writing: $!\n";
binmode $out;
print {$out} $backupfile->content;
close $out or die "cannot finish writing $zipfile: $!\n";
print qq{done.\n} unless $silent;

Perl 使用XML::API::XHTML在命令行上生成XHTML

# Build a small XHTML document with XML::API::XHTML and pipe it through tidy,
# which writes the result to temp.html.
# The program is single-quoted so a POSIX shell does not expand $d before
# perl sees it.
perl -e 'use XML::API::XHTML; my $d = XML::API::XHTML->new(); $d->head_open(); $d->title("hello world!"); $d->script({type => "text/javascript"}, "/* hello scripts! */"); $d->head_close(); $d->body_open(); $d->h1({style => "color:red"}, "Hi nerd!"); print $d;'  | tidy -q -o temp.html

Perl 日期功能

sub date_mysql2sec {
#takes: date in "yyyy-mm-dd hh:mm:ss" format (with some freedom: any single
#       character may separate the fields)
#returns: date in seconds since 1970 format, interpreted in the local time
#         zone; nothing (undef / empty list) when the argument is missing or
#         does not look like a timestamp
    use Time::Local;# 'timelocal_nocheck';
    my $mysqldate = shift;
    return unless defined $mysqldate;
    # Take the fields straight from the match and bail out when it fails;
    # otherwise $1..$6 would still hold captures from some earlier regex.
    my ($year,$mon,$mday,$hour,$min,$sec) =
        $mysqldate =~ /(\d{4}).(\d{2}).(\d{2}).(\d{2}).(\d{2}).(\d{2})/
        or return;
    # timelocal() takes a 0-based month; a month of "00" is passed through as 0.
    if ($mon != 0) {$mon--};
    return timelocal($sec,$min,$hour,$mday,$mon,$year);
}

sub date_sec2mysql {
#takes: date in seconds since 1970 format
#returns: date in yyyy-mm-dd hh:mm:ss format (local time zone, every field
#         except the year zero-padded to two digits)
    my $secdate = shift;
    my ($sec,$min,$hour,$mday,$mon,$year) = localtime($secdate);
    # localtime() reports the year as an offset from 1900 and a 0-based month.
    return sprintf('%d-%02d-%02d %02d:%02d:%02d',
        $year + 1900, $mon + 1, $mday, $hour, $min, $sec);
}

sub date_mysql_now {
# Takes: no arguments
# Returns: the current moment, formatted by date_sec2mysql
#          (yyyy-mm-dd hh:mm:ss)
    my $now = time;
    return date_sec2mysql($now);
}

Perl 基于MySQL的功能

sub db_connect {
# Takes: $dbname, $dbuser, $dbpass
# Returns: whatever DBI->connect returns for the "DBI:mysql:$dbname" data
#          source; the result is not checked here, so callers must test it
    my ($dbname, $dbuser, $dbpass) = @_;
    my $dbh = DBI->connect("DBI:mysql:$dbname",$dbuser,$dbpass);
    #$dbh->do(qq{set character set 'utf8';});
    return $dbh;
}

sub do_sql {
# Takes: $dbh, $sql
# Returns: status (the return value of $dbh->do)
# Dies: when either argument is missing or false
    my $dbh = shift || die "Database not connected!\n";
    my $sql = shift || die "Missing SQL statement???\n";
    return $dbh->do($sql);
}

sub execute_sql {
# Takes: $dbh, $sql
# Returns: $result_arrayref (arrayref of hashrefs, as produced by
#          fetchall_arrayref({}))
# Dies: when an argument is missing or the statement cannot be prepared
    my $dbh = shift || die "Database not connected!\n";
    my $sql = shift || die "Missing SQL statement???\n";
    # Without this check a failed prepare would surface as a confusing
    # "can't call method execute on an undefined value".
    my $sth = $dbh->prepare($sql)
        or die "Could not prepare SQL statement!\n";
    $sth->execute;
    return $sth->fetchall_arrayref({}); # {} => Return arrayref of hashrefs
}

sub do_insert {
#takes: $dbh, $table, $datahash (hashref of column name => value)
#returns: status (whatever do_sql returns)
# NOTE: the table name, column names and values are pasted into the
# statement verbatim.  Values must therefore already be valid SQL literals
# (quoted and escaped by the caller) and must never come straight from
# untrusted input.
    my $dbh = shift || die "Database not connected!\n";
    my $table = shift || die "Missing table!\n";
    my $datahash = shift || die "Nothing to insert!\n";
    my @columns = keys %$datahash;
    # The hash slice keeps every value lined up with its column name.
    my $insert = "INSERT INTO $table (" . join(',', @columns)
               . ') VALUES (' . join(',', @$datahash{@columns}) . ');';
    return do_sql($dbh, $insert);
}

Perl 在多个文件夹中的文本文件中查找和替换字符串

# Replace target_string with replacement_string in every file below the
# current directory that contains it; perl keeps each original as "file~".
# File names are passed NUL-separated so paths with spaces or quotes survive.
grep -rl --null target_string . | xargs -0 perl -pi~ -e 's/target_string/replacement_string/g'

Perl 使用Perl正则表达式替换批量重命名文件

#!/usr/bin/env perl
use strict;
use warnings;

# Batch rename files with Perl regex substitutions
# Perl administration files rename
#
# Larry Wall's filename fixer: recipe 9.9 in Perl Cookbook 
#
# The first argument is a piece of Perl code that edits the file name held
# in $_; the remaining arguments (or, if there are none, the lines read from
# standard input) are the files to rename.

my $op = shift 
	or die "Usage: $0 expr [files]\n";
chomp(@ARGV = <STDIN>) unless @ARGV;
for (@ARGV) {
    my $was = $_;
    # The expression is supplied by the person running the script, so
    # evaluating it as code is the whole point of the tool.
    eval $op;
    die $@ if $@;
    next if $was eq $_;
    rename($was, $_) or warn "Cannot rename $was to $_: $!\n";
}

Perl 纽约时报报道RSS

#!/usr/bin/perl -w

use strict;
use LWP::Simple;
use HTML::TreeBuilder;
use LWP::Parallel::UserAgent;
use WWW::Mechanize;
use XML::TreeBuilder;
use Getopt::Long;
use HTTP::Cookies;
use Encode;

# Command-line options: the account used for the login form and the URL of
# the RSS feed whose items get expanded.
my $username;
my $password;
my $feedurl;

my $usage = "Usage: $0 --user=NAME --pass=PASSWORD --url=FEED_URL\n";

GetOptions(	"user=s"	=> \$username,
		"pass=s"	=> \$password,
		"url=s"		=> \$feedurl
) or die $usage;

# All three values are used unconditionally further down, so stop here rather
# than continue with undefined credentials or feed URL.
die $usage unless defined $username && defined $password && defined $feedurl;

# Log in through the site's login form; the cookie jar created here is shared
# with the user agents that download the articles afterwards.
print STDERR "Getting login page...\n";

my $cookiejar = HTTP::Cookies->new();

my $mech = WWW::Mechanize->new();

$mech->agent_alias('Linux Mozilla');
$mech->cookie_jar($cookiejar);

$mech->get("http://www.nytimes.com/auth/login");

my $loginresponse = $mech->submit_form(
	form_name	=>	'login',
	fields		=>	{
		USERID		=>	$username,
		PASSWORD	=>	$password
	}
);

# Treat a missing response the same as an unsuccessful one.
unless ($loginresponse && $loginresponse->is_success()) {
	die("Error logging in!\n");
}

print STDERR "Logged in successfully!\n";

# Parallel user agent for the article downloads; it reuses the cookie jar
# filled in by the login step.
my $pua = LWP::Parallel::UserAgent->new();
$pua->cookie_jar($cookiejar);
$pua->redirect(1);


print STDERR "Getting XML...\n";
my $xml = get($feedurl);
# LWP::Simple's get() returns undef on failure; parsing that would only fail
# later with a far less helpful message.
defined $xml or die "Could not download feed $feedurl\n";
my $feed = XML::TreeBuilder->new();
$feed->parse($xml);

# Maps each article URL (query string removed) to its <item> element.
my %entries;

print STDERR "Grabbing links...\n";

foreach my $item ($feed->look_down("_tag", "item")) {
	# An item without a <link> has nothing to download.
	my $linkelem = $item->look_down("_tag", "link") or next;
	my $link = $linkelem->as_text();
	$link =~ s/\?.*//;

	print STDERR "Registering $link...\n";

	my $request = HTTP::Request->new(GET => $link);
	$pua->register($request);

	$entries{$link} = $item;
}

# Download every registered article, strip the page furniture, and replace
# each feed item's <description> with the article's images and body text
# (following multi-page articles).  The rewritten feed is printed on stdout.
print STDERR "Downloading HTML...\n";
my $html = $pua->wait();

foreach my $entry (values(%$html)) {
	my $response = $entry->response();
	my $url = $response->base()->as_string();
	$url =~ s/\?.*//;

	print STDERR "Processing $url...\n";

	# The response's base URL may differ from the URL that was registered
	# (e.g. after a redirect); without a matching feed item, or without a
	# <description> in it, there is nothing to fill in.
	my $item = $entries{$url};
	my $description = $item ? $item->look_down("_tag", "description") : undef;
	unless ($description) {
		print STDERR "No feed description for $url, skipping...\n";
		next;
	}

	my $articlehtml = HTML::TreeBuilder->new_from_content(
		decode_utf8($response->content())
	);

	if (my $redirelem = $articlehtml->look_down("_tag", "meta", "http-equiv", "refresh")) {
		print STDERR "Interstitial ad detected, skipping...\n";
		my $content = $redirelem->attr_get_i("content");
		$content = '' unless defined $content;

		# Greedy capture: a trailing non-greedy (.*?) would always match
		# the empty string.
		my ($target) = ($content =~ m/url=(.*)/);
		my $newurl = "http://www.nytimes.com" . (defined $target ? $target : '');

		# NOTE: the redirect target is only reported; processing continues
		# with the page that was actually downloaded.
		print STDERR "Redirect URL is $newurl...\n";
	}


	# Let's clean this up for Liferea, shall we?
	my $messyelement;

	foreach ($articlehtml->look_down("_tag", "div", "class", "enlargeThis")) {
		$_->delete();
	}
	if ($messyelement = $articlehtml->look_down("_tag", "div", "class", "nextArticleLink")) {
		$messyelement->delete();
	}

	$description->delete_content();

	foreach ($articlehtml->look_down("_tag", "div", "class", "image")) {
		$description->push_content($_->as_HTML());
	}

	if ($messyelement = $articlehtml->look_down("_tag", "div", "id", "articleInline")) {
		$messyelement->delete();
	}

	my %pages;	# response for each follow-up page, keyed by its base URL
	my @pages;	# follow-up page URLs in the order the links appear
	my $pageua = LWP::Parallel::UserAgent->new();
	$pageua->cookie_jar($cookiejar);

	if (my $pageelem = $articlehtml->look_down("_tag", "div", "id", "pageLinks")) {
		print STDERR "Multiple pages detected...\n";

		foreach ($pageelem->look_down("_tag", "a", "title", qr/^Page/)) {
			my $pageurl = "http://www.nytimes.com" . $_->attr_get_i("href");
			print STDERR "Registering $pageurl...\n";

			push(@pages, $pageurl);
			$pageua->register(HTTP::Request->new(GET => $pageurl));
		}

		print STDERR "Downloading pages...\n";

		$pageelem->delete();
	}

	foreach ($articlehtml->look_down("_tag", "div", "id", "articlebody")) {
		$description->push_content($_->as_HTML());
	}

	# Everything needed from the first page has been copied out as HTML
	# text, so the parsed tree can be released.
	$articlehtml->delete();

	my $htmlpages = $pageua->wait();

	if ($htmlpages) {
		print STDERR "Sorting pages...\n";
		foreach (values(%$htmlpages)) {
			my $pageresponse = $_->response();
			my $responseurl = $pageresponse->base()->as_string();

			$pages{$responseurl} = $pageresponse;
		}

		foreach my $pageurl (@pages) {
			print STDERR "Processing $pageurl...\n";

			# A page whose download failed or was redirected elsewhere
			# has no entry under the URL that was registered.
			my $pageresponse = $pages{$pageurl};
			unless ($pageresponse) {
				print STDERR "No response for $pageurl, skipping...\n";
				next;
			}

			my $pagehtml = HTML::TreeBuilder->new_from_content(
				decode_utf8($pageresponse->content())
			);

			# Let's clean this up for Liferea, shall we?

			if ($messyelement = $pagehtml->look_down("_tag", "div", "class", "enlargeThis")) {
				$messyelement->delete();
			}
			if ($messyelement = $pagehtml->look_down("_tag", "div", "class", "nextArticleLink")) {
				$messyelement->delete();
			}

			foreach ($pagehtml->look_down("_tag", "div", "class", "image")) {
				$description->push_content($_->as_HTML());
			}
		
			if ($messyelement = $pagehtml->look_down("_tag", "div", "id", "articleInline")) {
				$messyelement->delete();
			}

			if ($messyelement = $pagehtml->look_down("_tag", "div", "id", "pageLinks")) {
				$messyelement->delete();
			}

			foreach ($pagehtml->look_down("_tag", "div", "id", "articlebody")) {
				my $content = $_->as_HTML();
				$content =~ s/\(Page \d+ of \d+\)//g;
				$description->push_content($content);
			}

			$pagehtml->delete();
		}
	}
}

print $feed->as_XML();

Perl 将“Get Your War On”漫画抓取为RSS

#!/usr/bin/perl
# Scrape the "Get Your War On" site and print an RSS/RDF feed on stdout with
# one <item> per comic image found on the selected page.

use strict;
use warnings;
use HTML::Entities;
use LWP::Simple;

# print a feed header
print "<?xml version=\"1.0\" encoding=\"ISO-8859-1\"?>\n".
	"<rdf:RDF\n".
	"xmlns:rdf=\"http://www.w3.org/1999/02/22-rdf-syntax-ns#\"\n".
	"xmlns:content=\"http://purl.org/rss/1.0/modules/content/\"\n".
	"xmlns=\"http://my.netscape.com/rdf/simple/0.9/\">\n".
	"<channel>\n".
	"  <title>Get Your War On</title>\n".
	"  <link>http://www.mnftiu.cc/mnftiu.cc/war.html</link>\n".
	"  <description>A webcomic about our 9/11 epilogue.</description>\n".
	"</channel>\n\n";

# get() returns undef on failure.  Falling back to an empty page keeps the
# output a well-formed (if empty) feed, since the header is already printed.
my $html_string = get ("http://www.mnftiu.cc/mnftiu.cc/war.html");
unless (defined $html_string) {
	warn "Could not fetch the index page\n";
	$html_string = '';
}

# The page to scrape is numbered "count of numbered warN.html links on the
# index, plus two".
my $i = 2;

while ($html_string =~ m{<a href="war\d{1,2}\.html">\d{1,2}</a>}g)
{
	$i++
}

my $url = "http://www.mnftiu.cc/mnftiu.cc/war" . $i . ".html";

$html_string = get ($url);
unless (defined $html_string) {
	warn "Could not fetch $url\n";
	$html_string = '';
}

while ($html_string =~ m{<img src="images/gywo\.(.*?)\.gif" border=0>}g)
{
	# Escape XML-significant characters so an unusual image name cannot
	# break the feed; ordinary names pass through unchanged.
	my $name = encode_entities($1, '<>&');

	print	"<item>\n".
		"<title>" . $name . "</title>\n".
	 	"<link>" . $url . "</link>\n".
		"<description>&lt;img src=\"http://www.mnftiu.cc/mnftiu.cc/images/gywo." . $name . ".gif\"&gt;</description>\n";

	print "</item>\n\n";
}

print "</rdf:RDF>\n";