([^<>]*)
([^<>]*)
Autor:\s+(.*?)(?:, iDNES.cz)?
From 89ca70a15a92676350073237f862e90b567430d5 Mon Sep 17 00:00:00 2001 From: lace <> Date: Wed, 14 Jul 2010 11:13:17 +0000 Subject: [PATCH] current --- public_html/cgi-bin/idnes-foto | 19 +++++++++++++------ 1 file changed, 13 insertions(+), 6 deletions(-) diff --git a/public_html/cgi-bin/idnes-foto b/public_html/cgi-bin/idnes-foto index dfdbd96..2cd8e73 100755 --- a/public_html/cgi-bin/idnes-foto +++ b/public_html/cgi-bin/idnes-foto @@ -18,11 +18,13 @@ else { $BASE=$ARGV[0]; } +# Somehow Perl modules started reencoding windows-1250 -> utf-8. + if ($ENV{"GATEWAY_INTERFACE"}) { my $future=HTTP::Date::time2str(2000000000); my $past =HTTP::Date::time2str(1000000000); print <<"EOH"; -Content-type: text/html; charset=windows-1250 +Content-type: text/html; charset=utf-8 Cache-Control: public Expires: $future Last-Modified: $past @@ -32,14 +34,14 @@ EOH print <<"EOH";
([^<>]*)
}, $info=~m{}s, ) { next if !$text; + $text=~s/^\s+//s; + $text=~s/\s+$//s; + next if !$text; + $hit++; print <<"EOH" if !$seen_p_text{$text}++;$text
EOH } - warn "No text found: $infourl" if $text_last==keys(%seen_p_text); + warn "No text found: $infourl" if !$hit; } die $pageurl if !$did; $pageno++; -- 1.8.3.1