Fixed some (Linux kernel?) compatibility problem of flock(1) of a directory.
[MyWeb.git] / Web.pm
1 # $Id$
2 # Common functions for HTML/XHTML output generation
3 # Copyright (C) 2003-2005 Jan Kratochvil <project-www.jankratochvil.net@jankratochvil.net>
4
5 # This program is free software; you can redistribute it and/or modify
6 # it under the terms of the GNU General Public License as published by
7 # the Free Software Foundation; exactly version 2 of June 1991 is required
8
9 # This program is distributed in the hope that it will be useful,
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12 # GNU General Public License for more details.
13
14 # You should have received a copy of the GNU General Public License
15 # along with this program; if not, write to the Free Software
16 # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
17
18
19 package My::Web;
20 require 5.6.0;  # at least 'use warnings;' but we need some 5.6.0+ modules anyway
21 our $VERSION=do { my @r=(q$Revision$=~/\d+/g); sprintf "%d.".("%03d"x$#r),@r; };
22 our $CVS_ID=q$Id$;
23 use strict;
24 use warnings;
25
26 use Exporter;
27 sub Wrequire($%);
28 sub Wuse($@);
29 our $W;
30 our @EXPORT=qw(
31                 &Wrequire &Wuse
32                 &path_web &path_abs_disk
33                 &uri_escaped
34                 &a_href &a_href_cc &text_cc
35                 &vskip
36                 &img &centerimg &rightimg &leftimg
37                 $W
38                 &input_hidden_persistents
39                 &escapeHTML
40                 &form_method
41                 );
42 our @ISA=qw(Tie::Handle Exporter);
43
44 my %packages_used_hash; # $packages_used_hash{$W->{"__PACKAGE__"}}{"_done"}=1;
45 my %packages_used_array;
46
47 BEGIN
48 {
49         use Carp qw(cluck confess);
50         $W->{"__My::Web_init"}=1;
51
52         # $args{"first"}=1
53         sub Wrequire ($%)
54         {
55         my($file,%args)=@_;
56
57 #               print STDERR "Wrequire $file\n";
58                 $file=~s#/#::#g;
59                 $file=~s/[.]pm$//;
60                 my $class=$file;
61                 $file=~s#::#/#g;
62                 $file.=".pm";
63                 my %callers;
64                 for (my $depth=0;defined caller($depth);$depth++) {
65                         $callers{caller($depth)}=1;
66                         }
67                 my $selfpkg=__PACKAGE__;
68                 $callers{$selfpkg}=1;
69                 for my $target ($class,__PACKAGE__) {
70                         for my $caller (keys(%callers)) {
71                                 next if $packages_used_hash{$caller}{$target}++;
72                                 cluck "Appending to the '_done' package list: caller=$caller,target=$target"
73                                                 if $packages_used_hash{$caller}{"_done"};
74                                 if ($args{"first"}) {
75                                         unshift @{$packages_used_array{$caller}},$target;
76                                         }
77                                 else {
78                                         push @{$packages_used_array{$caller}},$target;
79                                         }
80                                 }
81                         }
82                 eval { CORE::require "$file"; } or confess $@;
83                 1;      # Otherwise 'require' would already file above.
84         }
85
86         sub Wuse ($@)
87         {
88         my($file,@list)=@_;
89
90 #               print STDERR "Wuse $file\n";
91                 Wrequire $file;
92                 local $Exporter::ExportLevel=$Exporter::ExportLevel+1;
93                 $file->import(@list);
94                 1;
95         }
96
97         sub import
98         {
99         my($class,@rest)=@_;
100
101                 local $Exporter::ExportLevel=$Exporter::ExportLevel+1;
102                 Wrequire("$class");
103                 return $class->SUPER::import(@rest);
104         }
105 }
106
107 use WebConfig;  # see also below: Wuse 'WebConfig';
108 require Image::Size;    # for &imgsize
109 use File::Basename;     # &basename
110 use Carp qw(cluck confess);
111 use URI::Escape;
112 require HTTP::BrowserDetect;
113 require HTTP::Negotiate;
114 our $have_Geo_IP; BEGIN { $have_Geo_IP=eval { require Geo::IP; 1; }; }
115 # Do not: use ModPerl::Util qw(exit);
116 # to prevent in mod_perl2: "exit" is not exported by the ModPerl::Util module
117 # I do not know why.
118 use POSIX qw(strftime);
119 use Tie::Handle;
120 use Apache2::Const qw(HTTP_MOVED_TEMPORARILY OK HTTP_OK);
121 use URI;
122 use URI::QueryParam;
123 use Cwd;
124 require HTTP::Date;
125 require Storable;
126 require Digest::MD5;
127 require Data::Compare;
128 use Data::Dumper;
129 require Encode;
130 use Apache2::RequestUtil;
131 use Apache2::Filter;
132 use Apache2::Connection;
133 require MIME::Base64;
134 use Apache2::ServerUtil;
135 require MIME::Types;
136 require MIME::Parser;
137 use Apache2::RequestRec;
138 use Apache2::RequestIO;
139 use Apache2::Response;
140
141
142 #our $W;
143
144 sub init ($%)
145 {
146 my($class,%args)=@_;
147
148         print STDERR "$class->init ".Apache2::RequestUtil->request()->unparsed_uri()."\n";
149
150         # We need to track package dependencies, so we need to call it from &init.
151         # We cannot do it in BEGIN { } block
152         # as it would not be tracked for each of the toplevel users later.
153         Wuse 'WebConfig';
154         Wrequire 'My::Hash';
155
156         # $W={} can get somehow created very easily.
157         # Do not: cluck "W not empty:\n".Dumper($W) if keys(%$W);
158         # to prevent (of $W->{"headers_in"}): TODO: Enumeration may not be expected.
159         cluck "W not empty; __PACKAGE__ was: ".$W->{"__PACKAGE__"} if keys(%$W);
160         $W=My::Hash->new({},"My::Hash::Sub","My::Hash::Push");
161         bless $W,$class;
162         %$W=(
163                 "__PACKAGE__"=>scalar(caller()),
164                 %WebConfig,
165                 %args,  # override %WebConfig settings
166                 );
167
168         # {"__PACKAGE__"} is mandatory for mod_perl-2.0;
169         # $Apache2::Registry::curstash is no longer supported.
170         do { cluck "No $_" if !$W->{$_}; } for "__PACKAGE__";
171         exit_hook_start();
172         # Package dependencies tracking only:
173         Wrequire $W->{"__PACKAGE__"},"first"=>1;
174
175         do { $W->{$_}=0  if !defined $W->{$_}; } for "detect_ent";
176         do { $W->{$_}=0  if !defined $W->{$_}; } for "detect_js";
177         do { $W->{$_}=1  if !defined $W->{$_}; } for "have_css";        # AFAIK it does not hurt anyone.
178         do { $W->{$_}=0  if !defined $W->{$_}; } for "css_inherit";
179         do { $W->{$_}=1  if !defined $W->{$_}; } for "footer";
180         do { $W->{$_}=1  if !defined $W->{$_}; } for "footer_delimit";
181         do { $W->{$_}=1  if !defined $W->{$_}; } for "footer_ids";
182         do { $W->{$_}=1  if !defined $W->{$_}; } for "indexme";
183         do { $W->{$_}="" if !defined $W->{$_}; } for "body_attr";
184         do { $W->{$_}="en-US" if !defined $W->{$_}; } for "language";
185
186         my $footer_any=0;
187         for (qw(footer_ids)) {
188                 $W->{$_}=0 if !$W->{"footer"};
189                 $footer_any=1 if $W->{$_};
190                 }
191         $W->{"footer"}=0 if !$footer_any;
192         $W->{"footer_delimit"}=0 if !$W->{"footer"};
193
194         $W->{"r"}=Apache2::RequestUtil->request();
195
196         $W->{"r"}->push_handlers("PerlCleanupHandler"=>\&cleanup);
197
198         $W->{"web_hostname"}||=$W->{"r"}->hostname();
199
200         tie *STDOUT,$W->{"r"};
201         select *STDOUT;
202         $|=1;
203
204         $W->{"headers_in"}=$W->{"r"}->headers_in();
205         Wrequire 'My::Hash::Merge';
206         $W->{"headers_in"}=My::Hash::Merge->new(
207                         $W->{"headers_in"},
208                         My::Hash::Sub->new({
209                                 "_remote_ip"=>sub { return $W->{"r"}->connection()->remote_ip(); },
210                                 }),
211                         );
212         Wrequire 'My::Hash::Readonly';
213         $W->{"headers_in"}=My::Hash::Readonly->new($W->{"headers_in"});
214         
215         if ($W->{"r"}->method() eq "GET" || $W->{"r"}->method() eq "HEAD") {
216                 for (\$W->{"http_safe"}) {
217                         # Do not: # Extend the current ETag system instead if you would need it:
218                         #         cluck "Explicitely NOT HTTP-Safe for method \"".$W->{"r"}->method()."\"?!?"
219                         #                       if defined($$_) && !$$_;
220                         # as sometimes it just does not make sense to cache it.
221                         $$_=1 if !defined $$_;
222                         }
223                 }
224         else {
225                 for (\$W->{"http_safe"}) {
226                         cluck "Undefined HTTP-Safe-ty for method \"".$W->{"r"}->method()."\"!"
227                                         if !defined($$_);
228                         $$_=0 if !defined $$_;
229                         }
230                 }
231         # Used only if: $W->{"http_safe"}
232         # but we would cause on different method(): Appending to the '_done' package list
233         Wrequire 'My::Hash::RecordKeys';
234         if ($W->{"http_safe"}) {
235                 $W->{"headers_in_RecordKeys"}=My::Hash::RecordKeys->new($W->{"headers_in"});
236                 $W->{"headers_in"}=$W->{"headers_in_RecordKeys"};
237                 }
238
239         {
240                 local $_=$W->{"r"}->args() || "";
241                 if ($W->{"detect_ent"}) {
242                                  if (/[&]amp;have_ent/)
243                                 { $W->{"have_ent"}=0; }
244                         elsif (    /[&]have_ent/)
245                                 { $W->{"have_ent"}=1; }
246                         else
247                                 { delete $W->{"have_ent"}; }
248                         if (!defined $W->{"have_ent"} && $W->{"r"}->method() eq "GET") {
249                                 $W->{"head_push"}='<meta http-equiv="Refresh" content="0; URL='
250                                                 .escapeHTML("http://".$W->{"web_hostname"}."/".($W->{"r"}->uri()=~m#^/*(.*)$#)[0]
251                                                                 ."?".($_ || "detect_ent_glue=1").'&have_ent=detect')
252                                                 .'" />'."\n";
253                                 }
254                         }
255                 s/([&])amp;/$1/g;
256                 $W->{"r"}->args($_);
257                 }
258
259         $W->{"args"}=URI->new("?".$W->{"r"}->args())->query_form_hash();
260         $W->merge_post_args() if $W->{"r"}->method() eq "POST";
261         # Prepare '$args' first to (FIXME: Why?) prevent: Not a reference
262         my $args=$W->{"args"};
263         $W->{"args_orig"}=Storable::dclone($args);
264
265         $W->{"browser"}=sub {
266                 # Lazy-evaluation, we may not need the "User-Agent" header at all.
267                 return our $r||=HTTP::BrowserDetect->new($W->{"headers_in"}{"User-Agent"});
268                 };
269
270         if (!defined $W->{"have_style"}) {
271                 $W->{"have_style"}=sub {
272                         # Lazy-evaluation, we may not need the "User-Agent" header at all.
273                         return our $r||=(!$W->{"browser"}->netscape() || ($W->{"browser"}->major() && $W->{"browser"}->major()>4) ? 1 : 0);
274                         };
275                 }
276
277         $W->{"have_js"}=($W->{"args"}{"have_js"} ? 1 : 0);
278         if ($W->{"detect_js"} && !$W->{"have_js"}) {
279                 # Do not: <script />
280                 # as at least Lynx inhibits any further HTML output.
281                 # Do not: text/javascript
282                 # as it does not look as registered, at least according to: MIME::Types $VERSION 1.15
283                 # "application/javascript" so far standardized till 2005-12-08 by:
284                 #       http://www.ietf.org/internet-drafts/draft-hoehrmann-script-types-03.txt
285                 $W->{"head_push"}='<script type="application/javascript" src="'.uri_escaped(path_web('/My/HaveJS.pm')).'"></script>'."\n";
286                 }
287
288         # Required by &_args_check below.
289         $W->{"_init_done"}=1;
290
291         do { _args_check(%$_) if $_; } for $W->{"args_check"};
292
293         return $W;
294 }
295
296 sub form_method($)
297 {
298 my($method)=@_;
299
300         my $r=q{method="}.$method.q{"};
301         return $r." ".q{enctype="application/x-www-form-urlencoded" accept-charset="us-ascii utf-8"} if $method eq "post";
302         return $r." ".                                            q{accept-charset="us-ascii utf-8"} if $method eq "get";
303         cluck "Undefined method: $method";
304         return $r;
305 }
306
307 sub merge_post_args($)
308 {
309 my($class)=@_;
310
311         my @post_args=$class->read_post_args();
312         while (@post_args) {
313                 my $name=shift @post_args;
314                 my $data=shift @post_args;
315                 my $ref=\$W->{"args"}{$name};
316                    if (!defined $$ref)       { $$ref=$data; }
317                 elsif (!ref $$ref)           { $$ref=[$$ref,$data]; }
318                 elsif ("ARRAY" eq ref $$ref) { push @$$ref,$data; }
319                 else {
320                         cluck "Ignoring POST argument \"$name\", orig is weird:\n",Dumper($$ref);
321                         }
322                 }
323         return;
324 }
325
326 # Do not: use CGI;
327 # as CGI parsing of POST vs. QUERY_STRING data, multiple-valued keys etc.
328 # is too dense and causes weird problems, together with mod_perl etc.
329 sub read_post_args($)
330 {
331 my($class)=@_;
332
333         local $_=$class->http_headers_in_for("Content-type")->content_type();
334         return $class->read_multipart_form_data() if $_ eq "multipart/form-data";
335         return $class->read_application_x_www_form_urlencoded() if $_ eq "application/x-www-form-urlencoded";
336         cluck "Unknown POST data body, ignored: $_";
337         return;
338 }
339
340 sub read_application_x_www_form_urlencoded($)
341 {
342 my($class)=@_;
343
344         my $body="";
345         for (;;) {
346                 my $got=$W->{"r"}->read(my($buf),0x1000);
347                 # Do not: cluck "Error reading POST data: $!" if !defined $got;
348                 # as it should be done using: APR::Error exceptions
349                 last if !$got;
350                 $body.=$buf;
351                 }
352         return URI->new("?".$body)->query_form();
353 }
354
355 sub read_multipart_form_data($)
356 {
357 my($class)=@_;
358
359         my $parser=MIME::Parser->new();
360         # FIXME: No unlink()s done!
361         $parser->output_under("/tmp");
362
363         local *R_FH;
364         tie *R_FH,$W->{"r"};
365         local *FH;
366         tie *FH,"My::Web::ReadMerged",
367                         join("",map(($_.": ".$W->{"headers_in"}{$_}."\n"),qw(
368                                         Content-type
369                                         )))."\n",
370                         \*R_FH;
371         my $body=$parser->parse(\*FH);
372         cluck "No multipart POST request body?" if !$body->is_multipart();
373
374         return map((
375                         $_->head()->mime_attr("content-disposition.name")
376                         =>
377                         join("",@{$_->body()})
378                         ),$body->parts());
379
380         # TODO: Globalize, make it IO::* compatible, split to the merging part + IO::Scalar.
381         package My::Web::ReadMerged;
382
383         require Tie::Handle;
384         require Exporter;
385         our @ISA=qw(Tie::Handle Exporter);
386         use Carp qw(cluck confess);
387
388         sub READLINE($)
389         {
390         my($self)=@_;
391
392                 confess "Slurp not yet implemented" if !defined $/;
393                 # Apache2::RequestIO does not support 'READLINE'!
394                 for (;;) {
395                         if (defined $self->{"data"} && $self->{"data"}=~s{^.*\Q$/\E}{}) {
396                                 $self->{"offset"}+=length $&;
397                                 return $&;
398                                 }
399                         my $fh_orig=$self->{"fh_orig"};
400                         if (!$fh_orig) {
401                                 my $r=$self->{"data"};
402                                 delete $self->{"data"};
403                                 $self->{"offset"}+=length $r if defined $r;
404                                 return $r;
405                                 }
406                         my $got=read $fh_orig,my($buf),0x1000;
407                         cluck "Error reading POST data: $!" if !defined $got;
408                         delete $self->{"fh_orig"} if !$got;
409                         cluck "INTERNAL: fh_orig should not exist here" if !defined $self->{"data"};
410                         $self->{"data"}.=$buf;
411                         }
412         }
413
414         sub TELL($)
415         {
416         my($self)=@_;
417
418                 return $self->{"offset"};
419         }
420
421         sub TIEHANDLE($$$)
422         {
423         my($class,$data,$fh_orig)=@_;
424
425                 my $self=bless {},$class;
426                 $self->{"data"}=$data;
427                 $self->{"offset"}=0;
428                 $self->{"fh_orig"}=$fh_orig;
429                 return $self;
430         }
431 }
432
433 sub cleanup($)
434 {
435 my($apache_request)=@_;
436
437         cluck "CORE::GLOBAL::exit hook not ran" if !$W->{"_exit_done"};
438         cluck "packages not finalized" if !$packages_used_hash{$W->{"__PACKAGE__"}}{"_done"};
439         cache_finish();
440         # Sanity protection.
441         $W=undef();
442         exit_hook_stop();
443         return OK;
444 }
445
446 # PerlResponseHandler is RUN_FIRST and &ModPerl::Util::exit returns OK, so no (sane) go.
447 # PerlLogHandler is already too late to be able to produce any output.
448 my $exit_orig;
449 sub exit_hook
450 {
451         cluck "Missing ->init while in exit_hook()" if !$W->{"_init_done"};
452         # &footer will call us recursively!
453         footer() if !$W->{"_exit_done"}++;
454         return &{$exit_orig}(@_);
455 }
456 sub exit_hook_start
457 {
458         do { cluck "exit_hook_start() twice?"; return; } if defined $exit_orig;
459         $exit_orig=\&CORE::GLOBAL::exit;
460         # Prevent: Subroutine CORE::GLOBAL::exit redefined
461         no warnings 'redefine';
462         *CORE::GLOBAL::exit=\&exit_hook;
463 }
464 sub exit_hook_stop
465 {
466         do { cluck "exit_hook_stop() without exit_hook_start()?"; return; }
467                         if \&exit_hook ne \&CORE::GLOBAL::exit;
468         do { cluck "INTERNAL: exit_orig uninitialized"; return; }
469                         if !$exit_orig;
470         # Prevent: Subroutine CORE::GLOBAL::exit redefined
471         no warnings 'redefine';
472         *CORE::GLOBAL::exit=$exit_orig;
473         $exit_orig=undef();
474 }
475
476 # Be aware other parts of code (non-My::Web) will NOT use this function!
477 # Do not: Wprint $W->{"heading"},"undef"=>1;
478 # as we would need to undef() it to turn it off and it would get defaulted in such case.
479 # Do not: exists $W->{"heading"}
480 # as we use a lot of 'for $W->{"heading"}' which instantiates it with the value: undef()
481 sub Wprint($%)
482 {
483 my($text,%args)=@_;
484
485         cluck "undef Wprint" if !defined $text && !$args{"undef"};
486         delete $args{"undef"};
487         cluck join(" ","Invalid arguments:",keys(%args)) if keys(%args);
488         return if !defined $text;
489         # Do not: cluck "utf-8 untested" if Encode::is_utf8($text);
490         # as it is valid here.
491         $W->{"r"}->puts($text);
492 }
493
494 sub request_check(;$)
495 {
496 my($self)=@_;
497
498         # Use &eval to prevent: Global $r object is not available. Set:\n\tPerlOptions +GlobalRequest\nin ...
499         confess "Calling sensitive dynamic code from a static code" if !eval { Apache2::RequestUtil->request(); };
500         # Do not: confess "Calling sensitive dynamic code without My::Web::init" if !$W->{"__PACKAGE__"};
501         # as it is valid at least while preparing arguments to call: &project::Lib::init
502 }
503
504 # Do not: use CGI;
505 # as it is too much backward compatible regarding the charset encodings etc.
506 # and the resulting code is too dense with no additional functionality for the recent content.
507 sub escapeHTML($)
508 {
509 my($text)=@_;
510
511         local $_=$text;
512         s{&}{&amp;}gso;
513         s{<}{&lt;}gso;
514         s{>}{&gt;}gso;
515         s{"}{&quot;}gso;
516         return $_;
517 }
518
519 # /home/user/www/webdir
520 sub dir_top_abs_disk()
521 {
522         our $dir_top_abs_disk;
523         if (!$dir_top_abs_disk) {
524                 my $selfpkg_relpath=__PACKAGE__;
525                 $selfpkg_relpath=~s{::}{/}g;
526                 $selfpkg_relpath.=".pm";
527                 my $selfpkg_abspath=$INC{$selfpkg_relpath} or do {
528                         cluck "Unable to find self package $selfpkg_relpath";
529                         return;
530                         };
531                 $selfpkg_abspath=~s{/*\Q$selfpkg_relpath\E$}{} or do {
532                         cluck "Unable to strip myself \"$selfpkg_relpath\" from the abspath: $selfpkg_abspath";
533                         return;
534                         };
535                 cluck "INC{myself} is relative?: $selfpkg_abspath" if $selfpkg_abspath!~m{^/};
536                 $dir_top_abs_disk=$selfpkg_abspath;
537                 }
538         return $dir_top_abs_disk;
539 }
540
541 sub unparsed_uri()
542 {
543         request_check();
544         if (!$W->{"unparsed_uri"}) {
545                 # Do not: $W->{"r"}
546                 # as we may be called before &init from: &My::Project::init
547                 my $r=Apache2::RequestUtil->request();
548                 cluck "Calling ".'&unparsed_uri'." from a static code, going to fail" if !$r;
549                 my $uri_string=$r->unparsed_uri() or cluck "Valid 'r' missing unparsed_uri()?";
550                 my $uri=URI->new_abs($uri_string,"http://".$W->{"web_hostname"}."/");
551                 $W->{"unparsed_uri"}=$uri;
552                 }
553         return $W->{"unparsed_uri"};
554 }
555
556 sub in_to_uri_abs($)
557 {
558 my($in)=@_;
559
560         # Otherwise we may have been already processed and thus legally relativized.
561         # FIXME data: Currently disabled, all the data are too violating such rule.
562         if (0 && !ref $in) {
563                 my $uri_check=URI->new($in);
564                 $uri_check->scheme() || $in=~m{^\Q./\E} || $in=~m{^/}
565                                 or cluck "Use './' or '/' prefix for all the local references: $in";
566                 }
567         my $uri=URI->new_abs($in,unparsed_uri());
568         $uri=$uri->canonical();
569         return $uri;
570 }
571
572 # $args{"uri_as_in"}=1 to permit passing URI objects as: $in
573 # $args{"abs"}=0 || 1;  # overrides: $W->{"args"}{"Wabs"}
574 sub path_web($%)
575 {
576 my($in,%args)=@_;
577
578         cluck if !$args{"uri_as_in"} && ref $in;
579         my $uri=in_to_uri_abs($in);
580         if (uri_is_local($uri)) {
581                 # Prefer the $uri values over "args_persistent" values.
582                 # &query_form_hash comes from: URI::QueryParam
583                 $uri->query_form_hash({
584                                 map({
585                                         my $key=$_;
586                                         my $val=$W->{"args"}{$key};
587                                         (!defined $val ? () : ($key=>$val));
588                                         } keys(%{$W->{"args_persistent"}})),
589                                 %{$uri->query_form_hash()},
590                                 });
591                 }
592         my $abs;
593         do { $abs=$_ if defined; } for $W->{"args"}{"Wabs"},$args{"abs"};
594         return $uri->abs(unparsed_uri()) if $abs;
595         return $uri->rel(unparsed_uri());
596 }
597
598 sub path_abs_disk_register($)
599 {
600 my($path_abs_disk)=@_;
601
602         $W->{"path_abs_disk_register"}{$path_abs_disk}=1;
603 }
604
605 # $args{"uri_as_in"}=1 to permit passing URI objects as: $in
606 sub path_abs_disk($%)
607 {
608 my($in,%args)=@_;
609
610         cluck if !$args{"uri_as_in"} && ref $in;
611         my $uri=in_to_uri_abs($in);
612         cluck if !uri_is_local($uri);
613         my $path=$uri->path();
614         cluck "URI compatibility: ->path() not w/leading slash of URI \"$uri\"; path: $path" if $path!~m{^/};
615         my $r=dir_top_abs_disk().$path;
616         path_abs_disk_register $r if !defined $args{"register"} || $args{"register"};
617         return $r;
618 }
619
620 sub fatal (;$);
621
622 sub _args_check (%)
623 {
624 my(%tmpl)=@_;
625
626         while (my($name,$regex)=each(%tmpl)) {
627                 my $name_html="Parameter <span class=\"quote\">".escapeHTML($name)."</span>";
628                 $W->{"args"}{$name}="" if !defined $W->{"args"}{$name};
629                 $W->{"args"}{$name}=[ $W->{"args"}{$name} ] if !ref $W->{"args"}{$name} && ref $regex;
630                 fatal "$name_html passed as multivar although singlevar expected"
631                                 if ref $W->{"args"}{$name} && !ref $regex;
632                 $regex=$regex->[0] if ref $regex;
633                 for my $val (!ref $W->{"args"}{$name} ? $W->{"args"}{$name} : @{$W->{"args"}{$name}}) {
634                         $val="" if !defined $val;
635                         fatal "$name_html <span class=\"quote\">".escapeHTML($val)."</span>"
636                                                         ." does not match the required regex <span class=\"quote\">".escapeHTML($regex)."</span> "
637                                         if $regex ne "" && $val!~/$regex/;
638                         }
639                 }
640 }
641
642 sub vskip (;$)
643 {
644 my($height)=@_;
645
646         return '<p'.(!defined $height ? "" : ' style="height: '.$height.';"').'>&nbsp;</p>'."\n";
647 }
648
649 sub fatal (;$)
650 {
651 my($msg)=@_;
652
653         $msg="UNKNOWN" if !$msg;
654         cluck "FATAL: $msg";
655
656         # Do not send it unconditionally.
657         # The intial duplicated '<?xml...' crashes Gecko parser.
658         $W->{"heading_done"}=0 if $W->{"header_only"};
659         # Do not send it unconditionally.
660         # Prevents warn: Headers already sent
661         if (!$W->{"heading_done"}) {
662                 $W->{"indexme"}=0;      # For the case no heading was sent yet.
663                 $W->{"header_only"}=0;  # assurance for &heading
664                 $W->{"content_type"}="text/html";       # Force HTML and avoid strictly checked XHTML.
665                 My::Web->heading();
666                 }
667         Wprint "\n".vskip("3ex")."<hr /><h1 class=\"error\">FATAL ERROR: $msg!</h1>\n"
668                         ."<p>You can report this problem's details to"
669                         ." ".a_href("mailto:".$W->{"admin_mail"},"admin of this website").".</p>\n";
670         exit;
671 }
672
673 sub footer_packages_used_comments()
674 {
675         my $packages_used=$packages_used_array{$W->{"__PACKAGE__"}};
676         for my $package (@$packages_used) {
677                 my $cvs_id=(eval('$'.$package."::CVS_ID")
678 #                               || $package     # debug
679                                 );
680                 Wprint '<!-- '.$package.' - $'.$cvs_id.'$ -->'."\n" if $cvs_id;
681                 }
682 }
683
684 sub footer()
685 {
686         cluck 'Explicit &footer call is deprecated, !_exit_dne' if !$W->{"_exit_done"};
687         exit if $W->{"footer_done"}++;  # deadlock prevention:
688         &{$_}() for reverse @{$W->{"footer_sub_push"}};
689         if ($W->{"header_only"}) {
690                 $packages_used_hash{$W->{"__PACKAGE__"}}{"_done"}=1;
691                 exit;
692                 }
693
694         Wprint vskip if $W->{"footer_delimit"};
695         &{$_}() for reverse @{$W->{"footing_delimit_sub_push"}};
696         Wprint "<hr />\n" if $W->{"footer"};
697
698         # Never update the package list while we examine it!
699         $packages_used_hash{$W->{"__PACKAGE__"}}{"_done"}=1;
700
701         # Dump the whole packages stack or just the primary one?
702         #my $packages_used=$packages_used_array{$W->{"__PACKAGE__"}};
703         my $packages_used=[$W->{"__PACKAGE__"}];
704
705         if ($W->{"footer_ids"}) {
706                 Wprint '<p class="cvs-id">';
707                 Wprint join("<br />\n",map({ my $package=$_;
708                         my $cvs_id=(eval('$'.$package."::CVS_ID")
709 #                                       || $package     # debug
710                                         );
711                         if (!$cvs_id) {
712                                 ();
713                                 }
714                         else {
715                                 $cvs_id='$'.$cvs_id.'$';        # Eaten by 'q' operator.
716                                 my @cvs_id_split=split / +/,$cvs_id;
717                                 if (@cvs_id_split==8) {
718                                         my $file=$package;
719                                         $file=~s#::#/#g;
720                                         my $ext;
721                                         my @tried;
722                                         for (qw(.pm)) {
723                                                 $ext=$_;
724                                                 my $path_abs_disk=path_abs_disk("/$file$ext");
725                                                 push @tried,$path_abs_disk;
726                                                 last if -r $path_abs_disk;
727                                                 cluck "Class file $file not found; tried: ".join(" ",@tried) if !$ext;
728                                                 }
729                                         $file.=$ext;
730                                         my $viewcvs;
731                                         if ((my $file_cvs=$file)=~s{^My/}{}) {
732                                                 $viewcvs=$W->{"viewcvs_My"}.$file_cvs;
733                                                 }
734                                         else {
735                                                 $viewcvs=$W->{"viewcvs"}.$file;
736                                                 }
737                                         $cvs_id_split[2]=""
738                                                         .a_href((map({ my $s=$_; $s=~s#/viewcvs/#$&~checkout~/#; $s; } $viewcvs))[0]."?rev=".$cvs_id_split[2],
739                                                                         $cvs_id_split[2]);
740                                         $cvs_id_split[1]=a_href($viewcvs,($package!~/^Apache2::/ ? $package : $cvs_id_split[1]));
741                                         $cvs_id_split[5]=&{$W->{"cvs_id_author_sub"}}($cvs_id_split[5]);
742                                         }
743                                 join " ",@cvs_id_split;
744                                 }
745                         } @$packages_used));
746                 Wprint "</p>\n";
747                 }
748
749         footer_packages_used_comments();
750
751         do { Wprint $_ if $_; } for $W->{"footing"};
752
753         Wprint "</body></html>\n";
754         exit;
755 }
756
757 # Existing entries are overwritten.
758 sub header(%)
759 {
760 my(%pairs)=@_;
761
762         while (my($key,$val)=each(%pairs)) {
763                 do { cluck "Headers already sent"; next; } if $W->{"heading_done"};
764                 $W->{"r"}->headers_out()->set($key,$val);
765                 }
766 }
767
768 sub size_display ($)
769 {
770 my($size)=@_;
771
772            if ($size<4096)
773                 {}
774         elsif ($size<1024*1024)
775                 { $size=sprintf "%.1fK",$size/1024; }
776         else
777                 { $size=sprintf "%.1fM",$size/1024/1024; }
778         $size.="B";
779         return $size;
780 }
781
782 sub uri_is_local($)
783 {
784 my($in)=@_;
785
786         my $uri_rel=in_to_uri_abs($in)->rel(unparsed_uri());
787         # Do not: defined $uri_rel->("userinfo"|"host"|"port")();
788         # as they fail to be called for schemes not supporting them.
789         return 0 if $uri_rel->scheme();
790         return 0 if $uri_rel->authority();
791         return 1;
792 }
793
794 # &path_web still may be required for &uri_escaped !
795 sub uri_escaped($)
796 {
797 my($uri)=@_;
798
799         cluck if !ref $uri;
800         my $urient=escapeHTML($uri);
801         return $uri    if $uri eq $urient;
802         request_check();
803         return $urient if uri_is_local $uri;
804         return $uri    if defined $W->{"have_ent"} && !$W->{"have_ent"};        # non-ent client
805         return $urient if $W->{"have_ent"};     # ent client
806         # Unknown client, &escapeHTML should not be needed here:
807         return escapeHTML(path_web('/My/Redirect.pm?location='.uri_escape($uri->abs(unparsed_uri()))));
808 }
809
810 our $a_href_inhibited;
811 sub a_href($;$%)
812 {
813 my($in,$contents,%args)=@_;
814
815         request_check();
816         do { $$_=1 if !defined $$_; } for (\$args{"size"});
817         if (!defined $contents) {
818                 $contents=$in;
819                 $contents=File::Basename::basename($contents) if $args{"basename"};
820                 $contents=~s/^mailto:([-.\w]+(?:@|\Q(at)\E)[-.\w]+)$/$1/;
821                 $contents=escapeHTML($contents);
822                 }
823         $contents=~s#<a\b[^>]*>##gi;
824         $contents=~s#</a>##gi;
825         return $contents if $a_href_inhibited;
826
827         my $path_web=path_web $in,%args;
828         my $r="";
829         $r.='<a href="';
830         $r.=uri_escaped $path_web;
831         $r.='"';
832         do { $r.=" $_" if $_; } for ($args{"attr"});
833         $r.='>'.$contents.'</a>';
834         my $size_in=$in;
835         do { $size_in=$_ if $_ && !/^\d+$/; } for $args{"size"};
836         if ($args{"size"} && uri_is_local($size_in)
837                         && (($args{"size"} && $args{"size"}=~/^\d+$/ && $args{"size"}>=2)
838                                         || $size_in=~/[.](?:gz|Z|rpm|zip|deb|lha)/)) {  # Downloadable?
839                 my $path_abs_disk=path_abs_disk $size_in,%args;
840                 cluck "File not readable: $path_abs_disk" if !-r $path_abs_disk;
841                 $r.='&nbsp;('.size_display((stat($path_abs_disk))[7]).')';
842                 }
843         return $r;
844 }
845
846 sub a_href_inhibit($$;@)
847 {
848 my($self,$sub,@sub_args)=@_;
849
850         local $a_href_inhibited=1;
851         return &{$sub}(@sub_args);
852 }
853
854 sub input_hidden_persistents()
855 {
856         request_check();
857         return join("",map({
858                 my $key=$_;
859                 my $val=$W->{"args"}{$key};
860                 (!defined $val ? () : '<input type="hidden"'
861                                 .' name="'.escapeHTML($key).'"'
862                                 .' value="'.escapeHTML($val).'"'
863                                 .' />'."\n");
864                 } (keys(%{$W->{"args_persistent"}}))));
865 }
866
867 sub http_moved($$;$)
868 {
869 my($self,$url,$status)=@_;
870
871         $url=path_web($url,"abs"=>1);
872         $status||=HTTP_MOVED_TEMPORARILY;
873         $W->{"r"}->status($status);
874         $W->{"r"}->headers_out()->{"Location"}=$url;
875         $W->{"header_only"}=1;
876         $W->{"content_type"}=0;
877         $W->{"charset"}=0;
878         My::Web->heading();
879         exit;
880         die "NOTREACHED";
881 }
882
883 sub remote_ip ()
884 {
885         # Do not: PerlModule                 Apache2::ForwardedFor
886         #         PerlPostReadRequestHandler Apache2::ForwardedFor
887         # As 'Apache2::ForwardedFor' takes the first of $ENV{"HTTP_X_FORWARDED_FOR"}
888         # while the contents is '127.0.0.1, 213.220.195.171' if client has its own proxy.
889         # We must take the last item ourselves.
890         # Be VERY sure you always retrieve all the headers unconditionally to hit: My::Hash::RecordKeys
891         my $x_forwarded_for=$W->{"headers_in"}{"X-Forwarded-For"};
892         $x_forwarded_for=~s/^.*,\s*// if $x_forwarded_for;
893         my $remote_ip=$W->{"headers_in"}{"_remote_ip"};
894         my $r;
895         $r||=$x_forwarded_for;
896         $r||=$remote_ip;
897         return $r;
898 }
899
900 sub _cc()
901 {
902         my $r;
903         $r||=Geo::IP->new()->country_code_by_addr(remote_ip()) if $have_Geo_IP;
904         $r||="";
905         return $r;
906 }
907
908 # $url={"JP"=>"http://specific",...};
909 # $url={""=>"http://default",...};
910 sub a_href_cc($$;%)
911 {
912 my($url,$contents,%args)=@_;
913
914         # A bit ineffective but we must process all the possibilities to get stable 'headers_in' hits!
915         my %map=map(($_=>a_href($url->{$_},$contents,%args)),keys(%$url));
916         my $r;
917         $r||=$map{_cc()};
918         $r||=$map{""};
919         return $r if $r;
920         return $contents;
921 }
922
923 # $tree={"JP"=>"specific",...};
924 # $tree={""=>"default",...};
925 sub text_cc($)
926 {
927 my($tree)=@_;
928
929         cluck if !$tree->{""};
930         my $r;
931         $r||=$tree->{_cc()};
932         $r||=$tree->{""};
933         return $r;
934 }
935
936 sub make ($)
937 {
938 my($cmd)=@_;
939
940         # FIXME: &alarm, --timeout is now infinite.
941         # FIXME: Try to remove bash(1).
942         # FIXME: Use: @PATH_FLOCK@
943         # Do not: dir_top_abs_disk(),
944         # to prevent: flock: cannot open lock file /home/lace/www/www.jankratochvil.net: Is a directory
945         my @argv=('flock',dir_top_abs_disk()."/WebConfig.pm",'bash','-c',$cmd.' >&2');
946         print STDERR join(" ","SPAWN:",@argv)."\n";
947         system @argv;
948 }
949
950 sub make_file($$)
951 {
952 my($self,$file)=@_;
953
954         cluck "Pathname not absolute: $file" if $file!~m{^/};
955         return if -f $file;
956         # TODO: Somehow quickly check dependencies?
957         return make('make -s --no-print-directory'
958                                         .' -C '."'".File::Basename::dirname($file)."' '".File::Basename::basename($file)."'");
959 }
960
961 sub img_size ($$)
962 {
963 my($width,$height)=@_;
964
965         cluck if !defined $width || !defined $height;
966         return ($W->{"have_style"} ? "style=\"border:0;width:${width}px;height:${height}px\"" : "border=\"0\"")
967                         ." width=\"$width\" height=\"$height\"";
968 }
969
970 sub negotiate_variant (%)
971 {
972 my(%args)=@_;
973
974         my @fields=("id","qs","content-type","encoding","charset","lang","size");
975         return [ map(($args{$_}),@fields) ];
976 }
977
978 # Returns: 'HTTP::Headers' instance.
979 sub http_headers_in_for($@)
980 {
981 my($self,@headers)=@_;
982
983         # Limit these entries to generate proper 'Vary' header.
984         return HTTP::Headers->new(map(($_=>$W->{"headers_in"}{$_}),@headers));
985 }
986
987 # Input: $self is required!
988 # Input: Put the fallback variant as the first one.
989 # Returns: always only scalar!
990 sub Negotiate_choose($$)
991 {
992 my($self,$variants)=@_;
993
994         my $best=HTTP::Negotiate::choose($variants,
995                         # Do not: $W->{"r"}
996                         # to prevent: Can't locate object method "scan" via package "Apache2::RequestRec" at HTTP/Negotiate.pm line 84.
997                         # Do not: $W->{"r"}->headers_in()
998                         # to prevent: Can't locate object method "scan" via package "APR::Table" at HTTP/Negotiate.pm line 84.
999                         # Do not: HTTP::Headers->new($W->{"r"}->headers_in());
1000                         # to prevent empty result or even: Odd number of elements in anonymous hash
1001                         $self->http_headers_in_for(qw(
1002                                         Accept
1003                                         Accept-Charset
1004                                         Accept-Encoding
1005                                         Accept-Language
1006                                         )));
1007         $best||=$variants->[0][0];      # $variants->[0]{"id"}; &HTTP::Negotiate::choose failed?
1008         return $best;
1009 }
1010
1011 # FIXME: Use for "content-type": MIME::Types
1012 my @img_variants=(
1013         { "id"=>"svg","qs"=>0.9,"content-type"=>"image/svg+xml" },
1014         { "id"=>"png","qs"=>0.8,"content-type"=>"image/png" },
1015         { "id"=>"gif","qs"=>0.7,"content-type"=>"image/gif" },
1016         # Do not prefer these to avoid fedding them for '*/*' browsers.
1017         { "id"=>"dia","qs"=>0.6,"content-type"=>"application/x-dia-diagram" },
1018         { "id"=>"fig","qs"=>0.6,"content-type"=>"image/x-xfig" },
1019         { "id"=>"fig","qs"=>0.6,"content-type"=>"application/x-xfig" },
1020         { "id"=>"sxd","qs"=>0.6,"content-type"=>"application/vnd.sun.xml.draw" },
1021         { "id"=>"sxi","qs"=>0.6,"content-type"=>"application/vnd.sun.xml.impress" },
1022         );
1023 # Unsupported by Image::Size 2.992: sxd sxi dia
1024 #   Supported by Image::Size 2.992: fig png gif jpeg
1025 #   Expensive by Image::Size 2.992: svg
1026 my %img_map=(
1027         "svg" =>[qw(png gif)],  # svg
1028         "png" =>[qw(png gif)],
1029         "jpeg"=>[qw(jpeg)],
1030         "dia" =>[qw(png gif)],  # svg
1031         "fig" =>[qw(fig png gif)],
1032         "sxd" =>[qw(png gif)],
1033         "sxi" =>[qw(png gif)],
1034         );
1035
1036 # Returns: ($path_web,$path_abs_disk)
1037 # URI path segments support ignored here. Where it is used? (';' path segment options)
1038 sub _img_src($%)
1039 {
1040 my($in,%args)=@_;
1041
1042         cluck if !uri_is_local $in;
1043         my $uri=in_to_uri_abs $in;
1044         my $path_abs_disk=path_abs_disk $uri,%args,"uri_as_in"=>1,"register"=>0;
1045
1046         cluck "Not exists image path_abs_disk: $path_abs_disk" if !-r $path_abs_disk;
1047         my($path_abs_disk_base,$ext_orig)=($path_abs_disk=~/^(.*)[.](\w+)$/) or cluck;
1048         my $map_arrayref=$img_map{$ext_orig} or cluck;
1049
1050         my $ext=$ext_orig;
1051         if (1!=@$map_arrayref) {
1052                 my @nego_variants;
1053                 for my $ext (@$map_arrayref) {
1054                         my $path_abs_disk_variant=$path_abs_disk_base.".".$ext;
1055                         path_abs_disk_register($path_abs_disk_variant);
1056                         __PACKAGE__->make_file($path_abs_disk_variant);
1057                         for my $var (@img_variants) {
1058                                 next if $var->{"id"} ne $ext;
1059                                 push @nego_variants,negotiate_variant(
1060                                                 %$var,
1061                                                 "size"=>(stat $path_abs_disk_variant)[7],
1062                                                 );
1063                                 }
1064                         }
1065                 $ext=__PACKAGE__->Negotiate_choose(\@nego_variants);
1066                 }
1067
1068         my $uri_path=$uri->path();
1069         $uri_path=~s/\Q.$ext_orig\E$/.$ext/ or cluck;
1070         $uri->path($uri_path);
1071         return path_web($uri,%args,"uri_as_in"=>1),path_abs_disk($uri,%args,"uri_as_in"=>1);
1072 }
1073
1074 # $args{"attr"}
1075 sub img ($$%)
1076 {
1077 my($in,$alt,%args)=@_;
1078
1079         request_check();
1080         my($path_web,$path_abs_disk)=_img_src($in,%args);
1081         my($width,$height)=Image::Size::imgsize($path_abs_disk);
1082         $alt=~s/<[^>]*>//g;
1083         $alt=escapeHTML($alt);
1084         my $content="<img src=\"".uri_escaped($path_web)."\" alt=\"$alt\" title=\"$alt\" ".img_size($width,$height)
1085                         .(!$args{"attr"} ? "" : " ".$args{"attr"})." />";
1086         do { return a_href((_img_src($_))[0],$content,"uri_as_in"=>1) if $_; } for $args{"a_href_img"};
1087         do { return a_href $_,$content if $_; } for $args{"a_href"};
1088         return $content;
1089 }
1090
1091 sub centerimg
1092 {
1093         my $r="";
1094         $r.='<table border="0" width="100%"><tr>'."\n";
1095         @_=( [@_] ) if !ref $_[0];
1096         for (@_) {
1097                 $r.="\t".'<td align="center">'.&{\&img}(@$_).'</td>'."\n";
1098                 }
1099         $r.='</tr></table>'."\n";
1100         return $r;
1101 }
1102
1103 # Optional: Provide 'text' as 1==@args_img item.
1104 sub rightimg
1105 {
1106 my($text,@args_img)=@_;
1107
1108         # FIXME: Workaround bug of 'Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1)':
1109         #        <col width="@{[ (!$W->{"browser"}->ie() ? "1*" : "90%" ) ]}" />
1110         #        <col width="@{[ (!$W->{"browser"}->ie() ? "0*" : "10%" ) ]}" />
1111         # causes whole invisible projects in: Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.7.10) Gecko/20050719 Galeon/1.3.21
1112         return <<"HERE";
1113 <table border="0" width="100%" class="textimg">
1114         <tr>
1115                 <td align="left">
1116                         @{[ $text ]}
1117                 </td>
1118                 <td>&nbsp;&nbsp;</td>
1119                 <td align="right">
1120                         @{[ 1==@args_img ? $args_img[0] : &{\&img}(@args_img) ]}
1121                 </td>
1122         </tr>
1123 </table>
1124 HERE
1125 }
1126
1127 # Optional: Provide 'text' as 1==@args_img item.
1128 sub leftimg
1129 {
1130 my($text,@args_img)=@_;
1131
1132         # FIXME: Workaround bug of 'Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1)':
1133         #        <col width="@{[ (!$W->{"browser"}->ie() ? "0*" : "10%" ) ]}" />
1134         #        <col width="@{[ (!$W->{"browser"}->ie() ? "1*" : "90%" ) ]}" />
1135         # causes whole invisible projects in: Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.7.10) Gecko/20050719 Galeon/1.3.21
1136         return <<"HERE";
1137 <table border="0" width="100%">
1138         <tr>
1139                 <td align="center">
1140                         @{[ 1==@args_img ? $args_img[0] : &{\&img}(@args_img) ]}
1141                 </td>
1142                 <td>&nbsp;&nbsp;</td>
1143                 <td align="left">
1144                         @{[ $text ]}
1145                 </td>
1146         </tr>
1147 </table>
1148 HERE
1149 }
1150
1151 sub readfile($$)
1152 {
1153 my($class,$filename)=@_;
1154
1155         local *F;
1156         open F,$filename or cluck "Cannot open \"$filename\": $!";
1157         my $F=do { local $/=undef(); <F>; };
1158         close F or cluck "Cannot close \"$filename\": $!";
1159         return $F;
1160 }
1161
1162 sub _no_cache($)
1163 {
1164 my($self)=@_;
1165
1166         header("Expires"=>HTTP::Date::time2str(1000000000));    # date in the past
1167         header("Last-Modified"=>HTTP::Date::time2str());        # always modified
1168         header("Cache-Control"=>join(", ",
1169                         "no-cache",
1170                         "no-store",
1171                         "must-revalidate",
1172                         "max-age=0",
1173                         "pre-check=0",  # MSIE
1174                         "post-check=0", # MSIE
1175                         ));     # HTTP/1.1
1176         header("Pragma"=>"no-cache");   # HTTP/1.0
1177         header("Vary"=>"*");    # content may ba based on unpredictable sources
1178 }
1179
1180 sub headers_in_filtered(@)
1181 {
1182 my(@keys)=@_;
1183
1184         return map(($_=>$W->{"headers_in"}{$_}),@keys);
1185 }
1186
1187 our %uri_args_frozen_to_headers_in_keys;
1188 our %uri_args_headers_in_frozen_to_headers_out;
1189
1190 sub uri_args_headers_in_frozen_get($)
1191 {
1192 my($headers_in_keys_arrayref)=@_;
1193
1194         my %uri_args_headers_in_hash=(
1195                 "uri_args_frozen"=>$W->{"uri_args_frozen"},
1196                 "headers_in"=>{ headers_in_filtered(@$headers_in_keys_arrayref) },
1197                 );
1198         return do { local $Storable::canonical=1; Storable::freeze(\%uri_args_headers_in_hash); };
1199 }
1200
1201 sub cache_output_filter($)
1202 {
1203 my($f)=@_;
1204
1205         while ($f->read(my $text,0x400)) {
1206                 cluck "utf-8 untested" if Encode::is_utf8($text);       # Possible here at all?
1207                 $f->print($text);
1208                 $W->{"digest-md5"}->add($text);
1209                 }
1210         return OK;
1211 }
1212
1213 sub cache_start()
1214 {
1215         # Used only if: !$W->{"http_safe"}
1216         # but we would cause on different method(): Appending to the '_done' package list
1217         # &Wrequire it here even if it will not be later used; to be stable!
1218         Wrequire 'My::Hash::RestrictTo';
1219         if (!$W->{"http_safe"}) {
1220                 __PACKAGE__->_no_cache();
1221                 return;
1222                 }
1223
1224         {
1225                 my %uri_args_hash=(
1226                         "method"=>$W->{"r"}->method(),
1227                         "uri"=>"http://".$W->{"web_hostname"}."/".$W->{"r"}->uri(),
1228                         "args"=>$W->{"args_orig"},
1229                         );
1230                 $W->{"uri_args_frozen"}=do { local $Storable::canonical=1; Storable::freeze(\%uri_args_hash); };
1231                 last if !(my $headers_in_keys_arrayref=$uri_args_frozen_to_headers_in_keys{$W->{"uri_args_frozen"}});
1232
1233                 # Protection to be sure we are stable:
1234                 $W->{"headers_in"}=My::Hash::RestrictTo->new($W->{"headers_in"},@$headers_in_keys_arrayref);
1235
1236                 $W->{"uri_args_headers_in_frozen"}=uri_args_headers_in_frozen_get($headers_in_keys_arrayref);
1237                 last if !(my $headers_out_hashref=$uri_args_headers_in_frozen_to_headers_out{$W->{"uri_args_headers_in_frozen"}});
1238                 header(%$headers_out_hashref);
1239                 my $status;
1240                 {
1241                         # &meets_conditions will always deny the attempt if !2xx status().
1242                         # At least ap_read_request() sets: r->status=HTTP_REQUEST_TIME_OUT;     /* Until we get a request */
1243                         my $status_old=$W->{"r"}->status();
1244                         $W->{"r"}->status(HTTP_OK);
1245                         # Update httpd's 'r->mtime' as the header "Last-Modified" is just not enough for ap_meets_conditions():
1246                         # &update_mtime() argument is really in _secs_, not in _msecs_ as the docs claim.
1247                         # Be aware '*1000000' would overflow Perl integer anyway.
1248                         # &set_last_modified would also override the "Last-Modified" headers_out!
1249                         # &mtime may exist but somehow does not work.
1250                         $W->{"r"}->update_mtime(HTTP::Date::str2time($headers_out_hashref->{"Last-Modified"}));
1251                         $status=$W->{"r"}->meets_conditions();
1252                         $W->{"r"}->status($status_old);
1253                         }
1254                 last if OK==$status;
1255                 $W->{"r"}->status($status);
1256                 $W->{"header_only"}=1;  # Inhibit &footer output.
1257                 exit;
1258                 die "NOTREACHED";
1259                 }
1260
1261         $W->{"digest-md5"}=Digest::MD5->new();
1262         $W->{"cache_active"}=1;
1263         $W->{"r"}->add_output_filter(\&cache_output_filter);
1264 }
1265
1266 sub cache_finish_last_modified()
1267 {
1268         cluck "Not yet done now? W __PACKAGE__: ".$W->{"__PACKAGE__"}
1269                         if !$packages_used_hash{$W->{"__PACKAGE__"}}{"_done"};
1270         for my $package_orig (@{$packages_used_array{$W->{"__PACKAGE__"}}}) {
1271                 local $_=$package_orig.".pm";
1272                 s{::}{/}g;
1273                 path_abs_disk "/$_","register"=>1;
1274                 }
1275         my $mtime_newest;
1276         for my $path_abs_disk (keys(%{$W->{"path_abs_disk_register"}})) {
1277                 my $mtime=(stat $path_abs_disk)[9];
1278                 do { cluck "No mtime for: $path_abs_disk"; next; } if !$mtime;
1279                 $mtime_newest=$mtime if !$mtime_newest || $mtime_newest<$mtime;
1280                 }
1281         cluck "No mtime_newest found for the current W __PACKAGE__: ".$W->{"__PACKAGE__"}
1282                         if !$mtime_newest;
1283         return HTTP::Date::time2str($mtime_newest);
1284 }
1285
1286
1287 sub cache_finish()
1288 {
1289         # Do not: return if !$W->{"uri_args_frozen"};
1290         # as we may have just gave 304 and 'exit;' without starting the caching.
1291         return if !$W->{"cache_active"};
1292
1293         # Headers may not be complete in this case; not sure, just trying.
1294         return if $W->{"r"}->connection()->aborted();
1295
1296         # Fill-in/check: %uri_args_frozen_to_headers_in_keys
1297         my $headers_in_keys_stored_arrayref_ref=\$uri_args_frozen_to_headers_in_keys{$W->{"uri_args_frozen"}};
1298         my @headers_in_keys=tied(%{$W->{"headers_in_RecordKeys"}})->accessed();
1299         if (!$$headers_in_keys_stored_arrayref_ref
1300                         || !Data::Compare::Compare(\@headers_in_keys,$$headers_in_keys_stored_arrayref_ref)) {
1301                 cluck "Non-matching generated 'headers_in_keys' per 'uri_args_frozen' key:\n"
1302                                                 .Dumper(\@headers_in_keys,$$headers_in_keys_stored_arrayref_ref)
1303                                 if $$headers_in_keys_stored_arrayref_ref;
1304                 # Build or possibly prevent such further warn dupes:
1305                 $$headers_in_keys_stored_arrayref_ref=\@headers_in_keys;
1306                 # Build or regenerate as obsoleted now:
1307                 $W->{"uri_args_headers_in_frozen"}=uri_args_headers_in_frozen_get(\@headers_in_keys);
1308                 }
1309
1310         # Prepare 'headers_out' for the future reusal:
1311         my %headers_out;
1312         # Do not: $W->{"digest-md5"}->b64digest();
1313         # as it will not provide the trailing filling '='s.
1314         # RFC 1864 is not clear if they should be there but its sample provides them.
1315         # Do not try to provide canonical "\r\n" form of newlines as is said by RFC 1864.
1316         # RFC 2068 (HTTP/1.1) section 14.16 says the newlines should NOT be converted for HTTP.
1317         # ',""' to avoid breaking the headers by its default "\n".
1318         $headers_out{"Content-MD5"}=MIME::Base64::encode_base64($W->{"digest-md5"}->digest(),"");
1319         # In fact we could also use MD5 for ETag as if we know ETag we also know MD5.
1320         # But this way we do not need to calculate MD5 and we still can provide such ETag. So.
1321         # $W->{"r"}->set_etag() ?
1322         $headers_out{"ETag"}='"'.Digest::MD5::md5_base64($W->{"uri_args_headers_in_frozen"}).'"';
1323         # $W->{"r"}->set_content_length() ?
1324         $headers_out{"Content-Length"}=$W->{"r"}->bytes_sent();
1325         my %Vary=map(($_=>1),(@headers_in_keys));
1326         for (keys(%Vary)) {
1327                 next if !/^_/;
1328                 $Vary{"*"}=1;
1329                 delete $Vary{$_};
1330                 }
1331         %Vary=("*"=>1) if $Vary{"*"};
1332         $headers_out{"Vary"}=join(", ",sort keys(%Vary)) if keys(%Vary);
1333         # $W->{"r"}->set_last_modified() ?
1334         $headers_out{"Last-Modified"}=cache_finish_last_modified();
1335
1336         # Fill-in/check: %uri_args_headers_in_frozen_to_headers_out
1337         my $headers_out_stored_hashref_ref=\$uri_args_headers_in_frozen_to_headers_out{$W->{"uri_args_headers_in_frozen"}};
1338         if (!$$headers_out_stored_hashref_ref
1339                         || !Data::Compare::Compare(\%headers_out,$$headers_out_stored_hashref_ref)) {
1340                 cluck "Non-matching generated 'headers_out' per 'uri_args_headers_in_frozen' key:\n"
1341                                                 .Dumper(\%headers_out,$$headers_out_stored_hashref_ref)
1342                                 if $$headers_out_stored_hashref_ref;
1343                 # Build or possibly prevent such further warn dupes:
1344                 $$headers_out_stored_hashref_ref=\%headers_out;
1345                 }
1346
1347 ###print STDERR Dumper(\%uri_args_frozen_to_headers_in_keys,\%uri_args_headers_in_frozen_to_headers_out);
1348 }
1349
1350 sub heading()
1351 {
1352 my($class)=@_;
1353
1354         if (!$W->{"header_only"}) {
1355                 header("Content-Style-Type"=>"text/css");
1356                 # Do not: text/javascript
1357                 # as it does not look as registered, at least according to: MIME::Types $VERSION 1.15
1358                 # "application/javascript" so far standardized till 2005-12-08 by:
1359                 #       http://www.ietf.org/internet-drafts/draft-hoehrmann-script-types-03.txt
1360                 header("Content-Script-Type"=>"application/javascript");
1361                 # $W->{"r"}->content_languages() ?
1362                 do { header("Content-Language"=>$_) if $_; } for $W->{"language"};
1363                 }
1364         # TODO: Support also: private
1365         header("Cache-Control"=>"public");      # HTTP/1.1
1366
1367         # Use $W->{"charset"}=0 to disable charset.
1368         $W->{"charset"}="us-ascii"
1369                         if !defined $W->{"charset"} && (!defined($W->{"content_type"}) || $W->{"content_type"});
1370
1371         # Workaround bug
1372         #   https://bugzilla.mozilla.org/show_bug.cgi?id=120556
1373         # of at least
1374         #   Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.8b) Gecko/20050217
1375         # http://validator.w3.org/ does not send ANY "Accept" headers!
1376         if (!defined $W->{"content_type"}) {
1377                 # Be _stable_ for "headers_in".
1378                 my $accept=$W->{"headers_in"}{"Accept"};
1379                 my $user_agent=$W->{"headers_in"}{"User-Agent"}||"";
1380                 $W->{"content_type"}="application/xhtml+xml"
1381                                 if !$accept && $user_agent=~m{^W3C_Validator/}i;
1382                 # Be _stable_:
1383                 my $negotiated=$class->Negotiate_choose([
1384                                 # Put the fallback variant as the first one.
1385                                 # Rate both variants the same to prefer "text/html" for undecided clients.
1386                                 # At least
1387                                 #   Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.8b) Gecko/20050217
1388                                 # prefers "application/xhtml+xml" over "text/html" itself:
1389                                 #   text/xml,application/xml,application/xhtml+xml,text/html;q=0.9,text/plain;q=0.8,image/png,*/*;q=0.5
1390                                 negotiate_variant(
1391                                                 "id"=>"text/html",
1392                                                 "content-type"=>"text/html",
1393                                                 "qs"=>0.6,
1394                                                 (!$W->{"charset"} ? () : "charset"=>$W->{"charset"}),
1395                                                 "lang"=>$W->{"language"},
1396                                                 ),
1397                                 negotiate_variant(
1398                                                 "id"=>"application/xhtml+xml",
1399                                                 "content-type"=>"application/xhtml+xml",
1400                                                 "qs"=>0.6,
1401                                                 (!$W->{"charset"} ? () : "charset"=>$W->{"charset"}),
1402                                                 "lang"=>$W->{"language"},
1403                                                 ),
1404                                 # application/xml ?
1405                                 # text/xml ?
1406                                 ]);
1407                 $W->{"content_type"}=$negotiated if !defined $W->{"content_type"};
1408                 }
1409         # mod_perl doc: If you set this header via the headers_out table directly, it
1410         #               will be ignored by Apache. So do not do that.
1411         my $type;
1412         if ($W->{"content_type"}) {
1413                 $type=MIME::Types->new()->type($W->{"content_type"});
1414                 cluck "MIME::Types type '".$W->{"content_type"}."' not known" if !$type;
1415                 }
1416         cluck "charset='".$W->{"charset"}."' does not match content-type='".$W->{"content_type"}."'"
1417                         if ($W->{"charset"} ? 1 : 0) != (!$type ? 0 : $type->isAscii());
1418         $W->{"r"}->content_type($W->{"content_type"}.(!$W->{"charset"} ? "" : "; charset=".$W->{"charset"}))
1419                         if $W->{"content_type"};
1420
1421         cache_start();
1422         # We still can append headers before we put out some text.
1423         # FIXME: It is not clean to still append them without overwriting.
1424         return if $W->{"heading_done"};
1425         Wprint '<?xml version="1.0" encoding="'.$W->{"charset"}.'"?>'."\n"
1426                         if (!$W->{"header_only"} || $W->{"header_only"} eq "xml") && (0
1427                                         || $W->{"content_type"}=~m{^application/\w+[+]xml$}
1428                                         || $W->{"content_type"} eq "text/vnd.wap.wml");
1429         return if $W->{"header_only"};
1430         # Split 'heading_done' for the proper handling of: /project/Rel.pm
1431         $W->{"heading_done"}++;
1432
1433         Wprint '<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.1//EN" "http://www.w3.org/TR/xhtml11/DTD/xhtml11.dtd">'."\n";
1434         Wprint '<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="'.$W->{"language"}.'">'."\n";
1435         my $title=$W->{"title_prefix"}.join("",map({ ': '.$_; } ($W->{"title"} || ())));
1436         # Do not: cluck if $title=~/[<>]/;
1437         # as it is not solved just by: &a_href_inhibit
1438         # as sometimes titles use also: <i>...</i>
1439         $title=~s#<[^>]*>##g;
1440         Wprint "<head>";
1441         Wprint "<title>$title</title>\n";
1442         if ($W->{"have_css"}) {
1443                 # Everything can get overriden later.
1444                 for my $css ("/My/Web.css",@{$W->{"css_push"}}) {
1445                         Wprint <<"HERE";
1446 <link rel="stylesheet" type="text/css" href="@{[ uri_escaped(path_web $css) ]}" />
1447 HERE
1448                         }
1449                 if ($W->{"css_inherit"}) {
1450                         $W->{"js_push"}="/My/css_inherit.js";
1451                         }
1452                 }
1453         for my $js (@{$W->{"js_push"}}) {
1454                 # Do not: <script />
1455                 # as at least Lynx inhibits any further HTML output.
1456                 # Do not: text/javascript
1457                 # as it does not look as registered, at least according to: MIME::Types $VERSION 1.15
1458                 # "application/javascript" so far standardized till 2005-12-08 by:
1459                 #       http://www.ietf.org/internet-drafts/draft-hoehrmann-script-types-03.txt
1460                 Wprint <<"HERE";
1461 <script type="application/javascript" src="@{[ uri_escaped(path_web $js) ]}"></script>
1462 <script type="text/javascript"        src="@{[ uri_escaped(path_web $js) ]}"></script>
1463 HERE
1464                 }
1465         Wprint '<meta name="robots" content="'.($W->{"indexme"} ? "" : "no" ).'index,follow" />'."\n";
1466         for my $head (@{$W->{"head_push"}}) {
1467                 $head=&{$head}() if "CODE" eq ref $head;
1468                 Wprint $head;
1469                 }
1470         for my $type (qw(prev next index contents start up)) {
1471                 do { Wprint '<link rel="'.$type.'" href="'.uri_escaped(path_web $_).'" />'."\n" if $_; }
1472                                 for ($W->{"rel_$type"});
1473                 }
1474         Wprint "</head><body";
1475 #       Wprint ' bgcolor="black" text="white" link="aqua" vlink="teal"'
1476 #                       if $W->{"browser"}->netscape() && (!$W->{"browser"}->major() || $W->{"browser"}->major()<=4);
1477         Wprint $W->{"body_attr"};
1478         Wprint ">\n";
1479
1480         do { Wprint $_ if $_; } for $W->{"heading"};
1481 }
1482
1483 BEGIN {
1484         delete $W->{"__My::Web_init"};
1485         }
1486
1487 1;