Documentation
[CGIscriptor.git] / CGIscriptor.pl
blob62b7ce58a26a836addb94d84e54285b39739cfd5
1 #! /usr/bin/perl
3 # (configure the first line to contain YOUR path to perl 5.000+)
5 # CGIscriptor.pl
6 # Version 2.3
7 # 15 January 2002
9 # YOU NEED:
11 # perl 5.0 or higher (see: "http://www.perl.org/")
13 # Notes:
15 if(grep(/\-\-help/i, @ARGV))
17 print << 'ENDOFPREHELPTEXT1';
18 # CGIscriptor.pl is a Perl program will run on any WWW server that
19 # runs Perl scripts, just add a line like the following to your
20 # httpd.conf file (Apache example):
22 # ScriptAlias /SHTML/ "/real-path/CGIscriptor.pl/"
24 # URL's that refer to http://www.your.address/SHTML/... will now be handled
25 # by CGIscriptor.pl, which can use a private directory tree (default is the
26 # DOCUMENT_ROOT directory tree, but it can be anywhere, see below).
27 # NOTE: if you cannot use a ScriptAlias, there is a way to use .htaccess
28 # instead. See below.
30 # This file contains all documentation as comments. These comments
31 # can be removed to speed up loading (e.g., `egrep -v '^#' CGIscriptor.pl` >
32 # leanScriptor.pl). A bare bones version of CGIscriptor.pl, lacking
33 # documentation, most comments, access control, example functions etc.
34 # (but still with the copyright notice and some minimal documentation)
35 # can be obtained by calling CGIscriptor.pl with the '-slim'
36 # command line argument, e.g.,
37 # >CGIscriptor.pl -slim >slimCGIscriptor.pl
39 # CGIscriptor.pl can be run from the command line as
40 # `CGIscriptor.pl <path> <query>`, inside a perl script with
41 # 'do CGIscriptor.pl' after setting $ENV{PATH_INFO} and $ENV{QUERY_STRING},
42 # or CGIscriptor.pl can be loaded with 'require "/real-path/CGIscriptor.pl"'.
43 # In the latter case, requests are processed by 'Handle_Request();'
44 # (again after setting $ENV{PATH_INFO} and $ENV{QUERY_STRING}).
46 # The --help command line switch will print the manual.
48 # Running demo's and more information can be found at
49 # http://www.fon.hum.uva.nl/rob/OSS/OSS.html
51 # A pocket-size HTTP daemon, CGIservlet.pl, is available from my web site
52 # or CPAN that can use CGIscriptor.pl as the base of a µWWW server and
53 # demonstrates its use.
55 ENDOFPREHELPTEXT1
57 # Configuration, copyright notice, and user manual follow the next
58 # (Changes) section.
60 ############################################################################
62 # Changes (document ALL changes with date, name and email here):
63 # 11 Jun 2012 - Securing CGIvariable setting. Made
64 # 'if($ENV{QUERY_STRING} =~ /$name/)' into elsif in
65 # defineCGIvariable/List/Hash to give precedence to ENV{$name}
66 # This was a very old security bug. Added ProtectCGIvariable($name).
67 # 06 Jun 2012 - Added IP only session types after login.
68 # 31 May 2012 - Session ticket system added for handling login sessions.
69 # 29 May 2012 - CGIsafeFileName does not accept filenames starting with '.'
70 # 29 May 2012 - Added CGIscriptor::BrowseAllDirs to handle browsing directories
71 # correctly.
72 # 22 May 2012 - Added Access control with Session Tickets linked to
73 # IP Address and PATH_INFO.
74 # 21 May 2012 - Corrected the links generated by CGIscriptor::BrowseDirs
75 # Will link to current base URL when the HTTP server is '.' or '~'
76 # 29 Oct 2009 - Adapted David A. Wheeler's suggestion about filenames:
77 # CGIsafeFileName does not accept filenames starting with '-'
78 # (http://www.dwheeler.com/essays/fixing-unix-linux-filenames.html)
79 # 08 Oct 2009 - Some corrections in the README.txt file, eg, new email address
80 # 28 Jan 2005 - Added a file selector to performTranslation.
81 # Changed %TranslationTable to @TranslationTable
82 # and patterns to lists.
83 # 27 Jan 2005 - Added a %TranslationTable with associated
84 # performTranslation(\$text) function to allow
85 # run changes in the web pages. Say, to translate
86 # legacy pages with <%=...%> delimiters to the new
87 # <SCRIPT TYPE=..></SCRIPT> format.
88 # 27 Jan 2005 - Small bug of extra '\n' in output removed from the
89 # Other Languages Code.
90 # 10 May 2004 - Belated upload of latest version (2.3) to CPAN
91 # 07 Oct 2003 - Corrected error '\s' -> '\\s' in rebol scripting
92 # language call
93 # 07 Oct 2003 - Corrected omitted INS tags in <DIV><INS> handling
94 # 20 May 2003 - Added a --help switch to print the manual.
95 # 06 Mar 2003 - Adapted the blurb at the end of the file.
96 # 03 Mar 2003 - Added a user definable dieHandler function to catch all
97 # "die" calls. Also "enhanced" the STDERR printout.
98 # 10 Feb 2003 - Split off the reading of the POST part of a query
99 # from Initialize_output. This was suggested by Gerd Franke
100 # to allow for the catching of the file_path using a
101 # POST based lookup. That is, he needed the POST part
102 # to change the file_path.
103 # 03 Feb 2003 - %{$name}; => %{$name} = (); in defineCGIvariableHash.
104 # 03 Feb 2003 - \1 better written as $1 in
105 # $directive =~ s/[^\\\$]\#[^\n\f\r]*([\n\f\r])/$1/g
106 # 29 Jan 2003 - This makes "CLASS="ssperl" CSS-compatible Gerd Franke
107 # added:
108 # $ServerScriptContentClass = "ssperl";
109 # changed in ProcessFile():
110 # unless(($CurrentContentType =~
111 # 28 Jan 2003 - Added 'INS' Tag! Gerd Franke
112 # 20 Dec 2002 - Removed useless $Directoryseparator variable.
113 # Update comments and documentation.
114 # 18 Dec 2002 - Corrected bug in Accept/Reject processing.
115 # Files didn't work.
116 # 24 Jul 2002 - Added .htaccess documentation (from Gerd Franke)
117 # Also added a note that RawFilePattern can be a
118 # complete file name.
119 # 19 Mar 2002 - Added SRC pseudo-files PREFIX and POSTFIX. These
120 # switch to prepending or to appending the content
121 # of the SRC attribute. Default is prefixing. You
122 # can add as many of these switches as you like.
123 # 13 Mar 2002 - Do not search for tag content if a tag closes with
124 # />, i.e., <DIV ... /> will be handled the XML/XHTML way.
125 # 25 Jan 2002 - Added 'curl' and 'snarf' to SRC attribute URL handling
126 # (replaces wget).
127 # 25 Jan 2002 - Found a bug in SAFEqx, now executes qx() in a scalar context
128 # (i.o. a list context). This is necessary for binary results.
129 # 24 Jan 2002 - Disambiguated -T $SRCfile to -T "$SRCfile" (and -e) and
130 # changed the order of if/elsif to allow removing these
131 # conditions in systems with broken -T functions.
132 # (I also removed a spurious ')' bracket)
133 # 17 Jan 2002 - Changed DIV tag SRC from <SOURCE> to sysread(SOURCE,...)
134 # to support binary files.
135 # 17 Jan 2002 - Removed WhiteSpace from $FileAllowedCharacters.
136 # 17 Jan 2002 - Allow "file://" prefix in SRC attribute. It is simply
137 # stipped from the path.
138 # 15 Jan 2002 - Version 2.2
139 # 15 Jan 2002 - Debugged and completed URL support (including
140 # CGIscriptor::read_url() function)
141 # 07 Jan 2002 - Added automatic (magic) URL support to the SRC attribute
142 # with the main::GET_URL function. Uses wget -O underlying.
143 # 04 Jan 2002 - Added initialization of $NewDirective in InsertForeignScript
144 # (i.e., my $NewDirective = "";) to clear old output
145 # (this was a realy anoying bug).
146 # 03 Jan 2002 - Added a <DIV CLASS='text/ssperl' ID='varname'></DIV>
147 # tags that assign the body text as-is (literally)
148 # to $varname. Allows standard HTML-tools to handle
149 # Cascading Style Sheet templates. This implements a
150 # design by Gerd Franke (franke@roo.de).
151 # 03 Jan 2002 - I finaly gave in and allowed SRC files to expand ~/.
152 # 12 Oct 2001 - Normalized spelling of "CGIsafFileName" in documentation.
153 # 09 Oct 2001 - Added $ENV{'CGI_BINARY_FILE'} to log files to
154 # detect unwanted indexing of TAR files by webcrawlers.
155 # 10 Sep 2001 - Added $YOUR_SCRIPTS directory to @INC for 'require'.
156 # 22 Aug 2001 - Added .txt (Content-type: text/plain) as a default
157 # processed file type. Was processed via BinaryMapFile.
158 # 31 May 2001 - Changed =~ inside CGIsafeEmailAddress that was buggy.
159 # 29 May 2001 - Updated $CGI_HOME to point to $ENV{DOCUMENT_ROOT} io
160 # the root of PATH_TRANSLATED. DOCUMENT_ROOT can now
161 # be manipulated to achieve a "Sub Root".
162 # NOTE: you can have $YOUR_HTML_FILES != DOCUMENT_ROOT
163 # 28 May 2001 - Changed CGIscriptor::BrowsDirs function for security
164 # and debugging (it now works).
165 # 21 May 2001 - defineCGIvariableHash will ADD values to existing
166 # hashes,instead of replacing existing hashes.
167 # 17 May 2001 - Interjected a '&' when pasting POST to GET data
168 # 24 Apr 2001 - Blocked direct requests for BinaryMapFile.
169 # 16 Aug 2000 - Added hash table extraction for CGI parameters with
170 # CGIparseValueHash (used with structured parameters).
171 # Use: CGI='%<CGI-partial-name>' (fill in your name in <>)
172 # Will collect all <CGI-partial-name><key>=value pairs in
173 # $<CGI-partial-name>{<key>} = value;
174 # 16 Aug 2000 - Adapted SAFEqx to protect @PARAMETER values.
175 # 09 Aug 2000 - Added support for non-filesystem input by way of
176 # the CGI_FILE_CONTENTS and CGI_DATA_ACCESS_CODE
177 # environment variables.
178 # 26 Jul 2000 - On the command-line, file-path '-' indicates STDIN.
179 # This allows CGIscriptor to be used in pipes.
180 # Default, $BLOCK_STDIN_HTTP_REQUEST=1 will block this
181 # in an HTTP request (i.e., in a web server).
182 # 26 Jul 2000 - Blocked 'Content-type: text/html' if the SERVER_PROTOCOL
183 # is not HTTP or another protocol. Changed the default
184 # source directory to DOCUMENT_ROOT (i.o. the incorrect
185 # SERVER_ROOT).
186 # 24 Jul 2000 - -slim Command-line argument added to remove all
187 # comments, security, etc.. Updated documentation.
188 # 05 Jul 2000 - Added IF and UNLESS attributes to make the
189 # execution of all <META> and <SCRIPT> code
190 # conditional.
191 # 05 Jul 2000 - Rewrote and isolated the code for extracting
192 # quoted items from CGI and SRC attributes.
193 # Now all attributes expect the same set of
194 # quotes: '', "", ``, (), {}, [] and the same
195 # preceded by a \, e.g., "\((aap)\)" will be
196 # extracted as "(aap)".
197 # 17 Jun 2000 - Construct @ARGV list directly in CGIexecute
198 # name-space (i.o. by evaluation) from
199 # CGI attributes to prevent interference with
200 # the processing for non perl scripts.
201 # Changed CGIparseValueList to prevent runaway
202 # loops.
203 # 16 Jun 2000 - Added a direct (interpolated) display mode
204 # (text/ssdisplay) and a user log mode
205 # (text/sslogfile).
206 # 06 Jun 2000 - Replace "print $Result" with a syswrite loop to
207 # allow large string output.
208 # 02 Jun 2000 - Corrected shrubCGIparameter($CGI_VALUE) to realy
209 # remove all control characters. Changed Interpreter
210 # initialization to shrub interpolated CGI parameters.
211 # Added 'text/ssmailto' interpreter script.
212 # 22 May 2000 - Changed some of the comments
213 # 09 May 2000 - Added list extraction for CGI parameters with
214 # CGIparseValueList (used with multiple selections).
215 # Use: CGI='@<CGI-parameter>' (fill in your name in <>)
216 # 09 May 2000 - Added a 'Not Present' condition to CGIparseValue.
217 # 27 Apr 2000 - Updated documentation to reflect changes.
218 # 27 Apr 2000 - SRC attribute "cleaned". Supported for external
219 # interpreters.
220 # 27 Apr 2000 - CGI attribute can be used in <SCRIPT> tag.
221 # 27 Apr 2000 - Gprolog, M4 support added.
222 # 26 Apr 2000 - Lisp (rep) support added.
223 # 20 Apr 2000 - Use of external interpreters now functional.
224 # 20 Apr 2000 - Removed bug from extracting Content types (RegExp)
225 # 10 Mar 2000 - Qualified unconditional removal of '#' that preclude
226 # the use of $#foo, i.e., I changed
227 # s/[^\\]\#[^\n\f\r]*([\n\f\r])/\1/g
228 # to
229 # s/[^\\\$]\#[^\n\f\r]*([\n\f\r])/\1/g
230 # 03 Mar 2000 - Added a '$BlockPathAccess' variable to "hide"
231 # things like, e.g., CVS information in CVS subtrees
232 # 10 Feb 2000 - URLencode/URLdecode have been made case-insensitive
233 # 10 Feb 2000 - Added a BrowseDirs function (CGIscriptor package)
234 # 01 Feb 2000 - A BinaryMapFile in the ~/ directory has precedence
235 # over a "burried" BinaryMapFile.
236 # 04 Oct 1999 - Added two functions to check file names and email addresses
237 # (CGIscriptor::CGIsafeFileName and
238 # CGIscriptor::CGIsafeEmailAddress)
239 # 28 Sept 1999 - Corrected bug in sysread call for reading POST method
240 # to allow LONG posts.
241 # 28 Sept 1999 - Changed CGIparseValue to handle multipart/form-data.
242 # 29 July 1999 - Refer to BinaryMapFile from CGIscriptor directory, if
243 # this directory exists.
244 # 07 June 1999 - Limit file-pattern matching to LAST extension
245 # 04 June 1999 - Default text/html content type is printed only once.
246 # 18 May 1999 - Bug in replacement of ~/ and ./ removed.
247 # (Rob van Son, R.J.J.H.vanSon@uva.nl)
248 # 15 May 1999 - Changed the name of the execute package to CGIexecute.
249 # Changed the processing of the Accept and Reject file.
250 # Added a full expression evaluation to Access Control.
251 # (Rob van Son, R.J.J.H.vanSon@uva.nl)
252 # 27 Apr 1999 - Brought CGIscriptor under the GNU GPL. Made CGIscriptor
253 # Version 1.1 a module that can be called with 'require "CGIscriptor.pl"'.
254 # Requests are serviced by "Handle_Request()". CGIscriptor
255 # can still be called as a isolated perl script and a shell
256 # command.
257 # Changed the "factory default setting" so that it will run
258 # from the DOCUMENT_ROOT directory.
259 # (Rob van Son, R.J.J.H.vanSon@uva.nl)
260 # 29 Mar 1999 - Remove second debugging STDERR switch. Moved most code
261 # to subroutines to change CGIscriptor into a module.
262 # Added mapping to process unsupported file types (e.g., binary
263 # pictures). See $BinaryMapFile.
264 # (Rob van Son, R.J.J.H.vanSon@uva.nl)
265 # 24 Sept 1998 - Changed text of license (Rob van Son, R.J.J.H.vanSon@uva.nl)
266 # Removed a double setting of filepatterns and maximum query
267 # size. Changed email address. Removed some typos from the
268 # comments.
269 # 02 June 1998 - Bug fixed in URLdecode. Changing the foreach loop variable
270 # caused quiting CGIscriptor.(Rob van Son, R.J.J.H.vanSon@uva.nl)
271 # 02 June 1998 - $SS_PUB and $SS_SCRIPT inserted an extra /, removed.
272 # (Rob van Son, R.J.J.H.vanSon@uva.nl)
275 # Known Bugs:
277 # 23 Mar 2000
278 # It is not possible to use operators or variables to construct variable names,
279 # e.g., $bar = \@{$foo}; won't work. However, eval('$bar = \@{'.$foo.'};');
280 # will indeed work. If someone could tell me why, I would be obliged.
283 ############################################################################
285 # OBLIGATORY USER CONFIGURATION
287 # Configure the directories where all user files can be found (this
288 # is the equivalent of the server root directory of a WWW-server).
289 # These directories can be located ANYWHERE. For security reasons, it is
290 # better to locate them outside the WWW-tree of your HTTP server, unless
291 # CGIscripter handles ALL requests.
293 # For convenience, the defaults are set to the root of the WWW server.
294 # However, this might not be safe!
296 # ~/ text files
297 # $YOUR_HTML_FILES = "/usr/pub/WWW/SHTML"; # or SS_PUB as environment var
298 # (patch to use the parent directory of CGIscriptor as document root, should be removed)
299 if($ENV{'SCRIPT_FILENAME'}) # && $ENV{'SCRIPT_FILENAME'} !~ /\Q$ENV{'DOCUMENT_ROOT'}\E/)
301 $ENV{'DOCUMENT_ROOT'} = $ENV{'SCRIPT_FILENAME'};
302 $ENV{'DOCUMENT_ROOT'} =~ s@/CGIscriptor.*$@@ig;
305 # Just enter your own directory path here
306 $YOUR_HTML_FILES = $ENV{'DOCUMENT_ROOT'}; # default is the DOCUMENT_ROOT
308 # ./ script files (recommended to be different from the previous)
309 # $YOUR_SCRIPTS = "/usr/pub/WWW/scripts"; # or SS_SCRIPT as environment var
310 $YOUR_SCRIPTS = $YOUR_HTML_FILES; # This might be a SECURITY RISK
312 # End of obligatory user configuration
313 # (note: there is more non-essential user configuration below)
315 ############################################################################
317 # OPTIONAL USER CONFIGURATION (all values are used CASE INSENSITIVE)
319 # Script content-types: TYPE="Content-type" (user defined mime-type)
320 $ServerScriptContentType = "text/ssperl"; # Server Side Perl scripts
321 # CSS require a simple class
322 $ServerScriptContentClass = $ServerScriptContentType =~ m!/! ?
323 $' : "ssperl"; # Server Side Perl CSS classes
325 $ShellScriptContentType = "text/osshell"; # OS shell scripts
326 # # (Server Side perl ``-execution)
328 # Accessible file patterns, block any request that doesn't match.
329 # Matches any file with the extension .(s)htm(l), .txt, or .xmr
330 # (\. is used in regexp)
331 # Note: die unless $PATH_INFO =~ m@($FilePattern)$@is;
332 $FilePattern = ".shtml|.htm|.html|.xml|.xmr|.txt|.js";
334 # The table with the content type MIME types
335 # (allows to differentiate MIME types, if needed)
336 %ContentTypeTable =
338 '.html' => 'text/html',
339 '.shtml' => 'text/html',
340 '.htm' => 'text/html',
341 '.xml' => 'text/xml',
342 '.txt' => 'text/plain',
343 '.js' => 'text/plain'
347 # File pattern post-processing
348 $FilePattern =~ s/([@.])/\\$1/g; # Convert . and @ to \. and \@
350 # SHAsum command needed for Authorization and Login
351 # (note, these have to be accessible in the HTML pages, ie, the CGIexecute environment)
352 my $shasum = "shasum -a 256";
353 if(qx{uname} =~ /Darwin/)
355 $shasum = "shasum-5.12 -a 256" unless `which shasum`;
357 my $SHASUMCMD = $shasum.' |cut -f 1 -d" "';
358 $ENV{"SHASUMCMD"} = $SHASUMCMD;
359 my $RANDOMHASHCMD = 'dd bs=1 count=64 if=/dev/urandom 2>/dev/null | '.$shasum.' -b |cut -f 1 -d" "';
360 $ENV{"RANDOMHASHCMD"} = $RANDOMHASHCMD;
362 # Hash a string, return hex of hash
363 sub hash_string # ($string) -> hex_hash
365 my $string = shift || "";
366 # Catch nasty \'-quotes, embed them in '..'"'"'..'
367 $string =~ s/\'/\'\"\'\"\'/isg;
368 my $hash = `printf '%s' '$string'| $ENV{"SHASUMCMD"}`;
369 chomp($hash);
370 return $hash;
373 # Generate random hex hash
374 sub get_random_hex # () -> hex
376 # Create Random Hash Salt
377 open(URANDOM, "$RANDOMHASHCMD |") || die "URANDOM; $RANDOMHASHCMD | $!\n";
378 my $RANDOMSALT= <URANDOM>;
379 close(URANDOM);
380 chomp($RANDOMSALT);
382 return $RANDOMSALT;
386 # File patterns of files which are handled by session tickets.
387 %TicketRequiredPatterns = (
388 '^/Private(/|$)' => "Private/.Sessions\tPrivate/.Passwords\t/Private/Login.html\t+36000"
390 # Used to set cookies, only session cookies supported
391 my %SETCOOKIELIST = ();
393 # Session Ticket Directory: Private/.Sessions
394 # Password Directory: Private/.Passwords
395 # Login page (url path): /Private/Login.html
396 # Expiration time (s): +3600
397 # +<seconds> = relative time <seconds> is absolute date-time
399 # Raw files must contain their own Content-type (xmr <- x-multipart-replace).
400 # THIS IS A SUBSET OF THE FILES DEFINED IN $FilePattern
401 $RawFilePattern = ".xmr";
402 # (In principle, this could contain a full file specification, e.g.,
403 # ".xmr|relocated.html")
405 # Raw File pattern post-processing
406 $RawFilePattern =~ s/([@.])/\\$1/g; # Convert . and @ to \. and \@
408 # Server protocols for which "Content-type: text/html\n\n" should be printed
409 # (you should not bother with these, except for HTTP, they are mostly imaginary)
410 $ContentTypeServerProtocols = 'HTTP|MAIL|MIME';
412 # Block access to all (sub-) paths and directories that match the
413 # following (URL) path (is used as:
414 # 'die if $BlockPathAccess && $ENV{'PATH_INFO'} =~ m@$BlockPathAccess@;' )
415 $BlockPathAccess = '/(CVS|\.git)/'; # Protect CVS and .git information
417 # All (blocked) other file-types can be mapped to a single "binary-file"
418 # processor (a kind of pseudo-file path). This can either be an error
419 # message (e.g., "illegal file") or contain a script that serves binary
420 # files.
421 # Note: the real file path wil be stored in $ENV{CGI_BINARY_FILE}.
422 $BinaryMapFile = "/BinaryMapFile.xmr";
423 # Allow for the addition of a CGIscriptor directory
424 # Note that a BinaryMapFile in the root "~/" directory has precedence
425 $BinaryMapFile = "/CGIscriptor".$BinaryMapFile
426 if ! -e "$YOUR_HTML_FILES".$BinaryMapFile
427 && -e "$YOUR_HTML_FILES/CGIscriptor".$BinaryMapFile;
430 # List of all characters that are allowed in file names and paths.
431 # All requests containing illegal characters are blocked. This
432 # blocks most tricks (e.g., adding "\000", "\n", or other control
433 # characters, also blocks URI's using %FF)
434 # THIS IS A SECURITY FEATURE
435 # (this is also used to parse filenames in SRC= features, note the
436 # '-quotes, they are essential)
437 $FileAllowedChars = '\w\.\~\/\:\*\?\-'; # Covers Unix and Mac, but NO spaces
439 # Maximum size of the Query (number of characters clients can send
440 # covers both GET & POST combined)
441 $MaximumQuerySize = 2**20 - 1; # = 2**14 - 1
444 # Embeded URL get function used in SRC attributes and CGIscriptor::read_url
445 # (returns a string with the PERL code to transfer the URL contents, e.g.,
446 # "SAFEqx(\'curl \"http://www.fon.hum.uva.nl\"\')")
447 # "SAFEqx(\'wget --quiet --output-document=- \"http://www.fon.hum.uva.nl\"\')")
448 # Be sure to handle <BASE HREF='URL'> and allow BOTH
449 # direct printing GET_URL($URL [, 0]) and extracting the content of
450 # the $URL for post-processing GET_URL($URL, 1).
451 # You get the WHOLE file, including HTML header.
452 # The shell command Use $URL where the URL should go
453 # ('wget', 'snarf' or 'curl', uncomment the one you would like to use)
454 my $GET_URL_shell_command = 'wget --quiet --output-document=- $URL';
455 #my $GET_URL_shell_command = 'snarf $URL -';
456 #my $GET_URL_shell_command = 'curl $URL';
458 sub GET_URL # ($URL, $ValueNotPrint) -> content_of_url
460 my $URL = shift || return;
461 my $ValueNotPrint = shift || 0;
463 # Check URL for illegal characters
464 return "print '<h1>Illegal URL<h1>'\"\n\";" if $URL =~ /[^$FileAllowedChars\%]/;
466 # Include URL in final command
467 my $CurrentCommand = $GET_URL_shell_command;
468 $CurrentCommand =~ s/\$URL/$URL/g;
470 # Print to STDOUT or return a value
471 my $BlockPrint = "print STDOUT ";
472 $BlockPrint = "" if $ValueNotPrint;
474 my $Commands = <<"GETURLCODE";
475 # Get URL
477 my \$Page = "";
479 # Simple, using shell command
480 \$Page = SAFEqx('$CurrentCommand');
482 # Add a BASE tage to the header
483 \$Page =~ s!\\</head!\\<base href='$URL'\\>\\</head!ig unless \$Page =~ m!\\<base!;
485 # Print the URL value, or return it as a value
486 $BlockPrint\$Page;
488 GETURLCODE
489 return $Commands;
492 # As files can get rather large (and binary), you might want to use
493 # some more intelligent reading procedure, e.g.,
494 # Direct Perl
495 # # open(URLHANDLE, '/usr/bin/wget --quiet --output-document=- "$URL"|') || die "wget: \$!";
496 # #open(URLHANDLE, '/usr/bin/snarf "$URL" -|') || die "snarf: \$!";
497 # open(URLHANDLE, '/usr/bin/curl "$URL"|') || die "curl: \$!";
498 # my \$text = "";
499 # while(sysread(URLHANDLE,\$text, 1024) > 0)
501 # \$Page .= \$text;
502 # };
503 # close(URLHANDLE) || die "\$!";
504 # However, this doesn't work with the CGIexecute->evaluate() function.
505 # You get an error: 'No child processes at (eval 16) line 15, <file0> line 8.'
507 # You can forget the next two variables, they are only needed when
508 # you don't want to use a regular file system (i.e., with open)
509 # but use some kind of database/RAM image for accessing (generating)
510 # the data.
512 # Name of the environment variable that contains the file contents
513 # when reading directly from Database/RAM. When this environment variable,
514 # $ENV{$CGI_FILE_CONTENTS}, is not false, no real file will be read.
515 $CGI_FILE_CONTENTS = 'CGI_FILE_CONTENTS';
516 # Uncomment the following if you want to force the use of the data access code
517 # $ENV{$CGI_FILE_CONTENTS} = '-'; # Force use of $ENV{$CGI_DATA_ACCESS_CODE}
519 # Name of the environment variable that contains the RAM access perl
520 # code needed to read additional "files", i.e.,
521 # $ENV{$CGI_FILE_CONTENTS} = eval("\@_=('$file_path'); do{$ENV{$CGI_DATA_ACCESS_CODE}}");
522 # When $ENV{$CGI_FILE_CONTENTS} eq '-', this code is executed to generate the data.
523 $CGI_DATA_ACCESS_CODE = 'CGI_DATA_ACCESS_CODE';
525 # You can, of course, fill this yourself, e.g.,
526 # $ENV{$CGI_DATA_ACCESS_CODE} =
527 # 'open(INPUT, "<$_[0]"); while(<INPUT>){print;};close(INPUT);'
530 # DEBUGGING
532 # Suppress error messages, this can be changed for debugging or error-logging
533 #open(STDERR, "/dev/null"); # (comment out for use in debugging)
535 # SPECIAL: Remove Comments, security, etc. if the command line is
536 # '>CGIscriptor.pl -slim >slimCGIscriptor.pl'
537 $TrimDownCGIscriptor = 1 if $ARGV[0] =~ /^\-slim/i;
539 # If CGIscriptor is used from the command line, the command line
540 # arguments are interpreted as the file (1st) and the Query String (rest).
541 # Get the arguments
542 $ENV{'PATH_INFO'} = shift(@ARGV) unless exists($ENV{'PATH_INFO'}) || grep(/\-\-help/i, @ARGV);
543 $ENV{'QUERY_STRING'} = join("&", @ARGV) unless exists($ENV{'QUERY_STRING'});
546 # Handle bail-outs in a user definable way.
547 # Catch Die and replace it with your own function.
548 # Ends with a call to "die $_[0];"
550 sub dieHandler # ($ErrorCode, "Message", @_) -> DEAD
552 my $ErrorCode = shift;
553 my $ErrorMessage = shift;
555 # Place your own reporting functions here
557 # Now, kill everything (default)
558 print STDERR "$ErrorCode: $ErrorMessage\n";
559 die $ErrorMessage;
563 # End of optional user configuration
564 # (note: there is more non-essential user configuration below)
566 if(grep(/\-\-help/i, @ARGV))
568 print << 'ENDOFPREHELPTEXT2';
570 ###############################################################################
572 # Author and Copyright (c):
573 # Rob van Son, © 1995,1996,1997,1998,1999,2000,2001,2002-2012
574 # NKI-AVL Amsterdam
575 # r.v.son@nki.nl
576 # Institute of Phonetic Sciences & IFOTT/ACLS
577 # University of Amsterdam
578 # Email: R.J.J.H.vanSon@gmail.com
579 # Email: R.J.J.H.vanSon@uva.nl
580 # WWW : http://www.fon.hum.uva.nl/rob/
582 # License for use and disclaimers
584 # CGIscriptor merges plain ASCII HTML files transparantly
585 # with CGI variables, in-line PERL code, shell commands,
586 # and executable scripts in other scripting languages.
588 # This program is free software; you can redistribute it and/or
589 # modify it under the terms of the GNU General Public License
590 # as published by the Free Software Foundation; either version 2
591 # of the License, or (at your option) any later version.
593 # This program is distributed in the hope that it will be useful,
594 # but WITHOUT ANY WARRANTY; without even the implied warranty of
595 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
596 # GNU General Public License for more details.
598 # You should have received a copy of the GNU General Public License
599 # along with this program; if not, write to the Free Software
600 # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
603 # Contributors:
604 # Rob van Son (R.J.J.H.vanSon@uva.nl)
605 # Gerd Franke franke@roo.de (designed the <DIV> behaviour)
607 #######################################################
608 ENDOFPREHELPTEXT2
610 #######################################################>>>>>>>>>>Start Remove
612 # You can skip the following code, it is an auto-splice
613 # procedure.
615 # Construct a slimmed down version of CGIscriptor
616 # (i.e., CGIscriptor.pl -slim > slimCGIscriptor.pl)
618 if($TrimDownCGIscriptor)
620 open(CGISCRIPTOR, "<CGIscriptor.pl")
621 || dieHandler(1, "<CGIscriptor.pl not slimmed down: $!\n");
622 my $SKIPtext = 0;
623 my $SKIPComments = 0;
625 while(<CGISCRIPTOR>)
627 my $SKIPline = 0;
629 ++$LineCount;
631 # Start of SKIP text
632 $SKIPtext = 1 if /[\>]{10}Start Remove/;
633 $SKIPComments = 1 if $SKIPtext == 1;
635 # Skip this line?
636 $SKIPline = 1 if $SKIPtext || ($SKIPComments && /^\s*\#/);
638 ++$PrintCount unless $SKIPline;
640 print STDOUT $_ unless $SKIPline;
642 # End of SKIP text ?
643 $SKIPtext = 0 if /[\<]{10}End Remove/;
645 # Ready!
646 print STDERR "\# Printed $PrintCount out of $LineCount lines\n";
647 exit;
650 #######################################################
652 if(grep(/\-\-help/i, @ARGV))
654 print << 'ENDOFHELPTEXT';
656 # HYPE
658 # CGIscriptor merges plain ASCII HTML files transparantly and safely
659 # with CGI variables, in-line PERL code, shell commands, and executable
660 # scripts in many languages (on-line and real-time). It combines the
661 # "ease of use" of HTML files with the versatillity of specialized
662 # scripts and PERL programs. It hides all the specifics and
663 # idiosyncrasies of correct output and CGI coding and naming. Scripts
664 # do not have to be aware of HTML, HTTP, or CGI conventions just as HTML
665 # files can be ignorant of scripts and the associated values. CGIscriptor
666 # complies with the W3C HTML 4.0 recommendations.
667 # In addition to its use as a WWW embeded CGI processor, it can
668 # be used as a command-line document preprocessor (text-filter).
670 # THIS IS HOW IT WORKS
672 # The aim of CGIscriptor is to execute "plain" scripts inside a text file
673 # using any required CGIparameters and environment variables. It
674 # is optimized to transparantly process HTML files inside a WWW server.
675 # The native language is Perl, but many other scripting languages
676 # can be used.
678 # CGIscriptor reads text files from the requested input file (i.e., from
679 # $YOUR_HTML_FILES$PATH_INFO) and writes them to <STDOUT> (i.e., the
680 # client requesting the service) preceded by the obligatory
681 # "Content-type: text/html\n\n" or "Content-type: text/plain\n\n" string
682 # (except for "raw" files which supply their own Content-type message
683 # and only if the SERVER_PROTOCOL supports HTTP, MAIL, or MIME).
685 # When CGIscriptor encounters an embedded script, indicated by an HTML4 tag
687 # <SCRIPT TYPE="text/ssperl" [CGI="$VAR='default value'"] [SRC="ScriptSource"]>
688 # PERL script
689 # </SCRIPT>
691 # or
693 # <SCRIPT TYPE="text/osshell" [CGI="$name='default value'"] [SRC="ScriptSource"]>
694 # OS Shell script
695 # </SCRIPT>
697 # construct (anything between []-brackets is optional, other MIME-types
698 # and scripting languages are supported), the embedded script is removed
699 # and both the contents of the source file (i.e., "do 'ScriptSource'")
700 # AND the script are evaluated as a PERL program (i.e., by eval()),
701 # shell script (i.e., by a "safe" version of `Command`, qx) or an external
702 # interpreter. The output of the eval() function takes the place of the
703 # original <SCRIPT></SCRIPT> construct in the output string. Any CGI
704 # parameters declared by the CGI attribute are available as simple perl
705 # variables, and can subsequently be made available as variables to other
706 # scripting languages (e.g., bash, python, or lisp).
708 # Example: printing "Hello World"
709 # <HTML><HEAD><TITLE>Hello World</TITLE>
710 # <BODY>
711 # <H1><SCRIPT TYPE="text/ssperl">"Hello World"</SCRIPT></H1>
712 # </BODY></HTML>
714 # Save this in a file, hello.html, in the directory you indicated with
715 # $YOUR_HTML_FILES and access http://your_server/SHTML/hello.html
716 # (or to whatever name you use as an alias for CGIscriptor.pl).
717 # This is realy ALL you need to do to get going.
719 # You can use any values that are delivered in CGI-compliant form (i.e.,
720 # the "?name=value" type URL additions) transparently as "$name" variables
721 # in your scripts IFF you have declared them in the CGI attribute of
722 # a META or SCRIPT tag before e.g.:
723 # <META CONTENT="text/ssperl; CGI='$name = `default value`'
724 # [SRC='ScriptSource']">
725 # or
726 # <SCRIPT TYPE="text/ssperl" CGI="$name = 'default value'"
727 # [SRC='ScriptSource']>
728 # After such a 'CGI' attribute, you can use $name as an ordinary PERL variable
729 # (the ScriptSource file is immediately evaluated with "do 'ScriptSource'").
730 # The CGIscriptor script allows you to write ordinary HTML files which will
731 # include dynamic CGI aware (run time) features, such as on-line answers
732 # to specific CGI requests, queries, or the results of calculations.
734 # For example, if you wanted to answer questions of clients, you could write
735 # a Perl program called "Answer.pl" with a function "AnswerQuestion()"
736 # that prints out the answer to requests given as arguments. You then write
737 # an HTML page "Respond.html" containing the following fragment:
739 # <center>
740 # The Answer to your question
741 # <META CONTENT="text/ssperl; CGI='$Question'">
742 # <h3><SCRIPT TYPE="text/ssperl">$Question</SCRIPT></h3>
743 # is
744 # <h3><SCRIPT TYPE="text/ssperl" SRC="./PATH/Answer.pl">
745 # AnswerQuestion($Question);
746 # </SCRIPT></h3>
747 # </center>
748 # <FORM ACTION=Respond.html METHOD=GET>
749 # Next question: <INPUT NAME="Question" TYPE=TEXT SIZE=40><br>
750 # <INPUT TYPE=SUBMIT VALUE="Ask">
751 # </FORM>
753 # The output could look like the following (in HTML-speak):
755 # <CENTER>
756 # The Answer to your question
757 # <h3>What is the capital of the Netherlands?</h3>
758 # is
759 # <h3>Amsterdam</h3>
760 # </CENTER>
761 # <FORM ACTION=Respond.html METHOD=GET>
762 # Next question: <INPUT NAME="Question" TYPE=TEXT SIZE=40><br>
763 # <INPUT TYPE=SUBMIT VALUE="Ask">
765 # Note that the function "Answer.pl" does know nothing about CGI or HTML,
766 # it just prints out answers to arguments. Likewise, the text has no
767 # provisions for scripts or CGI like constructs. Also, it is completely
768 # trivial to extend this "program" to use the "Answer" later in the page
769 # to call up other information or pictures/sounds. The final text never
770 # shows any cue as to what the original "source" looked like, i.e.,
771 # where you store your scripts and how they are called.
773 # There are some extra's. The argument of the files called in a SRC= tag
774 # can access the CGI variables declared in the preceding META tag from
775 # the @ARGV array. Executable files are called as:
776 # `file '$ARGV[0]' ... ` (e.g., `Answer.pl \'$Question\'`;)
777 # The files called from SRC can even be (CGIscriptor) html files which are
778 # processed in-line. Furthermore, the SRC= tag can contain a perl block
779 # that is evaluated. That is,
780 # <META CONTENT="text/ssperl; CGI='$Question' SRC='{$Question}'">
781 # will result in the evaluation of "print do {$Question};" and the VALUE
782 # of $Question will be printed. Note that these "SRC-blocks" can be
783 # preceded and followed by other file names, but only a single block is
784 # allowed in a SRC= tag.
786 # One of the major hassles of dynamic WWW pages is the fact that several
787 # mutually incompatible browsers and platforms must be supported. For example,
788 # the way sound is played automatically is different for Netscape and
789 # Internet Explorer, and for each browser it is different again on
790 # Unix, MacOS, and Windows. Realy dangerous is processing user-supplied
791 # (form-) values to construct email addresses, file names, or database
792 # queries. All Apache WWW-server exploits reported in the media are
793 # based on faulty CGI-scripts that didn't check their user-data properly.
795 # There is no panacee for these problems, but a lot of work and problems
796 # can be saved by allowing easy and transparent control over which
797 # <SCRIPT></SCRIPT> blocks are executed on what CGI-data. CGIscriptor
798 # supplies such a method in the form of a pair of attributes:
799 # IF='...condition..' and UNLESS='...condition...'. When added to a
800 # script tag, the whole block (including the SRC attribute) will be
801 # ignored if the condition is false (IF) or true (UNLESS).
802 # For example, the following block will NOT be evaluated if the value
803 # of the CGI variable FILENAME is NOT a valid filename:
805 # <SCRIPT TYPE='text/ssperl' CGI='$FILENAME'
806 # IF='CGIscriptor::CGIsafeFileName($FILENAME)'>
807 # .....
808 # </SCRIPT>
810 # (the function CGIsafeFileName(String) returns an empty string ("")
811 # if the String argument is not a valid filename).
812 # The UNLESS attribute is the mirror image of IF.
814 # A user manual follows the HTML 4 and security paragraphs below.
816 ##########################################################################
818 # HTML 4 compliance
820 # In general, CGIscriptor.pl complies with the HTML 4 recommendations of
821 # the W3C. This means that any software to manage Web sites will be able
822 # to handle CGIscriptor files, as will web agents.
824 # All script code should be placed between <SCRIPT></SCRIPT> tags, the
825 # script type is indicated with TYPE="mime-type", the LANGUAGE
826 # feature is ignored, and a SRC feature is implemented. All CGI specific
827 # features are delegated to the CGI attribute.
829 # However, the behavior deviates from the W3C recommendations at some
830 # points. Most notably:
831 # 0- The scripts are executed at the server side, invissible to the
832 # client (i.e., the browser)
833 # 1- The mime-types are personal and idiosyncratic, but can be adapted.
834 # 2- Code in the body of a <SCRIPT></SCRIPT> tag-pair is still evaluated
835 # when a SRC feature is present.
836 # 3- The SRC attribute reads a list of files.
837 # 4- The files in a SRC attribute are processed according to file type.
838 # 5- The SRC attribute evaluates inline Perl code.
839 # 6- Processed META, DIV, INS tags are removed from the output
840 # document.
841 # 7- All attributes of the processed META tags, except CONTENT, are ignored
842 # (i.e., deleted from the output).
843 # 8- META tags can be placed ANYWHERE in the document.
844 # 9- Through the SRC feature, META tags can have visible output in the
845 # document.
846 # 10- The CGI attribute that declares CGI parameters, can be used
847 # inside the <SCRIPT> tag.
848 # 11- Use of an extended quote set, i.e., '', "", ``, (), {}, []
849 # and their \-slashed combinations: \'\', \"\", \`\`, \(\),
850 # \{\}, \[\].
851 # 12- IF and UNLESS attributes to <SCRIPT>, <META>, <DIV>, <INS> tags.
852 # 13- <DIV> tags cannot be nested, DIV tags are not
853 # rendered with new-lines.
854 # 14- The XML style <TAG .... /> is recognized and handled correctly.
855 # (i.e., no content is processed)
857 # The reasons for these choices are:
858 # You can still write completely HTML4 compliant documents. CGIscriptor
859 # will not force you to write "deviant" code. However, it allows you to
860 # do so (which is, in fact, just as bad). The prime design principle
861 # was to allow users to include plain Perl code. The code itself should
862 # be "enhancement free". Therefore, extra features were needed to
863 # supply easy access to CGI and Web site components. For security
864 # reasons these have to be declared explicitly. The SRC feature
865 # transparently manages access to external files, especially the safe
866 # use of executable files.
867 # The CGI attribute handles the declarations of external (CGI) variables
868 # in the SCRIPT and META tag's.
869 # EVERYTHING THE CGI ATTRIBUTE AND THE META TAG DO CAN BE DONE INSIDE
870 # A <SCRIPT></SCRIPT> TAG CONSTRUCT.
872 # The reason for the IF, UNLESS, and SRC attributes (and their Perl code
873 # evaluation) were build into the META and SCRIPT tags is part laziness,
874 # part security. The SRC blocks allows more compact documents and easier
875 # debugging. The values of the CGI variables can be immediately screened
876 # for security by IF or UNLESS conditions, and even SRC attributes (e.g.,
877 # email addresses and file names), and a few commands can be called
878 # without having to add another Perl TAG pair. This is especially important
879 # for documents that require the use of other (more restricted) "scripting"
880 # languages and facilities that lag transparent control structures.
882 ##########################################################################
884 # SECURITY
886 # Your WWW site is a few keystrokes away from a few hundred million internet
887 # users. A fair percentage of these users knows more about your computer
888 # than you do. And some of these just might have bad intentions.
890 # To ensure uncompromized operation of your server and platform, several
891 # features are incorporated in CGIscriptor.pl to enhance security.
892 # First of all, you should check the source of this program. No security
893 # measures will help you when you download programs from anonymous sources.
894 # If you want to use THIS file, please make sure that it is uncompromized.
895 # The best way to do this is to contact the source and try to determine
896 # whether s/he is reliable (and accountable).
898 # BE AWARE THAT ANY PROGRAMMER CAN CHANGE THIS PROGRAM IN SUCH A WAY THAT
899 # IT WILL SET THE DOORS TO YOUR SYSTEM WIDE OPEN
901 # I would like to ask any user who finds bugs that could compromise
902 # security to report them to me (and any other bug too,
903 # Email: R.J.J.H.vanSon@uva.nl or ifa@hum.uva.nl).
905 # Security features
907 # 1 Invisibility
908 # The inner workings of the HTML source files are completely hidden
909 # from the client. Only the HTTP header and the ever changing content
910 # of the output distinguish it from the output of a plain, fixed HTML
911 # file. Names, structures, and arguments of the "embedded" scripts
912 # are invisible to the client. Error output is suppressed except
913 # during debugging (user configurable).
915 # 2 Separate directory trees
916 # Directories containing Inline text and script files can reside on
917 # separate trees, distinct from those of the HTTP server. This means
918 # that NEITHER the text files, NOR the script files can be read by
919 # clients other than through CGIscriptor.pl, UNLESS they are
920 # EXPLICITELY made available.
922 # 3 Requests are NEVER "evaluated"
923 # All client supplied values are used as literal values (''-quoted).
924 # Client supplied ''-quotes are ALWAYS removed. Therefore, as long as the
925 # embedded scripts do NOT themselves evaluate these values, clients CANNOT
926 # supply executable commands. Be sure to AVOID scripts like:
928 # <META CONTENT="text/ssperl; CGI='$UserValue'">
929 # <SCRIPT TYPE="text/ssperl">$dir = `ls -1 $UserValue`;</SCRIPT>
931 # These are a recipe for disaster. However, the following quoted
932 # form should be save (but is still not adviced):
934 # <SCRIPT TYPE="text/ssperl">$dir = `ls -1 \'$UserValue\'`;</SCRIPT>
936 # A special function, SAFEqx(), will automatically do exactly this,
937 # e.g., SAFEqx('ls -1 $UserValue') will execute `ls -1 \'$UserValue\'`
938 # with $UserValue interpolated. I recommend to use SAFEqx() instead
939 # of backticks whenever you can. The OS shell scripts inside
941 # <SCRIPT TYPE="text/osshell">ls -1 $UserValue</SCRIPT>
943 # are handeld by SAFEqx and automatically ''-quoted.
945 # 4 Logging of requests
946 # All requests can be logged separate from the Host server. The level of
947 # detail is user configurable: Including or excluding the actual queries.
948 # This allows for the inspection of (im-) proper use.
950 # 5 Access control: Clients
951 # The Remote addresses can be checked against a list of authorized
952 # (i.e., accepted) or non-authorized (i.e., rejected) clients. Both
953 # REMOTE_HOST and REMOTE_ADDR are tested so clients without a proper
954 # HOST name can be (in-) excluded by their IP-address. Client patterns
955 # containing all numbers and dots are considered IP-addresses, all others
956 # domain names. No wild-cards or regexp's are allowed, only partial
957 # addresses.
958 # Matching of names is done from the back to the front (domain first,
959 # i.e., $REMOTE_HOST =~ /\Q$pattern\E$/is), so including ".edu" will
960 # accept or reject all clients from the domain EDU. Matching of
961 # IP-addresses is done from the front to the back (domain first, i.e.,
962 # $REMOTE_ADDR =~ /^\Q$pattern\E/is), so including "128." will (in-)
963 # exclude all clients whose IP-address starts with 128.
964 # There are two special symbols: "-" matches HOSTs with no name and "*"
965 # matches ALL HOSTS/clients.
966 # For those needing more expressional power, lines starting with
967 # "-e" are evaluated by the perl eval() function. E.g.,
968 # '-e $REMOTE_HOST =~ /\.edu$/is;' will accept/reject clients from the
969 # domain '.edu'.
971 # 6 Access control: Files
972 # In principle, CGIscriptor could read ANY file in the directory
973 # tree as discussed in 1. However, for security reasons this is
974 # restricted to text files. It can be made more restricted by entering
975 # a global file pattern (e.g., ".html"). This is done by default.
976 # For each client requesting access, the file pattern(s) can be made
977 # more restrictive than the global pattern by entering client specific
978 # file patterns in the Access Control files (see 5).
979 # For example: if the ACCEPT file contained the lines
980 # * DEMO
981 # .hum.uva.nl LET
982 # 145.18.230.
983 # Then all clients could request paths containing "DEMO" or "demo", e.g.
984 # "/my/demo/file.html" ($PATH_INFO =~ /\Q$pattern\E/), Clients from
985 # *.hum.uva.nl could also request paths containing "LET or "let", e.g.
986 # "/my/let/file.html", and clients from the local cluster
987 # 145.18.230.[0-9]+ could access ALL files.
988 # Again, for those needing more expressional power, lines starting with
989 # "-e" are evaluated. For instance:
990 # '-e $REMOTE_HOST =~ /\.edu$/is && $PATH_INFO =~ m@/DEMO/@is;'
991 # will accept/reject requests for files from the directory "/demo/" from
992 # clients from the domain '.edu'.
994 # 7 Access control: Server side session tickets
995 # Specific paths can be controlled by Session Tickets which must be
996 # present as a SESSIONTICKET=<value> CGI variable in the request. These paths
997 # are defined in %TicketRequiredPatterns as pairs of:
998 # ('regexp' => 'SessionPath\tPasswordPath\tLogin.html\tExpiration').
999 # Session Tickets are stored in a separate directory (SessionPath, e.g.,
1000 # "Private/.Session") as files with the exact same name of the SESSIONTICKET
1001 # CGI. The following is an example:
1002 # Type: SESSION
1003 # IPaddress: 127.0.0.1
1004 # AllowedPaths: ^/Private/Name/
1005 # Expires: 3600
1006 # Username: test
1007 # ...
1008 # Other content can follow.
1010 # It is adviced that Session Tickets should be deleted
1011 # after some (idle) time. The IP address should be the IP number at login, and
1012 # the SESSIONTICKET will be rejected if it is presented from another IP address.
1013 # AllowedPaths and DeniedPaths are perl regexps. Be careful how they match. Make sure to delimit
1014 # the names to prevent access to overlapping names, eg, "^/Private/Rob" will also
1015 # match "^/Private/Robert", however, "^/Private/Rob/" will not. Expires is the
1016 # time the ticket will remain valid after creation (file ctime). Time can be given
1017 # in s[econds] (default), m[inutes], h[hours], or d[ays], eg, "24h" means 24 hours.
1018 # None of these need be present, but the Ticket must have a non-zero size.
1020 # Next to Session Tickets, there are two other type of ticket files:
1021 # - LOGIN tickets store information about a current login request
1022 # - PASSWORD ticket store account information to authorize login requests
1024 # 8 Query length limiting
1025 # The length of the Query string can be limited. If CONTENT_LENGTH is larger
1026 # than this limit, the request is rejected. The combined length of the
1027 # Query string and the POST input is checked before any processing is done.
1028 # This will prevent clients from overloading the scripts.
1029 # The actual, combined, Query Size is accessible as a variable through
1030 # $CGI_Content_Length.
1032 # 9 Illegal filenames, paths, and protected directories
1033 # One of the primary security concerns in handling CGI-scripts is the
1034 # use of "funny" characters in the requests that con scripts in executing
1035 # malicious commands. Examples are inserting ';', null bytes, or <newline>
1036 # characters in URL's and filenames, followed by executable commands. A
1037 # special variable $FileAllowedChars stores a string of all allowed
1038 # characters. Any request that translates to a filename with a character
1039 # OUTSIDE this set will be rejected.
1040 # In general, all (readable files) in the DocumentRoot tree are accessible.
1041 # This might not be what you want. For instance, your DocumentRoot directory
1042 # might be the working directory of a CVS project and contain sensitive
1043 # information (e.g., the password to get to the repository). You can block
1044 # access to these subdirectories by adding the corresponding patterns to
1045 # the $BlockPathAccess variable. For instance, $BlockPathAccess = '/CVS/'
1046 # will block any request that contains '/CVS/' or:
1047 # die if $BlockPathAccess && $ENV{'PATH_INFO'} =~ m@$BlockPathAccess@;
1049 #10 The execution of code blocks can be controlled in a transparent way
1050 # by adding IF or UNLESS conditions in the tags themselves. That is,
1051 # a simple check of the validity of filenames or email addresses can
1052 # be done before any code is executed.
1054 ###############################################################################
1056 # USER MANUAL (sort of)
1058 # CGIscriptor removes embedded scripts, indicated by an HTML 4 type
1059 # <SCRIPT TYPE='text/ssperl'> </SCRIPT> or <SCRIPT TYPE='text/osshell'>
1060 # </SCRIPT> constructs. CGIscriptor also recognizes XML-type
1061 # <SCRIPT TYPE='text/ssperl'/> constructs. These are usefull when
1062 # the necessary code is already available in the TAG itself (e.g.,
1063 # using external files). The contents of the directive are executed by
1064 # the PERL eval() and `` functions (in a separate name space). The
1065 # result of the eval() function replaces the <SCRIPT> </SCRIPT> construct
1066 # in the output file. You can use the values that are delivered in
1067 # CGI-compliant form (i.e., the "?name=value&.." type URL additions)
1068 # transparently as "$name" variables in your directives after they are
1069 # defined in a <META> or <SCRIPT> tag.
1070 # If you define the variable "$CGIscriptorResults" in a CGI attribute, all
1071 # subsequent <SCRIPT> and <META> results (including the defining
1072 # tag) will also be pushed onto a stack: @CGIscriptorResults. This list
1073 # behaves like any other, ordinary list and can be manipulated.
1075 # Both GET and POST requests are accepted. These two methods are treated
1076 # equal. Variables, i.e., those values that are determined when a file is
1077 # processed, are indicated in the CGI attribute by $<name> or $<name>=<default>
1078 # in which <name> is the name of the variable and <default> is the value
1079 # used when there is NO current CGI value for <name> (you can use
1080 # white-spaces in $<name>=<default> but really DO make sure that the
1081 # default value is followed by white space or is quoted). Names can contain
1082 # any alphanumeric characters and _ (i.e., names match /[\w]+/).
1083 # If the Content-type: is 'multipart/*', the input is treated as a
1084 # MIME multipart message and automatically delimited. CGI variables get
1085 # the "raw" (i.e., undecoded) body of the corresponding message part.
1087 # Variables can be CGI variables, i.e., those from the QUERY_STRING,
1088 # environment variables, e.g., REMOTE_USER, REMOTE_HOST, or REMOTE_ADDR,
1089 # or predefined values, e.g., CGI_Decoded_QS (The complete, decoded,
1090 # query string), CGI_Content_Length (the length of the decoded query
1091 # string), CGI_Year, CGI_Month, CGI_Time, and CGI_Hour (the current
1092 # date and time).
1094 # All these are available when defined in a CGI attribute. All environment
1095 # variables are accessible as $ENV{'name'}. So, to access the REMOTE_HOST
1096 # and the REMOTE_USER, use, e.g.:
1098 # <SCRIPT TYPE='text/ssperl'>
1099 # ($ENV{'REMOTE_HOST'}||"-")." $ENV{'REMOTE_USER'}"
1100 # </SCRIPT>
1102 # (This will print a "-" if REMOTE_HOST is not known)
1103 # Another way to do this is:
1105 # <META CONTENT="text/ssperl; CGI='$REMOTE_HOST = - $REMOTE_USER'">
1106 # <SCRIPT TYPE='text/ssperl'>"$REMOTE_HOST $REMOTE_USER"</SCRIPT>
1107 # or
1108 # <META CONTENT='text/ssperl; CGI="$REMOTE_HOST = - $REMOTE_USER"
1109 # SRC={"$REMOTE_HOST $REMOTE_USER\n"}'>
1111 # This is possible because ALL environment variables are available as
1112 # CGI variables. The environment variables take precedence over CGI
1113 # names in case of a "name clash". For instance:
1114 # <META CONTENT="text/ssperl; CGI='$HOME' SRC={$HOME}">
1115 # Will print the current HOME directory (environment) irrespective whether
1116 # there is a CGI variable from the query
1117 # (e.g., Where do you live? <INPUT TYPE="TEXT" NAME="HOME">)
1118 # THIS IS A SECURITY FEATURE. It prevents clients from changing
1119 # the values of defined environment variables (e.g., by supplying
1120 # a bogus $REMOTE_ADDR). Although $ENV{} is not changed by the META tags,
1121 # it would make the use of declared variables insecure. You can still
1122 # access CGI variables after a name clash with
1123 # CGIscriptor::CGIparseValue(<name>).
1125 # Some CGI variables are present several times in the query string
1126 # (e.g., from multiple selections). These should be defined as
1127 # @VARIABLENAME=default in the CGI attribute. The list @VARIABLENAME
1128 # will contain ALL VARIABLENAME values from the query, or a single
1129 # default value. If there is an ENVIRONMENT variable of the
1130 # same name, it will be used instead of the default AND the query
1131 # values. The corresponding function is
1132 # CGIscriptor::CGIparseValueList(<name>)
1134 # CGI variables collected in a @VARIABLENAME list are unordered.
1135 # When more structured variables are needed, a hash table can be used.
1136 # A variable defined as %VARIABLE=default will collect all
1137 # CGI-parameters whose name start with 'VARIABLE' in a hash table with
1138 # the remainder of the name as a key. For instance, %PERSON will
1139 # collect PERSONname='John Doe', PERSONbirthdate='01 Jan 00', and
1140 # PERSONspouse='Alice' into a hash table %PERSON such that $PERSON{'spouse'}
1141 # equals 'Alice'. Any default value or environment value will be stored
1142 # under the "" key. If there is an ENVIRONMENT variable of the same name,
1143 # it will be used instead of the default AND the query values. The
1144 # corresponding function is CGIscriptor::CGIparseValueHash(<name>)
1146 # This method of first declaring your environment and CGI variables
1147 # before being able to use them in the scripts might seem somewhat
1148 # clumsy, but it protects you from inadvertedly printing out the values of
1149 # system environment variables when their names coincide with those used
1150 # in the CGI forms. It also prevents "clients" from supplying CGI
1151 # parameter values for your private variables.
1152 # THIS IS A SECURITY FEATURE!
1155 # NON-HTML CONTENT TYPES
1157 # Normally, CGIscriptor prints the standard "Content-type: text/html\n\n"
1158 # message before anything is printed. This has been extended to include
1159 # plain text (.txt) files, for which the Content-type (MIME type)
1160 # 'text/plain' is printed. In all other respects, text files are treated
1161 # as HTML files (this can be switched off by removing '.txt' from the
1162 # $FilePattern variable) . When the content type should be something else,
1163 # e.g., with multipart files, use the $RawFilePattern (.xmr, see also next
1164 # item). CGIscriptor will not print a Content-type message for this file
1165 # type (which must supply its OWN Content-type message). Raw files must
1166 # still conform to the <SCRIPT></SCRIPT> and <META> tag specifications.
1169 # NON-HTML FILES
1171 # CGIscriptor is intended to process HTML and text files only. You can
1172 # create documents of any mime-type on-the-fly using "raw" text files,
1173 # e.g., with the .xmr extension. However, CGIscriptor will not process
1174 # binary files of any type, e.g., pictures or sounds. Given the sheer
1175 # number of formats, I do not have any intention to do so. However,
1176 # an escape route has been provided. You can construct a genuine raw
1177 # (.xmr) text file that contains the perl code to service any file type
1178 # you want. If the global $BinaryMapFile variable contains the path to
1179 # this file (e.g., /BinaryMapFile.xmr), this file will be called
1180 # whenever an unsupported (non-HTML) file type is requested. The path
1181 # to the requested binary file is stored in $ENV('CGI_BINARY_FILE')
1182 # and can be used like any other CGI-variable. Servicing binary files
1183 # then becomes supplying the correct Content-type (e.g., print
1184 # "Content-type: image/jpeg\n\n";) and reading the file and writing it
1185 # to STDOUT (e.g., using sysread() and syswrite()).
1188 # THE META TAG
1190 # All attributes of a META tag are ignored, except the
1191 # CONTENT='text/ssperl; CGI=" ... " [SRC=" ... "]' attribute. The string
1192 # inside the quotes following the CONTENT= indication (white-space is
1193 # ignored, "" '' `` (){}[]-quote pairs are allowed, plus their \ versions)
1194 # MUST start with any of the CGIscriptor mime-types (e.g.: text/ssperl or
1195 # text/osshell) and a comma or semicolon.
1196 # The quoted string following CGI= contains a white-space separated list
1197 # of declarations of the CGI (and Environment) values and default values
1198 # used when no CGI values are supplied by the query string.
1200 # If the default value is a longer string containing special characters,
1201 # possibly spanning several lines, the string must be enclosed in quotes.
1202 # You may use any pair of quotes or brackets from the list '', "", ``, (),
1203 # [], or {} to distinguish default values (or preceded by \, e.g., \(...\)
1204 # is different from (...)). The outermost pair will always be used and any
1205 # other quotes inside the string are considered to be part of the string
1206 # value, e.g.,
1208 # $Value = {['this'
1209 # "and" (this)]}
1210 # will result in $Value getting the default value: ['this'
1211 # "and" (this)]
1212 # (NOTE that the newline is part of the default value!).
1214 # Internally, for defining and initializing CGI (ENV) values, the META
1215 # and SCRIPT tags use the functions "defineCGIvariable($name, $default)"
1216 # (scalars) and "defineCGIvariableList($name, $default)" (lists).
1217 # These functions can be used inside scripts as
1218 # "CGIscriptor::defineCGIvariable($name, $default)" and
1219 # "CGIscriptor::defineCGIvariableList($name, $default)".
1220 # "CGIscriptor::defineCGIvariableHash($name, $default)".
1222 # The CGI attribute will be processed exactly identical when used inside
1223 # the <SCRIPT> tag. However, this use is not according to the
1224 # HTML 4.0 specifications of the W3C.
1227 # THE DIV/INS TAGS
1229 # There is a problem when constructing html files containing
1230 # server-side perl scripts with standard HTML tools. These
1231 # tools will refuse to process any text between <SCRIPT></SCRIPT>
1232 # tags. This is quite annoying when you want to use large
1233 # HTML templates where you will fill in values.
1235 # For this purpose, CGIscriptor will read the neutral
1236 # <DIV CLASS="ssperl" ID="varname"></DIV> or
1237 # <INS CLASS="ssperl" ID="varname"></INS>
1238 # tag (in Cascading Style Sheet manner) Note that
1239 # "varname" has NO '$' before it, it is a bare name.
1240 # Any text between these <DIV ...></DIV> or
1241 # <INS ...></INS>tags will be assigned to '$varname'
1242 # as is (e.g., as a literal).
1243 # No processing or interpolation will be performed.
1244 # There is also NO nesting possible. Do NOT nest a
1245 # </DIV> inside a <DIV></DIV>! Moreover, neither INS nor
1246 # DIV tags do ensure a block structure in the final
1247 # rendering (i.e., no empty lines).
1249 # Note that <DIV CLASS="ssperl" ID="varname"/>
1250 # is handled the XML way. No content is processed,
1251 # but varname is defined, and any SRC directives are
1252 # processed.
1254 # You can use $varname like any other variable name.
1255 # However, $varname is NOT a CGI variable and will be
1256 # completely internal to your script. There is NO
1257 # interaction between $varname and the outside world.
1259 # To interpolate a DIV derived text, you can use:
1260 # $varname =~ s/([\]])/\\\1/g; # Mark ']'-quotes
1261 # $varname = eval("qq[$varname]"); # Interpolate all values
1263 # The DIV tags will process IF, UNLESS, CGI and
1264 # SRC attributes. The SRC files will be pre-pended to the
1265 # body text of the tag. SRC blocks are NOT executed.
1267 # CONDITIONAL PROCESSING: THE 'IF' AND 'UNLESS' ATTRIBUTES
1269 # It is often necessary to include code-blocks that should be executed
1270 # conditionally, e.g., only for certain browsers or operating system.
1271 # Furthermore, quite often sanity and security checks are necessary
1272 # before user (form) data can be processed, e.g., with respect to
1273 # email addresses and filenames.
1275 # Checks added to the code are often difficult to find, interpret or
1276 # maintain and in general mess up the code flow. This kind of confussion
1277 # is dangerous.
1278 # Also, for many of the supported "foreign" scripting languages, adding
1279 # these checks is cumbersome or even impossible.
1281 # As a uniform method for asserting the correctness of "context", two
1282 # attributes are added to all supported tags: IF and UNLESS.
1283 # They both evaluate their value and block execution when the
1284 # result is <FALSE> (IF) or <TRUE> (UNLESS) in Perl, e.g.,
1285 # UNLESS='$NUMBER \> 100;' blocks execution if $NUMBER <= 100. Note that
1286 # the backslash in the '\>' is removed and only used to differentiate
1287 # this conditional '>' from the tag-closing '>'. For symmetry, the
1288 # backslash in '\<' is also removed. Inside these conditionals,
1289 # ~/ and ./ are expanded to their respective directory root paths.
1291 # For example, the following tag will be ignored when the filename is
1292 # invalid:
1294 # <SCRIPT TYPE='text/ssperl' CGI='$FILENAME'
1295 # IF='CGIscriptor::CGIsafeFileName($FILENAME);'>
1296 # ...
1297 # </SCRIPT>
1299 # The IF and UNLESS values must be quoted. The same quotes are supported
1300 # as with the other attributes. The SRC attribute is ignored when IF and
1301 # UNLESS block execution.
1303 # NOTE: 'IF' and 'UNLESS' always evaluate perl code.
1306 # THE MAGIC SOURCE ATTRIBUTE (SRC=)
1308 # The SRC attribute inside tags accepts a list of filenames and URL's
1309 # separated by "," comma's (or ";" semicolons).
1310 # ALL the variable values defined in the CGI attribute are available
1311 # in @ARGV as if the file or block was executed from the command line,
1312 # in the exact order in which they were declared in the preceding CGI
1313 # attribute.
1315 # First, a SRC={}-block will be evaluated as if the code inside the
1316 # block was part of a <SCRIPT></SCRIPT> construct, i.e.,
1317 # "print do { code };'';" or `code` (i.e., SAFEqx('code)).
1318 # Only a single block is evaluated. Note that this is processed less
1319 # efficiently than <SCRIPT> </SCRIPT> blocks. Type of evaluation
1320 # depends on the content-type: Perl for text/ssperl and OS shell for
1321 # text/osshell. For other mime types (scripting languages), anything in
1322 # the source block is put in front of the code block "inside" the tag.
1324 # Second, executable files (i.e., -x filename != 0) are evaluated as:
1325 # print `filename \'$ARGV[0]\' \'$ARGV[1]\' ...`
1326 # That is, you can actually call executables savely from the SRC tag.
1328 # Third, text files that match the file pattern, used by CGIscriptor to
1329 # check whether files should be processed ($FilePattern), are
1330 # processed in-line (i.e., recursively) by CGIscriptor as if the code
1331 # was inserted in the original source file. Recursions, i.e., calling
1332 # a file inside itself, are blocked. If you need them, you have to code
1333 # them explicitely using "main::ProcessFile($file_path)".
1335 # Fourth, Perl text files (i.e., -T filename != 0) are evaluated as:
1336 # "do FileName;'';".
1338 # Last, URL's (i.e., starting with 'HTTP://', 'FTP://', 'GOPHER://',
1339 # 'TELNET://', 'WHOIS://' etc.) are loaded
1340 # and printed. The loading and handling of <BASE> and document header
1341 # is done by a command generated by main::GET_URL($URL [, 0]). You can enter your
1342 # own code (default is curl, wget, or snarf and some post-processing to add a <BASE> tag).
1344 # There are two pseudo-file names: PREFIX and POSTFIX. These implement
1345 # a switch from prefixing the SRC code/files (PREFIX, default) before the
1346 # content of the tag to appending the code after the content of the tag
1347 # (POSTFIX). The switches are done in the order in which the PREFIX and
1348 # POSTFIX labels are encountered. You can mix PREFIX and POSTFIX labels
1349 # in any order with the SRC files. Note that the ORDER of file execution
1350 # is determined for prefixed and postfixed files seperately.
1352 # File paths can be preceded by the URL protocol prefix "file://". This
1353 # is simply STRIPPED from the name.
1355 # Example:
1356 # The request
1357 # "http://cgi-bin/Action_Forms.pl/Statistics/Sign_Test.html?positive=8&negative=22
1358 # will result in printing "${SS_PUB}/Statistics/Sign_Test.html"
1359 # With QUERY_STRING = "positive=8&negative=22"
1361 # on encountering the lines:
1362 # <META CONTENT="text/osshell; CGI='$positive=11 $negative=3'">
1363 # <b><SCRIPT LANGUAGE=PERL TYPE="text/ssperl" SRC="./Statistics/SignTest.pl">
1364 # </SCRIPT></b><p>"
1366 # This line will be processed as:
1367 # "<b>`${SS_SCRIPT}/Statistics/SignTest.pl '8' '22'`</b><p>"
1369 # In which "${SS_SCRIPT}/Statistics/SignTest.pl" is an executable script,
1370 # This line will end up printed as:
1371 # "<b>p <= 0.0161</b><p>"
1373 # Note that the META tag itself will never be printed, and is invisible to
1374 # the outside world.
1376 # The SRC files in a DIV or INS tag will be added (pre-pended) to the body
1377 # of the <DIV></DIV> tag. Blocks are NOT executed! If you do not
1378 # need any content, you can use the <DIV...../> format.
1381 # THE CGISCRIPTOR ROOT DIRECTORIES ~/ AND ./
1383 # Inside <SCRIPT></SCRIPT> tags, filepaths starting
1384 # with "~/" are replaced by "$YOUR_HTML_FILES/", this way files in the
1385 # public directories can be accessed without direct reference to the
1386 # actual paths. Filepaths starting with "./" are replaced by
1387 # "$YOUR_SCRIPTS/" and this should only be used for scripts.
1389 # Note: this replacement can seriously affect Perl scripts. Watch
1390 # out for constructs like $a =~ s/aap\./noot./g, use
1391 # $a =~ s@aap\.@noot.@g instead.
1393 # CGIscriptor.pl will assign the values of $SS_PUB and $SS_SCRIPT
1394 # (i.e., $YOUR_HTML_FILES and $YOUR_SCRIPTS) to the environment variables
1395 # $SS_PUB and $SS_SCRIPT. These can be accessed by the scripts that are
1396 # executed.
1397 # Values not preceded by $, ~/, or ./ are used as literals
1400 # OS SHELL SCRIPT EVALUATION (CONTENT-TYPE=TEXT/OSSHELL)
1402 # OS scripts are executed by a "safe" version of the `` operator (i.e.,
1403 # SAFEqx(), see also below) and any output is printed. CGIscriptor will
1404 # interpolate the script and replace all user-supplied CGI-variables by
1405 # their ''-quoted values (actually, all variables defined in CGI attributes
1406 # are quoted). Other Perl variables are interpolated in a simple fasion,
1407 # i.e., $scalar by their value, @list by join(' ', @list), and %hash by
1408 # their name=value pairs. Complex references, e.g., @$variable, are all
1409 # evaluated in a scalar context. Quotes should be used with care.
1410 # NOTE: the results of the shell script evaluation will appear in the
1411 # @CGIscriptorResults stack just as any other result.
1412 # All occurrences of $@% that should NOT be interpolated must be
1413 # preceeded by a "\". Interpolation can be switched off completely by
1414 # setting $CGIscriptor::NoShellScriptInterpolation = 1
1415 # (set to 0 or undef to switch interpolation on again)
1416 # i.e.,
1417 # <SCRIPT TYPE="text/ssperl">
1418 # $CGIscriptor::NoShellScriptInterpolation = 1;
1419 # </SCRIPT>
1422 # RUN TIME TRANSLATION OF INPUT FILES
1424 # Allows general and global conversions of files using Regular Expressions.
1425 # Very handy (but costly) to rewrite legacy pages to a new format.
1426 # Select files to use it on with
1427 # my $TranslationPaths = 'filepattern';
1428 # This is costly. For efficiency, define:
1429 # $TranslationPaths = ''; when not using translations.
1430 # Accepts general regular expressions: [$pattern, $replacement]
1432 # Define:
1433 # my $TranslationPaths = 'filepattern'; # Pattern matching PATH_INFO
1435 # push(@TranslationTable, ['pattern', 'replacement']);
1436 # e.g. (for Ruby Rails):
1437 # push(@TranslationTable, ['<%=', '<SCRIPT TYPE="text/ssruby">']);
1438 # push(@TranslationTable, ['%>', '</SCRIPT>']);
1440 # Runs:
1441 # my $currentRegExp;
1442 # foreach $currentRegExp (@TranslationTable)
1444 # my ($pattern, $replacement) = @$currentRegExp;
1445 # $$text =~ s!$pattern!$replacement!msg;
1446 # };
1449 # EVALUATION OF OTHER SCRIPTING LANGUAGES
1451 # Adding a MIME-type and an interpreter command to
1452 # %ScriptingLanguages automatically will catch any other
1453 # scripting language in the standard
1454 # <SCRIPT TYPE="[mime]"></SCRIPT> manner.
1455 # E.g., adding: $ScriptingLanguages{'text/sspython'} = 'python';
1456 # will actually execute the folowing code in an HTML page
1457 # (ignore 'REMOTE_HOST' for the moment):
1458 # <SCRIPT TYPE="text/sspython">
1459 # # A Python script
1460 # x = ["A","real","python","script","Hello","World","and", REMOTE_HOST]
1461 # print x[4:8] # Prints the list ["Hello","World","and", REMOTE_HOST]
1462 # </SCRIPT>
1464 # The script code is NOT interpolated by perl, EXCEPT for those
1465 # interpreters that cannot handle variables themselves.
1466 # Currently, several interpreters are pre-installed:
1468 # Perl test - "text/testperl" => 'perl',
1469 # Python - "text/sspython" => 'python',
1470 # Ruby - "text/ssruby" => 'ruby',
1471 # Tcl - "text/sstcl" => 'tcl',
1472 # Awk - "text/ssawk" => 'awk -f-',
1473 # Gnu Lisp - "text/sslisp" => 'rep | tail +5 '.
1474 # "| egrep -v '> |^rep. |^nil\\\$'",
1475 # XLispstat - "text/xlispstat" => 'xlispstat | tail +7 '.
1476 # "| egrep -v '> \\\$|^NIL'",
1477 # Gnu Prolog- "text/ssprolog" => 'gprolog',
1478 # M4 macro's- "text/ssm4" => 'm4',
1479 # Born shell- "text/sh" => 'sh',
1480 # Bash - "text/bash" => 'bash',
1481 # C-shell - "text/csh" => 'csh',
1482 # Korn shell- "text/ksh" => 'ksh',
1483 # Praat - "text/sspraat" => "praat - | sed 's/Praat > //g'",
1484 # R - "text/ssr" => "R --vanilla --slave | sed 's/^[\[0-9\]*] //g'",
1485 # REBOL - "text/ssrebol" =>
1486 # "rebol --quiet|egrep -v '^[> ]* == '|sed 's/^\s*\[> \]* //g'",
1487 # PostgreSQL- "text/postgresql" => 'psql 2>/dev/null',
1488 # (psql)
1490 # Note that the "value" of $ScriptingLanguages{mime} must be a command
1491 # that reads Standard Input and writes to standard output. Any extra
1492 # output of interactive interpreters (banners, echo's, prompts)
1493 # should be removed by piping the output through 'tail', 'grep',
1494 # 'sed', or even 'awk' or 'perl'.
1496 # For access to CGI variables there is a special hashtable:
1497 # %ScriptingCGIvariables.
1498 # CGI variables can be accessed in three ways.
1499 # 1. If the mime type is not present in %ScriptingCGIvariables,
1500 # nothing is done and the script itself should parse the relevant
1501 # environment variables.
1502 # 2. If the mime type IS present in %ScriptingCGIvariables, but it's
1503 # value is empty, e.g., $ScriptingCGIvariables{"text/sspraat"} = '';,
1504 # the script text is interpolated by perl. That is, all $var, @array,
1505 # %hash, and \-slashes are replaced by their respective values.
1506 # 3. In all other cases, the CGI and environment variables are added
1507 # in front of the script according to the format stored in
1508 # %ScriptingCGIvariables. That is, the following (pseudo-)code is
1509 # executed for each CGI- or Environment variable defined in the CGI-tag:
1510 # printf(INTERPRETER, $ScriptingCGIvariables{$mime}, $CGI_NAME, $CGI_VALUE);
1512 # For instance, "text/testperl" => '$%s = "%s";' defines variable
1513 # definitions for Perl, and "text/sspython" => '%s = "%s"' for Python
1514 # (note that these definitions are not save, the real ones contain '-quotes).
1516 # THIS WILL NOT WORK FOR @VARIABLES, the (empty) $VARIABLES will be used
1517 # instead.
1519 # The $CGI_VALUE parameters are "shrubed" of all control characters
1520 # and quotes (by &shrubCGIparameter($CGI_VALUE)) for the options 2 and 3.
1521 # Control characters are replaced by \0<octal ascii value> (the exception
1522 # is \015, the newline, which is replaced by \n) and quotes
1523 # and backslashes by their HTML character
1524 # value (' -> &#39; ` -> &#96; " -> &quot; \ -> &#92; & -> &amper;).
1525 # For example:
1526 # if a client would supply the string value (in standard perl, e.g.,
1527 # \n means <newline>)
1528 # "/dev/null';\nrm -rf *;\necho '"
1529 # it would be processed as
1530 # '/dev/null&#39;;\nrm -rf *;\necho &#39;'
1531 # (e.g., sh or bash would process the latter more according to your
1532 # intentions).
1533 # If your intepreter requires different protection measures, you will
1534 # have to supply these in %main::SHRUBcharacterTR (string => translation),
1535 # e.g., $SHRUBcharacterTR{"\'"} = "&#39;";
1537 # Currently, the following definitions are used:
1538 # %ScriptingCGIvariables = (
1539 # "text/testperl" => "\$\%s = '\%s';", # Perl $VAR = 'value' (for testing)
1540 # "text/sspython" => "\%s = '\%s'", # Python VAR = 'value'
1541 # "text/ssruby" => '@%s = "%s"', # Ruby @VAR = "value"
1542 # "text/sstcl" => 'set %s "%s"', # TCL set VAR "value"
1543 # "text/ssawk" => '%s = "%s";', # Awk VAR = "value";
1544 # "text/sslisp" => '(setq %s "%s")', # Gnu lisp (rep) (setq VAR "value")
1545 # "text/xlispstat" => '(setq %s "%s")', # Xlispstat (setq VAR "value")
1546 # "text/ssprolog" => '', # Gnu prolog (interpolated)
1547 # "text/ssm4" => "define(`\%s', `\%s')", # M4 macro's define(`VAR', `value')
1548 # "text/sh" => "\%s='\%s';", # Born shell VAR='value';
1549 # "text/bash" => "\%s='\%s';", # Born again shell VAR='value';
1550 # "text/csh" => "\$\%s = '\%s';", # C shell $VAR = 'value';
1551 # "text/ksh" => "\$\%s = '\%s';", # Korn shell $VAR = 'value';
1552 # "text/sspraat" => '', # Praat (interpolation)
1553 # "text/ssr" => '%s <- "%s";', # R VAR <- "value";
1554 # "text/ssrebol" => '%s: copy "%s"', # REBOL VAR: copy "value"
1555 # "text/postgresql" => '', # PostgreSQL (interpolation)
1556 # "" => ""
1557 # );
1559 # Four tables allow fine-tuning of interpreter with code that should be
1560 # added before and after each code block:
1562 # Code added before each script block
1563 # %ScriptingPrefix = (
1564 # "text/testperl" => "\# Prefix Code;", # Perl script testing
1565 # "text/ssm4" => 'divert(0)' # M4 macro's (open STDOUT)
1566 # );
1567 # Code added at the end of each script block
1568 # %ScriptingPostfix = (
1569 # "text/testperl" => "\# Postfix Code;", # Perl script testing
1570 # "text/ssm4" => 'divert(-1)' # M4 macro's (block STDOUT)
1571 # );
1572 # Initialization code, inserted directly after opening (NEVER interpolated)
1573 # %ScriptingInitialization = (
1574 # "text/testperl" => "\# Initialization Code;", # Perl script testing
1575 # "text/ssawk" => 'BEGIN {', # Server Side awk scripts
1576 # "text/sslisp" => '(prog1 nil ', # Lisp (rep)
1577 # "text/xlispstat" => '(prog1 nil ', # xlispstat
1578 # "text/ssm4" => 'divert(-1)' # M4 macro's (block STDOUT)
1579 # );
1580 # Cleanup code, inserted before closing (NEVER interpolated)
1581 # %ScriptingCleanup = (
1582 # "text/testperl" => "\# Cleanup Code;", # Perl script testing
1583 # "text/sspraat" => 'Quit',
1584 # "text/ssawk" => '};', # Server Side awk scripts
1585 # "text/sslisp" => '(princ "\n" standard-output)).' # Closing print to rep
1586 # "text/xlispstat" => '(print "" *standard-output*)).' # Closing print to xlispstat
1587 # "text/postgresql" => '\q',
1588 # );
1591 # The SRC attribute is NOT magical for these interpreters. In short,
1592 # all code inside a source file or {} block is written verbattim
1593 # to the interpreter. No (pre-)processing or executional magic is done.
1595 # A serious shortcomming of the described mechanism for handling other
1596 # (scripting) languages, with respect to standard perl scripts
1597 # (i.e., 'text/ssperl'), is that the code is only executed when
1598 # the pipe to the interpreter is closed. So the pipe has to be
1599 # closed at the end of each block. This means that the state of the
1600 # interpreter (e.g., all variable values) is lost after the closing of
1601 # the next </SCRIPT> tag. The standard 'text/ssperl' scripts retain
1602 # all values and definitions.
1604 # APPLICATION MIME TYPES
1606 # To ease some important auxilliary functions from within the
1607 # html pages I have added them as MIME types. This uses
1608 # the mechanism that is also used for the evaluation of
1609 # other scripting languages, with interpolation of CGI
1610 # parameters (and perl-variables). Actually, these are
1611 # defined exactly like any other "scripting language".
1613 # text/ssdisplay: display some (HTML) text with interpolated
1614 # variables (uses `cat`).
1615 # text/sslogfile: write (append) the interpolated block to the file
1616 # mentioned on the first, non-empty line
1617 # (the filename can be preceded by 'File: ',
1618 # note the space after the ':',
1619 # uses `awk .... >> <filename>`).
1620 # text/ssmailto: send email directly from within the script block.
1621 # The first line of the body must contain
1622 # To:Name@Valid.Email.Address
1623 # (note: NO space between 'To:' and the email adres)
1624 # For other options see the mailto man pages.
1625 # It works by directly sending the (interpolated)
1626 # content of the text block to a pipe into the
1627 # Linux program 'mailto'.
1629 # In these script blocks, all Perl variables will be
1630 # replaced by their values. All CGI variables are cleaned before
1631 # they are used. These CGI variables must be redefined with a
1632 # CGI attribute to restore their original values.
1633 # In general, this will be more secure than constructing
1634 # e.g., your own email command lines. For instance, Mailto will
1635 # not execute any odd (forged) email addres, but just stops
1636 # when the email address is invalid and awk will construct
1637 # any filename you give it (e.g. '<File;rm\\\040-f' would end up
1638 # as a "valid" UNIX filename). Note that it will also gladly
1639 # store this file anywhere (/../../../etc/passwd will work!).
1640 # Use the CGIscriptor::CGIsafeFileName() function to clean the
1641 # filename.
1643 # SHELL SCRIPT PIPING
1645 # If a shell script starts with the UNIX style "#! <shell command> \n"
1646 # line, the rest of the shell script is piped into the indicated command,
1647 # i.e.,
1648 # open(COMMAND, "| command");print COMMAND $RestOfScript;
1650 # In many ways this is equivalent to the MIME-type profiling for
1651 # evaluating other scripting languages as discussed above. The
1652 # difference breaks down to convenience. Shell script piping is a
1653 # "raw" implementation. It allows you to control all aspects of
1654 # execution. Using the MIME-type profiling is easier, but has a
1655 # lot of defaults built in that might get in the way. Another
1656 # difference is that shell script piping uses the SAFEqx() function,
1657 # and MIME-type profiling does not.
1659 # Execution of shell scripts is under the control of the Perl Script blocks
1660 # in the document. The MIME-type triggered execution of <SCRIPT></SCRIPT>
1661 # blocks can be simulated easily. You can switch to a different shell,
1662 # e.g. tcl, completely by executing the following Perl commands inside
1663 # your document:
1665 # <SCRIPT TYPE="text/ssperl">
1666 # $main::ShellScriptContentType = "text/ssTcl"; # Yes, you can do this
1667 # CGIscriptor::RedirectShellScript('/usr/bin/tcl'); # Pipe to Tcl
1668 # $CGIscriptor::NoShellScriptInterpolation = 1;
1669 # </SCRIPT>
1671 # After this script is executed, CGIscriptor will parse scripts of
1672 # TYPE="text/ssTcl" and pipe their contents into '|/usr/bin/tcl'
1673 # WITHOUT interpolation (i.e., NO substitution of Perl variables).
1674 # The crucial function is :
1675 # CGIscriptor::RedirectShellScript('/usr/bin/tcl')
1676 # After executing this function, all shell scripts AND all
1677 # calls to SAFEqx()) are piped into '|/usr/bin/tcl'. If the argument
1678 # of RedirectShellScript is empty, e.g., '', the original (default)
1679 # value is reset.
1681 # The standard output, STDOUT, of any pipe is send to the client.
1682 # Currently, you should be carefull with quotes in such a piped script.
1683 # The results of a pipe is NOT put on the @CGIscriptorResults stack.
1684 # As a result, you do not have access to the output of any piped (#!)
1685 # process! If you want such access, execute
1686 # <SCRIPT TYPE="text/osshell">echo "script"|command</SCRIPT>
1687 # or
1688 # <SCRIPT TYPE="text/ssperl">
1689 # $resultvar = SAFEqx('echo "script"|command');
1690 # </SCRIPT>.
1692 # Safety is never complete. Although SAFEqx() prevents some of the
1693 # most obvious forms of attacks and security slips, it cannot prevent
1694 # them all. Especially, complex combinations of quotes and intricate
1695 # variable references cannot be handled safely by SAFEqx. So be on
1696 # guard.
1699 # PERL CODE EVALUATION (CONTENT-TYPE=TEXT/SSPERL)
1701 # All PERL scripts are evaluated inside a PERL package. This package
1702 # has a separate name space. This isolated name space protects the
1703 # CGIscriptor.pl program against interference from user code. However,
1704 # some variables, e.g., $_, are global and cannot be protected. You are
1705 # advised NOT to use such global variable names. You CAN write
1706 # directives that directly access the variables in the main program.
1707 # You do so at your own risk (there is definitely enough rope available
1708 # to hang yourself). The behavior of CGIscriptor becomes undefined if
1709 # you change its private variables during run time. The PERL code
1710 # directives are used as in:
1711 # $Result = eval($directive); print $Result;'';
1712 # ($directive contains all text between <SCRIPT></SCRIPT>).
1713 # That is, the <directive> is treated as ''-quoted string and
1714 # the result is treated as a scalar. To prevent the VALUE of the code
1715 # block from appearing on the client's screen, end the directive with
1716 # ';""</SCRIPT>'. Evaluated directives return the last value, just as
1717 # eval(), blocks, and subroutines, but only as a scalar.
1719 # IMPORTANT: All PERL variables defined are persistent. Each <SCRIPT>
1720 # </SCRIPT> construct is evaluated as a {}-block with associated scope
1721 # (e.g., for "my $var;" declarations). This means that values assigned
1722 # to a PERL variable can be used throughout the document unless they
1723 # were declared with "my". The following will actually work as intended
1724 # (note that the ``-quotes in this example are NOT evaluated, but used
1725 # as simple quotes):
1727 # <META CONTENT="text/ssperl; CGI=`$String='abcdefg'`">
1728 # anything ...
1729 # <SCRIPT TYPE=text/ssperl>@List = split('', $String);</SCRIPT>
1730 # anything ...
1731 # <SCRIPT TYPE=text/ssperl>join(", ", @List[1..$#List]);</SCRIPT>
1733 # The first <SCRIPT TYPE=text/ssperl></SCRIPT> construct will return the
1734 # value scalar(@List), the second <SCRIPT TYPE=text/ssperl></SCRIPT>
1735 # construct will print the elements of $String separated by commas, leaving
1736 # out the first element, i.e., $List[0].
1738 # Another warning: './' and '~/' are ALWAYS replaced by the values of
1739 # $YOUR_SCRIPTS and $YOUR_HTML_FILES, respectively . This can interfere
1740 # with pattern matching, e.g., $a =~ s/aap\./noot\./g will result in the
1741 # evaluations of $a =~ s/aap\\${YOUR_SCRIPTS}noot\\${YOUR_SCRIPTS}g. Use
1742 # s@<regexp>.@<replacement>.@g instead.
1745 # SERVER SIDE SESSIONS AND ACCESS CONTROL (LOGIN)
1747 # An infrastructure for user acount authorization and file access control
1748 # is available. Each request is matched against a list of URL path patterns.
1749 # If the request matches, a Session Ticket is required to access the URL.
1750 # This Session Ticket should be present as a CGI parameter or Cookie, eg:
1752 # CGI: SESSIONTICKET=&lt;value&gt;
1753 # Cookie: CGIscriptorSESSION=&lt;value&gt;
1755 # The example implementation stores Session Tickets as files in a local
1756 # directory. To create Session Tickets, a Login request must be given
1757 # with a LOGIN=&lt;value&gt; CGI parameter, a user name and a (doubly hashed)
1758 # password. The user name and (singly hashed) password are stored in a
1759 # PASSWORD ticket with the same name as the user account (name cleaned up
1760 # for security).
1762 # The example session model implements 4 functions:
1763 # - Login
1764 # The password is hashed with the user name and server side salt, and then
1765 # hashed with a random salt. Client and Server both perform these actions
1766 # and the Server only grants access if restults are the same. The server
1767 # side only stores the password hashed with the user name and
1768 # server side salt. Neither the plain password, nor the hashed password is
1769 # ever exchanged. Only values hashed with the one-time salt are exchanged.
1770 # - Session
1771 # For every access to a restricted URL, the Session Ticket is checked before
1772 # access is granted. There are three session modes. The first uses a fixed
1773 # Session Ticket that is stored as a cookie value in the browser (actually,
1774 # as a sessionStorage value). The second uses only the IP address at login
1775 # to authenticate requests. The third
1776 # is a Challenge mode, where the client has to calculate the value of the
1777 # next one-time Session Ticket from a value derived from the password and
1778 # a random string.
1779 # - Password Change
1780 # A new password is hashed with the user name and server side salt, and
1781 # then encrypted (XORed)
1782 # with the old password hashed with the user name and salt. That value is
1783 # exchanged and XORed with the stored old hashed(salt+password+username).
1784 # Again, the stored password value is never exchanged unencrypted.
1785 # - New Account
1786 # The text of a new account (Type: PASSWORD) file is constructed from
1787 # the new username (CGI: NEWUSERNAME, converted to lowercase) and
1788 # hashed new password (CGI: NEWPASSWORD). The same process is used to encrypt
1789 # the new password as is used for the Password Change function.
1790 # Again, the stored password value is never exchanged unencrypted.
1791 # Some default setting are encoded. For display in the browser, the new password
1792 # is reencrypted (XORed) with a special key, the old password hash
1793 # hashed with a session specific random hex value sent initially with the
1794 # session login ticket ($RANDOMSALT).
1795 # For example for user "NewUser" and password "NewPassword" with filename
1796 # "newuser":
1798 # Type: PASSWORD
1799 # Username: newuser
1800 # Password: 84b26fd2aaacae1c2e42fe07da1793e8232ffe548eceb519b46646fe9ff32612
1801 # Salt: 970e68017413fb0ea84d7fe3c463077636dd6d53486910d4a53c693dd4109b1a
1802 # AllowedPaths: ^/Private/[\w\-]*\.html?
1803 # AllowedPaths: ^/Private/newuser/
1804 # Session: SESSION
1805 # Date: Thu Jun 14 12:34:40 2012 UTC
1806 # Time: 1339677280
1808 # The password is created with the Unix commands:
1809 # printf '%s' '970e68017413fb0ea84d7fe3c463077636dd6d53486910d4a53c693dd4109b1aNewPasswordnewuser'|shasum -a 256
1813 # Implementation
1815 # The session authentication mechanism is based on the exchange of ticket
1816 # identifiers. A ticket identifier is just a string of characters, a name
1817 # or a random 64 character hexadecimal string. Ticket identifiers should be
1818 # "safe" filenames (except user names). There are four types of tickets:
1819 # PASSWORD: User account descriptors, including a user name and password
1820 # LOGIN: Temporary anonymous tickets used during login
1821 # IPADDRESS: Authetication tokens that allow access based on the IP address of the request
1822 # SESSION: Reusable authetication tokens
1823 # CHALLENGE: One-time authetication tokens
1824 # All tickets can have an expiration date in the form of a time duration
1825 # from creation, in seconds, minutes, hours, or days (+duration[smhd]).
1826 # An absolute time can be given in seconds since the epoch of the server host.
1827 # Note that expiration times of CHALLENGE authetication tokens are calculated
1828 # from the last access time. Accounts can include a maximal lifetime
1829 # for session tickets (MaxLifetime).
1831 # A Login page should create a LOGIN ticket file locally and send a
1832 # server specific salt, a Random salt, and a LOGIN ticket
1833 # identifier. The server side compares the username and hashed password,
1834 # actually hashed(Random salt+hashed(serversalt+password)) from the client with
1835 # the values it calculates from the stored Random salt from the LOGIN
1836 # ticket and the hashed(serversalt+password) from the PASSWORD ticket. If
1837 # successful, a new SESSION ticket is generated as a hash sum of the LOGIN
1838 # ticket and the stored password. This SESSION ticket should also be
1839 # generated by the client and stored as sessionStorage and cookie values
1840 # as needed. The Username, IP address and Path are available as
1841 # $LoginUsername, $LoginIPaddress, and $LoginPath, respectively.
1843 # The CHALLENGE protocol stores the same value as the SESSION tickets.
1844 # However, this value is not exchanged, but kept secret in the JavaScript
1845 # sessionStorage object. Instead, every page returned from the
1846 # server will contain a one-time Challenge value ($CHALLENGETICKET) which
1847 # has to be hashed with the stored value to return the current ticket
1848 # id string.
1850 # In the current example implementation, all random values are created as
1851 # full, 256 bit SHA256 hash values (Hex strings) of 64 bytes read from
1852 # /dev/urandom.
1854 # Security considerations with Session tickets
1856 # For strong security, please use end-to-end encryption. This can be
1857 # achieved using a VPN (Virtual Private Network), SSH tunnel, or a HTTPS
1858 # capable server with OpenSSL. The session ticket system of CGIscriptor.pl
1859 # is intended to be used as a simple authentication mechanism WITHOUT
1860 # END-TO-END ENCRYPTION. The authenticating mechanism tries to use some
1861 # simple means to protect the authentication process from eavesdropping.
1862 # For this it uses a secure hash function, SHA256. For all practial purposes,
1863 # it is impossible to "decrypt" a SHA256 sum. But this login scheme is
1864 # only as secure as your browser. Which, in general, is not very secure.
1866 # Humans tend to reuse passwords. A compromise of a site running
1867 # CGIscriptor.pl could therefore lead to a compromise of user accounts at
1868 # other sites. Therefore, plain text passwords are never stored, used, or
1869 # exchanged. Instead, a server site salt value is "encrypted" with
1870 # the plain password and user name. Actually, all are concatenated and hashed
1871 # with a one-way secure hash function (SHA256) into a single string.
1872 # Whenever the word "password" is used, this hash sum is meant. Note that
1873 # the salts are generated from /dev/urandom. You should check whether the
1874 # implementation of /dev/urandom on your platform is secure before
1875 # relying on it. This might be a problem when running CGIscriptor under
1876 # Cygwin on MS Windows.
1877 # Note: no attempt is made to slow down the password hash, so bad
1878 # passwords can be cracked by brute force
1880 # For the authentication and a change of password, the (old) password
1881 # is used to "encrypt" a random one-time token or the new password,
1882 # respectively. For authentication, decryption is not needed, so a secure
1883 # hash function (SHA256) is used to create a one-way hash sum "encryption".
1884 # A new password must be decrypted. New passwords are encryped by XORing
1885 # them with the old password.
1887 # Strong Passwords: It is so easy
1888 # If you only could see what you are typing
1890 # Your password might be vulnerable to brute force guessing
1891 # (https://en.wikipedia.org/wiki/Brute_force_attack).
1892 # Protections against such attacks are costly in terms of code
1893 # complexity, bugs, and execution time. However, there is a very
1894 # simple and secure counter measure. See the XKCD comic
1895 # (http://xkcd.com/936/). The phrase, "There is no password like more
1896 # password" would be both much easier to remember, and still stronger
1897 # than "h4]D%@m:49", at least before this phrase was pasted as an
1898 # example on the Internet.
1900 # For the procedures used at this site, a basic computer setup can
1901 # check in the order of a billion passwords per second. You need a
1902 # password (or phrase) strength in the order of 56 bits to be a
1903 # little secure (one year on a single computer). Please be so kind
1904 # and add the name of your favorite flower, dish, fictional
1905 # character, or small town to your password. Say, Oleander, Curry,
1906 # Sherlock, or Bath (each adds ~12 bits) or even the phrase "Sherlock
1907 # investigates oleander curry in Bath" (adds > 56 bits, note that
1908 # oleander is poisonous, so do not try this curry at home). That
1909 # would be more effective than adding a thousand rounds of encryption.
1910 # Typing long passwords without seeing what you are typing is
1911 # problematic. So a button should be included to make password
1912 # visible.
1915 # USER EXTENSIONS
1917 # A CGIscriptor package is attached to the bottom of this file. With
1918 # this package you can personalize your version of CGIscriptor by
1919 # including often used perl routines. These subroutines can be
1920 # accessed by prefixing their names with CGIscriptor::, e.g.,
1921 # <SCRIPT LANGUAGE=PERL TYPE=text/ssperl>
1922 # CGIscriptor::ListDocs("/Books/*") # List all documents in /Books
1923 # </SCRIPT>
1924 # It already contains some useful subroutines for Document Management.
1925 # As it is a separate package, it has its own namespace, isolated from
1926 # both the evaluator and the main program. To access variables from
1927 # the document <SCRIPT></SCRIPT> blocks, use $CGIexecute::<var>.
1929 # Currently, the following functions are implemented
1930 # (precede them with CGIscriptor::, see below for more information)
1931 # - SAFEqx ('String') -> result of qx/"String"/ # Safe application of ``-quotes
1932 # Is used by text/osshell Shell scripts. Protects all CGI
1933 # (client-supplied) values with single quotes before executing the
1934 # commands (one of the few functions that also works WITHOUT CGIscriptor::
1935 # in front)
1936 # - defineCGIvariable ($name[, $default) -> 0/1 (i.e., failure/success)
1937 # Is used by the META tag to define and initialize CGI and ENV
1938 # name/value pairs. Tries to obtain an initializing value from (in order):
1939 # $ENV{$name}
1940 # The Query string
1941 # The default value given (if any)
1942 # (one of the few functions that also works WITHOUT CGIscriptor::
1943 # in front)
1944 # - CGIsafeFileName (FileName) -> FileName or ""
1945 # Check a string against the Allowed File Characters (and ../ /..).
1946 # Returns an empty string for unsafe filenames.
1947 # - CGIsafeEmailAddress (Email) -> Email or ""
1948 # Check a string against correct email address pattern.
1949 # Returns an empty string for unsafe addresses.
1950 # - RedirectShellScript ('CommandString') -> FILEHANDLER or undef
1951 # Open a named PIPE for SAFEqx to receive ALL shell scripts
1952 # - URLdecode (URL encoded string) -> plain string # Decode URL encoded argument
1953 # - URLencode (plain string) -> URL encoded string # Encode argument as URL code
1954 # - CGIparseValue (ValueName [, URL_encoded_QueryString]) -> Decoded value
1955 # Extract the value of a CGI variable from the global or a private
1956 # URL-encoded query (multipart POST raw, NOT decoded)
1957 # - CGIparseValueList (ValueName [, URL_encoded_QueryString])
1958 # -> List of decoded values
1959 # As CGIparseValue, but now assembles ALL values of ValueName into a list.
1960 # - CGIparseHeader (ValueName [, URL_encoded_QueryString]) -> Header
1961 # Extract the header of a multipart CGI variable from the global or a private
1962 # URL-encoded query ("" when not a multipart variable or absent)
1963 # - CGIparseForm ([URL_encoded_QueryString]) -> Decoded Form
1964 # Decode the complete global URL-encoded query or a private
1965 # URL-encoded query
1966 # - read_url(URL) # Returns the page from URL (with added base tag, both FTP and HTTP)
1967 # Uses main::GET_URL(URL, 1) to get at the command to read the URL.
1968 # - BrowseDirs(RootDirectory [, Pattern, Startdir, CGIname]) # print browsable directories
1969 # - ListDocs(Pattern [,ListType]) # Prints a nested HTML directory listing of
1970 # all documents, e.g., ListDocs("/*", "dl");.
1971 # - HTMLdocTree(Pattern [,ListType]) # Prints a nested HTML listing of all
1972 # local links starting from a given document, e.g.,
1973 # HTMLdocTree("/Welcome.html", "dl");
1976 # THE RESULTS STACK: @CGISCRIPTORRESULTS
1978 # If the pseudo-variable "$CGIscriptorResults" has been defined in a
1979 # META tag, all subsequent SCRIPT and META results are pushed
1980 # on the @CGIscriptorResults stack. This list is just another
1981 # Perl variable and can be used and manipulated like any other list.
1982 # $CGIscriptorResults[-1] is always the last result.
1983 # This is only of limited use, e.g., to use the results of an OS shell
1984 # script inside a Perl script. Will NOT contain the results of Pipes
1985 # or code from MIME-profiling.
1988 # USEFULL CGI PREDEFINED VARIABLES (DO NOT ASSIGN TO THESE)
1990 # $CGI_HOME - The DocumentRoot directory
1991 # $CGI_Decoded_QS - The complete decoded Query String
1992 # $CGI_Content_Length - The ACTUAL length of the Query String
1993 # $CGI_Date - Current date and time
1994 # $CGI_Year $CGI_Month $CGI_Day $CGI_WeekDay - Current Date
1995 # $CGI_Time - Current Time
1996 # $CGI_Hour $CGI_Minutes $CGI_Seconds - Current Time, split
1997 # GMT Date/Time:
1998 # $CGI_GMTYear $CGI_GMTMonth $CGI_GMTDay $CGI_GMTWeekDay $CGI_GMTYearDay
1999 # $CGI_GMTHour $CGI_GMTMinutes $CGI_GMTSeconds $CGI_GMTisdst
2002 # USEFULL CGI ENVIRONMENT VARIABLES
2004 # Variables accessible (in APACHE) as $ENV{<name>}
2005 # (see: "http://hoohoo.ncsa.uiuc.edu/cgi/env.html"):
2007 # QUERY_STRING - The query part of URL, that is, everything that follows the
2008 # question mark.
2009 # PATH_INFO - Extra path information given after the script name
2010 # PATH_TRANSLATED - Extra pathinfo translated through the rule system.
2011 # (This doesn't always make sense.)
2012 # REMOTE_USER - If the server supports user authentication, and the script is
2013 # protected, this is the username they have authenticated as.
2014 # REMOTE_HOST - The hostname making the request. If the server does not have
2015 # this information, it should set REMOTE_ADDR and leave this unset
2016 # REMOTE_ADDR - The IP address of the remote host making the request.
2017 # REMOTE_IDENT - If the HTTP server supports RFC 931 identification, then this
2018 # variable will be set to the remote user name retrieved from
2019 # the server. Usage of this variable should be limited to logging
2020 # only.
2021 # AUTH_TYPE - If the server supports user authentication, and the script
2022 # is protected, this is the protocol-specific authentication
2023 # method used to validate the user.
2024 # CONTENT_TYPE - For queries which have attached information, such as HTTP
2025 # POST and PUT, this is the content type of the data.
2026 # CONTENT_LENGTH - The length of the said content as given by the client.
2027 # SERVER_SOFTWARE - The name and version of the information server software
2028 # answering the request (and running the gateway).
2029 # Format: name/version
2030 # SERVER_NAME - The server's hostname, DNS alias, or IP address as it
2031 # would appear in self-referencing URLs
2032 # GATEWAY_INTERFACE - The revision of the CGI specification to which this
2033 # server complies. Format: CGI/revision
2034 # SERVER_PROTOCOL - The name and revision of the information protocol this
2035 # request came in with. Format: protocol/revision
2036 # SERVER_PORT - The port number to which the request was sent.
2037 # REQUEST_METHOD - The method with which the request was made. For HTTP,
2038 # this is "GET", "HEAD", "POST", etc.
2039 # SCRIPT_NAME - A virtual path to the script being executed, used for
2040 # self-referencing URLs.
2041 # HTTP_ACCEPT - The MIME types which the client will accept, as given by
2042 # HTTP headers. Other protocols may need to get this
2043 # information from elsewhere. Each item in this list should
2044 # be separated by commas as per the HTTP spec.
2045 # Format: type/subtype, type/subtype
2046 # HTTP_USER_AGENT - The browser the client is using to send the request.
2047 # General format: software/version library/version.
2050 # INSTRUCTIONS FOR RUNNING CGIscriptor ON UNIX
2052 # CGIscriptor.pl will run on any WWW server that runs Perl scripts, just add
2053 # a line like the following to your srm.conf file (Apache example):
2055 # ScriptAlias /SHTML/ /real-path/CGIscriptor.pl/
2057 # URL's that refer to http://www.your.address/SHTML/... will now be handled
2058 # by CGIscriptor.pl, which can use a private directory tree (default is the
2059 # DOCUMENT_ROOT directory tree, but it can be anywhere, see manual).
2061 # If your hosting ISP won't let you add ScriptAlias lines you can use
2062 # the following "rewrite"-based "scriptalias" in .htaccess
2063 # (from Gerd Franke)
2065 # RewriteEngine On
2066 # RewriteBase /
2067 # RewriteCond %{REQUEST_FILENAME} .html$
2068 # RewriteCond %{SCRIPT_FILENAME} !cgiscriptor.pl$
2069 # RewriteCond %{REQUEST_FILENAME} -f
2070 # RewriteRule ^(.*)$ /cgi-bin/cgiscriptor.pl/$1?&%{QUERY_STRING}
2072 # Everthing with the extension ".html" and not including "cgiscriptor.pl"
2073 # in the url and where the file "path/filename.html" exists is redirected
2074 # to "/cgi.bin/cgiscriptor.pl/path/filename.html?query".
2075 # The user configuration should get the same path-level as the
2076 # .htaccess-file:
2078 # # Just enter your own directory path here
2079 # $YOUR_HTML_FILES = "$ENV{'DOCUMENT_ROOT'}";
2080 # # use DOCUMENT_ROOT only, if .htaccess lies in the root-directory.
2082 # If this .htaccess goes in a specific directory, the path to this
2083 # directory must be added to $ENV{'DOCUMENT_ROOT'}.
2085 # The CGIscriptor file contains all documentation as comments. These
2086 # comments can be removed to speed up loading (e.g., `egrep -v '^#'
2087 # CGIscriptor.pl` > leanScriptor.pl). A bare bones version of
2088 # CGIscriptor.pl, lacking documentation, most comments, access control,
2089 # example functions etc. (but still with the copyright notice and some
2090 # minimal documentation) can be obtained by calling CGIscriptor.pl on the
2091 # command line with the '-slim' command line argument, e.g.,
2093 # >CGIscriptor.pl -slim > slimCGIscriptor.pl
2095 # CGIscriptor.pl can be run from the command line with <path> and <query> as
2096 # arguments, as `CGIscriptor.pl <path> <query>`, inside a perl script
2097 # with 'do CGIscriptor.pl' after setting $ENV{PATH_INFO}
2098 # and $ENV{QUERY_STRING}, or CGIscriptor.pl can be loaded with 'require
2099 # "/real-path/CGIscriptor.pl"'. In the latter case, requests are processed
2100 # by 'Handle_Request();' (again after setting $ENV{PATH_INFO} and
2101 # $ENV{QUERY_STRING}).
2103 # Using the command line execution option, CGIscriptor.pl can be used as a
2104 # document (meta-)preprocessor. If the first argument is '-', STDIN will be read.
2105 # For example:
2107 # > cat MyDynamicDocument.html | CGIscriptor.pl - '[QueryString]' > MyStaticFile.html
2109 # This command line will produce a STATIC file with the DYNAMIC content of
2110 # MyDocument.html "interpolated".
2112 # This option would be very dangerous when available over the internet.
2113 # If someone could sneak a 'http://www.your.domain/-' URL past your
2114 # server, CGIscriptor could EXECUTE any POSTED contend.
2115 # Therefore, for security reasons, STDIN will NOT be read
2116 # if ANY of the HTTP server environment variables is set (e.g.,
2117 # SERVER_PORT, SERVER_PROTOCOL, SERVER_NAME, SERVER_SOFTWARE,
2118 # HTTP_USER_AGENT, REMOTE_ADDR).
2119 # This block on processing STDIN on HTTP requests can be lifted by setting
2120 # $BLOCK_STDIN_HTTP_REQUEST = 0;
2121 # In the security configuration. Butbe carefull when doing this.
2122 # It can be very dangerous.
2124 # Running demo's and more information can be found at
2125 # http://www.fon.hum.uva.nl/~rob/OSS/OSS.html
2127 # A pocket-size HTTP daemon, CGIservlet.pl, is available from my web site or
2128 # CPAN that can use CGIscriptor.pl as the base of a µWWW server and
2129 # demonstrates its use.
2132 # PROCESSING NON-FILESYSTEM DATA
2134 # Normally, HTTP (WWW) requests map onto file that can be accessed
2135 # using the perl open() function. That is, the web server runs on top of
2136 # some directory structure. However, we can envission (and put to good
2137 # use) other systems that do not use a normal file system. The whole CGI
2138 # was developed to make dynamic document generation possible.
2140 # A special case is where we want to have it both: A normal web server
2141 # with normal "file data", but not a normal files system. For instance,
2142 # we want or normal Web Site to run directly from a RAM hash table or
2143 # other database, instead of from disk. But we do NOT want to code the
2144 # whole site structure in CGI.
2146 # CGIscriptor can do this. If the web server fills an environment variable
2147 # $ENV{'CGI_FILE_CONTENT'} with the content of the "file", then the content
2148 # of this variable is processed instead of opening a file. If this environment
2149 # variable has the value '-', the content of another environment variable,
2150 # $ENV{'CGI_DATA_ACCESS_CODE'} is executed as:
2151 # eval("\@_ = ($file_path); do {$ENV{'CGI_DATA_ACCESS_CODE'}};")
2152 # and the result is processed as if it was the content of the requested
2153 # file.
2154 # (actually, the names of the environment variables are user configurable,
2155 # they are stored in the local variables $CGI_FILE_CONTENT and
2156 # $CGI_DATA_ACCESS_CODE)
2158 # When using this mechanism, the SRC attribute mechanism will only partially work.
2159 # Only the "recursive" calls to CGIscriptor (the ProcessFile() function)
2160 # will work, the automagical execution of SRC files won't. (In this case,
2161 # the SRC attribute won't work either for other scripting languages)
2164 # NON-UNIX PLATFORMS
2166 # CGIscriptor.pl was mainly developed and tested on UNIX. However, as I
2167 # coded part of the time on an Apple Macintosh under MacPerl, I made sure
2168 # CGIscriptor did run under MacPerl (with command line options). But only
2169 # as an independend script, not as part of a HTTP server. I have used it
2170 # under Apache in Windows XP.
2172 ENDOFHELPTEXT
2173 exit;
2175 ###############################################################################
2177 # SECURITY CONFIGURATION
2179 # Special configurations related to SECURITY
2180 # (i.e., optional, see also environment variables below)
2182 # LOGGING
2183 # Log Clients and the requested paths (Redundant when loging Queries)
2185 $ClientLog = "./Client.log"; # (uncomment for use)
2187 # Format: Localtime | REMOTE_USER REMOTE_IDENT REMOTE_HOST REMOTE_ADDRESS \
2188 # PATH_INFO CONTENT_LENGTH (actually, the real query+post length)
2190 # Log Clients and the queries, the CGIQUERYDECODE is required if you want
2191 # to log queries. If you log Queries, the loging of Clients is redundant
2192 # (note that queries can be quite long, so this might not be a good idea)
2194 #$QueryLog = "./Query.log"; # (uncomment for use)
2196 # ACCESS CONTROL
2197 # the Access files should contain Hostnames or IP addresses,
2198 # i.e. REMOTE_HOST or REMOTE_ADDR, each on a separate line
2199 # optionally followed by one ore more file patterns, e.g., "edu /DEMO".
2200 # Matching is done "domain first". For example ".edu" matches all
2201 # clients whose "name" ends in ".edu" or ".EDU". The file pattern
2202 # "/DEMO" matches all paths that contain the strings "/DEMO" or "/demo"
2203 # (both matchings are done case-insensitive).
2204 # The name special symbol "-" matches ALL clients who do not supply a
2205 # REMOTE_HOST name, "*" matches all clients.
2206 # Lines starting with '-e' are evaluated. A non-zero return value indicates
2207 # a match. You can use $REMOTE_HOST, $REMOTE_ADDR, and $PATH_INFO. These
2208 # lines are evaluated in the program's own name-space. So DO NOT assign to
2209 # variables.
2211 # Accept the following users (remove comment # and adapt filename)
2212 $CGI_Accept = -s "$YOUR_SCRIPTS/ACCEPT.lis" ? "$YOUR_SCRIPTS/ACCEPT.lis" : ''; # (uncomment for use)
2214 # Reject requests from the following users (remove comment # and
2215 # adapt filename, this is only of limited use)
2216 $CGI_Reject = -s "$YOUR_SCRIPTS/REJECT.lis" ? "$YOUR_SCRIPTS/REJECT.lis" : ''; # (uncomment for use)
2218 # Empty lines or comment lines starting with '#' are ignored in both
2219 # $CGI_Accept and $CGI_Reject.
2221 # Block STDIN (i.e., '-') requests when servicing an HTTP request
2222 # Comment this out if you realy want to use STDIN in an on-line web server
2223 $BLOCK_STDIN_HTTP_REQUEST = 1;
2226 # End of security configuration
2228 ##################################################<<<<<<<<<<End Remove
2230 # PARSING CGI VALUES FROM THE QUERY STRING (USER CONFIGURABLE)
2232 # The CGI parse commands. These commands extract the values of the
2233 # CGI variables from the URL encoded Query String.
2234 # If you want to use your own CGI decoders, you can call them here
2235 # instead, using your own PATH and commenting/uncommenting the
2236 # appropriate lines
2238 # CGI parse command for individual values
2239 # (if $List > 0, returns a list value, if $List < 0, a hash table, this is optional)
2240 sub YOUR_CGIPARSE # ($Name [, $List]) -> Decoded value
2242 my $Name = shift;
2243 my $List = shift || 0;
2244 # Use one of the following by uncommenting
2245 if(!$List) # Simple value
2247 return CGIscriptor::CGIparseValue($Name) ;
2249 elsif($List < 0) # Hash tables
2251 return CGIscriptor::CGIparseValueHash($Name); # Defined in CGIscriptor below
2253 else # Lists
2255 return CGIscriptor::CGIparseValueList($Name); # Defined in CGIscriptor below
2258 # return `/PATH/cgiparse -value $Name`; # Shell commands
2259 # require "/PATH/cgiparse.pl"; return cgivalue($Name); # Library
2261 # Complete queries
2262 sub YOUR_CGIQUERYDECODE
2264 # Use one of the following by uncommenting
2265 return CGIscriptor::CGIparseForm(); # Defined in CGIscriptor below
2266 # return `/PATH/cgiparse -form`; # Shell commands
2267 # require "/PATH/cgiparse.pl"; return cgiform(); # Library
2270 # End of configuration
2272 #######################################################################
2274 # Translating input files.
2275 # Allows general and global conversions of files using Regular Expressions
2276 # Translations are applied in the order of definition.
2278 # Define:
2279 # my $TranslationPaths = 'pattern'; # Pattern matching PATH_INFO
2281 # push(@TranslationTable, ['pattern', 'replacement']);
2282 # e.g. (for Ruby Rails):
2283 # push(@TranslationTable, ['<%=', '<SCRIPT TYPE="text/ssruby">']);
2284 # push(@TranslationTable, ['%>', '</SCRIPT>']);
2286 # Runs:
2287 # my $currentRegExp;
2288 # foreach $currentRegExp (keys(%TranslationTable))
2290 # my $currentRegExp;
2291 # foreach $currentRegExp (@TranslationTable)
2293 # my ($pattern, $replacement) = @$currentRegExp;
2294 # $$text =~ s!$pattern!$replacement!msg;
2295 # };
2296 # };
2298 # Configuration section
2300 #######################################################################
2302 # The file paths on which to apply the translation
2303 my $TranslationPaths = ''; # NO files
2304 #$TranslationPaths = '.'; # ANY file
2305 # $TranslationPaths = '\.html'; # HTML files
2307 my @TranslationTable = ();
2308 # Some legacy code
2309 push(@TranslationTable, ['\<\s*CGI\s+([^\>])*\>', '\<SCRIPT TYPE=\"text/ssperl\"\>$1\<\/SCRIPT>']);
2310 # Ruby Rails?
2311 push(@TranslationTable, ['<%=', '<SCRIPT TYPE="text/ssruby">']);
2312 push(@TranslationTable, ['%>', '</SCRIPT>']);
2314 sub performTranslation # (\$text)
2316 my $text = shift || return;
2317 if(@TranslationTable && $TranslationPaths && $ENV{'PATH_INFO'} =~ m!$TranslationPaths!)
2319 my $currentRegExp;
2320 foreach $currentRegExp (@TranslationTable)
2322 my ($pattern, $replacement) = @$currentRegExp;
2323 $$text =~ s!$pattern!$replacement!msg;
2328 #######################################################################
2330 # Seamless access to other (Scripting) Languages
2331 # TYPE='text/ss<interpreter>'
2333 # Configuration section
2335 #######################################################################
2337 # OTHER SCRIPTING LANGUAGES AT THE SERVER SIDE (MIME => OScommand)
2338 # Yes, it realy is this simple! (unbelievable, isn't it)
2339 # NOTE: Some interpreters require some filtering to obtain "clean" output
2341 %ScriptingLanguages = (
2342 "text/testperl" => 'perl', # Perl for testing
2343 "text/sspython" => 'python', # Python
2344 "text/ssruby" => 'ruby', # Ruby
2345 "text/sstcl" => 'tcl', # TCL
2346 "text/ssawk" => 'awk -f-', # Awk
2347 "text/sslisp" => # lisp (rep, GNU)
2348 'rep | tail +4 '."| egrep -v '> |^rep. |^nil\\\$'",
2349 "text/xlispstat" => # xlispstat
2350 'xlispstat | tail +7 ' ."| egrep -v '> \\\$|^NIL'",
2351 "text/ssprolog" => # Prolog (GNU)
2352 "gprolog | tail +4 | sed 's/^| ?- //'",
2353 "text/ssm4" => 'm4', # M4 macro's
2354 "text/sh" => 'sh', # Born shell
2355 "text/bash" => 'bash', # Born again shell
2356 "text/csh" => 'csh', # C shell
2357 "text/ksh" => 'ksh', # Korn shell
2358 "text/sspraat" => # Praat (sound/speech analysis)
2359 "praat - | sed 's/Praat > //g'",
2360 "text/ssr" => # R
2361 "R --vanilla --slave | sed 's/^[\[0-9\]*] //'",
2362 "text/ssrebol" => # REBOL
2363 "rebol --quiet|egrep -v '^[> ]* == '|sed 's/^\\s*\[> \]* //'",
2364 "text/postgresql" => 'psql 2>/dev/null',
2366 # Not real scripting, but the use of other applications
2367 "text/ssmailto" => "awk 'NF||F{F=1;print \\\$0;}'|mailto >/dev/null", # Send mail from server
2368 "text/ssdisplay" => 'cat', # Display, (interpolation)
2369 "text/sslogfile" => # Log to file, (interpolation)
2370 "awk 'NF||L {if(!L){L=tolower(\\\$1)~/^file:\\\$/ ? \\\$2 : \\\$1;}else{print \\\$0 >> L;};}'",
2372 "" => ""
2375 # To be able to access the CGI variables in your script, they
2376 # should be passed to the scripting language in a readable form
2377 # Here you can enter how they should be printed (the first %s
2378 # is replaced by the NAME of the CGI variable as it apears in the
2379 # META tag, the second by its VALUE).
2380 # For Perl this would be:
2381 # "text/testperl" => '$%s = "%s";',
2382 # which would be executed as
2383 # printf('$%s = "%s";', $CGI_NAME, $CGI_VALUE);
2385 # If the hash table value doesn't exist, nothing is done
2386 # (you have to parse the Environment variables yourself).
2387 # If it DOES exist but is empty (e.g., "text/sspraat" => '',)
2388 # Perl string interpolation of variables (i.e., $var, @array,
2389 # %hash) is performed. This means that $@%\ must be protected
2390 # with a \.
2392 %ScriptingCGIvariables = (
2393 "text/testperl" => "\$\%s = '\%s';", # Perl $VAR = 'value'; (for testing)
2394 "text/sspython" => "\%s = '\%s'", # Python VAR = 'value'
2395 "text/ssruby" => '@%s = "%s"', # Ruby @VAR = 'value'
2396 "text/sstcl" => 'set %s "%s"', # TCL set VAR "value"
2397 "text/ssawk" => '%s = "%s";', # Awk VAR = 'value';
2398 "text/sslisp" => '(setq %s "%s")', # Gnu lisp (rep) (setq VAR "value")
2399 "text/xlispstat" => '(setq %s "%s")', # xlispstat (setq VAR "value")
2400 "text/ssprolog" => '', # Gnu prolog (interpolated)
2401 "text/ssm4" => "define(`\%s', `\%s')", # M4 macro's define(`VAR', `value')
2402 "text/sh" => "\%s='\%s'", # Born shell VAR='value'
2403 "text/bash" => "\%s='\%s'", # Born again shell VAR='value'
2404 "text/csh" => "\$\%s='\%s';", # C shell $VAR = 'value';
2405 "text/ksh" => "\$\%s='\%s';", # Korn shell $VAR = 'value';
2407 "text/ssrebol" => '%s: copy "%s"', # REBOL VAR: copy "value"
2408 "text/sspraat" => '', # Praat (interpolation)
2409 "text/ssr" => '%s <- "%s";', # R VAR <- "value";
2410 "text/postgresql" => '', # PostgreSQL (interpolation)
2412 # Not real scripting, but the use of other applications
2413 "text/ssmailto" => '', # MAILTO, (interpolation)
2414 "text/ssdisplay" => '', # Display, (interpolation)
2415 "text/sslogfile" => '', # Log to file, (interpolation)
2417 "" => ""
2420 # If you want something added in front or at the back of each script
2421 # block as send to the interpreter add it here.
2422 # mime => "string", e.g., "text/sspython" => "python commands"
2423 %ScriptingPrefix = (
2424 "text/testperl" => "\# Prefix Code;", # Perl script testing
2425 "text/ssm4" => 'divert(0)', # M4 macro's (open STDOUT)
2427 "" => ""
2429 # If you want something added at the end of each script block
2430 %ScriptingPostfix = (
2431 "text/testperl" => "\# Postfix Code;", # Perl script testing
2432 "text/ssm4" => 'divert(-1)', # M4 macro's (block STDOUT)
2434 "" => ""
2436 # If you need initialization code, directly after opening
2437 %ScriptingInitialization = (
2438 "text/testperl" => "\# Initialization Code;", # Perl script testing
2439 "text/ssawk" => 'BEGIN {', # Server Side awk scripts (VAR = "value")
2440 "text/sslisp" => '(prog1 nil ', # Lisp (rep)
2441 "text/xlispstat" => '(prog1 nil ', # xlispstat
2442 "text/ssm4" => 'divert(-1)', # M4 macro's (block STDOUT)
2444 "" => ""
2446 # If you need cleanup code before closing
2447 %ScriptingCleanup = (
2448 "text/testperl" => "\# Cleanup Code;", # Perl script testing
2449 "text/sspraat" => 'Quit',
2450 "text/ssawk" => '};', # Server Side awk scripts (VAR = "value")
2451 "text/sslisp" => '(princ "\n" standard-output)).', # Closing print to rep
2452 "text/xlispstat" => '(print ""))', # Closing print to xlispstat
2453 "text/postgresql" => '\q', # quit psql
2454 "text/ssdisplay" => "", # close cat
2456 "" => ""
2459 # End of configuration for foreign scripting languages
2461 ###############################################################################
2463 # Initialization Code
2466 sub Initialize_Request
2468 ###############################################################################
2470 # ENVIRONMENT VARIABLES
2472 # Use environment variables to configure CGIscriptor on a temporary basis.
2473 # If you define any of the configurable variables as environment variables,
2474 # these are used instead of the "hard coded" values above.
2476 $SS_PUB = $ENV{'SS_PUB'} || $YOUR_HTML_FILES;
2477 $SS_SCRIPT = $ENV{'SS_SCRIPT'} || $YOUR_SCRIPTS;
2480 # Substitution strings, these are used internally to handle the
2481 # directory separator strings, e.g., '~/' -> 'SS_PUB:' (Mac)
2482 $HOME_SUB = $SS_PUB;
2483 $SCRIPT_SUB = $SS_SCRIPT;
2486 # Make sure all script are reliably loaded
2487 push(@INC, $SS_SCRIPT);
2490 # Add the directory separator to the "home" directories.
2491 # (This is required for ~/ and ./ substitution)
2492 $HOME_SUB .= '/' if $HOME_SUB;
2493 $SCRIPT_SUB .= '/' if $SCRIPT_SUB;
2495 $CGI_HOME = $ENV{'DOCUMENT_ROOT'};
2496 $ENV{'PATH_TRANSLATED'} =~ /$ENV{'PATH_INFO'}/is;
2497 $CGI_HOME = $` unless $ENV{'DOCUMENT_ROOT'}; # Get the DOCUMENT_ROOT directory
2498 $default_values{'CGI_HOME'} = $CGI_HOME;
2499 $ENV{'HOME'} = $CGI_HOME;
2500 # Set SS_PUB and SS_SCRIPT as Environment variables (make them available
2501 # to the scripts)
2502 $ENV{'SS_PUB'} = $SS_PUB unless $ENV{'SS_PUB'};
2503 $ENV{'SS_SCRIPT'} = $SS_SCRIPT unless $ENV{'SS_SCRIPT'};
2505 $FilePattern = $ENV{'FilePattern'} || $FilePattern;
2506 $MaximumQuerySize = $ENV{'MaximumQuerySize'} || $MaximumQuerySize;
2507 $ClientLog = $ENV{'ClientLog'} || $ClientLog;
2508 $QueryLog = $ENV{'QueryLog'} || $QueryLog;
2509 $CGI_Accept = $ENV{'CGI_Accept'} || $CGI_Accept;
2510 $CGI_Reject = $ENV{'CGI_Reject'} || $CGI_Reject;
2512 # Parse file names
2513 $CGI_Accept =~ s@^\~/@$HOME_SUB@g if $CGI_Accept;
2514 $CGI_Reject =~ s@^\~/@$HOME_SUB@g if $CGI_Reject;
2515 $ClientLog =~ s@^\~/@$HOME_SUB@g if $ClientLog;
2516 $QueryLog =~ s@^\~/@$HOME_SUB@g if $QueryLog;
2518 $CGI_Accept =~ s@^\./@$SCRIPT_SUB@g if $CGI_Accept;
2519 $CGI_Reject =~ s@^\./@$SCRIPT_SUB@g if $CGI_Reject;
2520 $ClientLog =~ s@^\./@$SCRIPT_SUB@g if $ClientLog;
2521 $QueryLog =~ s@^\./@$SCRIPT_SUB@g if $QueryLog;
2523 @CGIscriptorResults = (); # A stack of results
2525 # end of Environment variables
2527 #############################################################################
2529 # Define and Store "standard" values
2531 # BEFORE doing ANYTHING check the size of Query String
2532 length($ENV{'QUERY_STRING'}) <= $MaximumQuerySize || dieHandler(2, "QUERY TOO LONG\n");
2534 # The Translated Query String and the Actual length of the (decoded)
2535 # Query String
2536 if($ENV{'QUERY_STRING'})
2538 # If this can contain '`"-quotes, be carefull to use it QUOTED
2539 $default_values{CGI_Decoded_QS} = YOUR_CGIQUERYDECODE();
2540 $default_values{CGI_Content_Length} = length($default_values{CGI_Decoded_QS});
2543 # Get the current Date and time and store them as default variables
2545 # Get Local Time
2546 $LocalTime = localtime;
2548 # CGI_Year CGI_Month CGI_Day CGI_WeekDay CGI_Time
2549 # CGI_Hour CGI_Minutes CGI_Seconds
2551 $default_values{CGI_Date} = $LocalTime;
2552 ($default_values{CGI_WeekDay},
2553 $default_values{CGI_Month},
2554 $default_values{CGI_Day},
2555 $default_values{CGI_Time},
2556 $default_values{CGI_Year}) = split(' ', $LocalTime);
2557 ($default_values{CGI_Hour},
2558 $default_values{CGI_Minutes},
2559 $default_values{CGI_Seconds}) = split(':', $default_values{CGI_Time});
2561 # GMT:
2562 # CGI_GMTYear CGI_GMTMonth CGI_GMTDay CGI_GMTWeekDay CGI_GMTYearDay
2563 # CGI_GMTHour CGI_GMTMinutes CGI_GMTSeconds CGI_GMTisdst
2565 ($default_values{CGI_GMTSeconds},
2566 $default_values{CGI_GMTMinutes},
2567 $default_values{CGI_GMTHour},
2568 $default_values{CGI_GMTDay},
2569 $default_values{CGI_GMTMonth},
2570 $default_values{CGI_GMTYear},
2571 $default_values{CGI_GMTWeekDay},
2572 $default_values{CGI_GMTYearDay},
2573 $default_values{CGI_GMTisdst}) = gmtime;
2577 # End of Initialize Request
2579 ###################################################################
2581 # SECURITY: ACCESS CONTROL
2583 # Check the credentials of each client (use pattern matching, domain first).
2584 # This subroutine will kill-off (die) the current process whenever access
2585 # is denied.
2587 sub Access_Control
2589 # >>>>>>>>>>Start Remove
2591 # ACCEPTED CLIENTS
2593 # Only accept clients which are authorized, reject all unnamed clients
2594 # if REMOTE_HOST is given.
2595 # If file patterns are given, check whether the user is authorized for
2596 # THIS file.
2597 if($CGI_Accept)
2599 # Use local variables, REMOTE_HOST becomes '-' if undefined
2600 my $REMOTE_HOST = $ENV{REMOTE_HOST} || '-';
2601 my $REMOTE_ADDR = $ENV{REMOTE_ADDR};
2602 my $PATH_INFO = $ENV{'PATH_INFO'};
2604 open(CGI_Accept, "<$CGI_Accept") || dieHandler(3, "$CGI_Accept: $!\n");
2605 $NoAccess = 1;
2606 while(<CGI_Accept>)
2608 next unless /\S/; # Skip empty lines
2609 next if /^\s*\#/; # Skip comments
2611 # Full expressions
2612 if(/^\s*-e\s/is)
2614 my $Accept = $'; # Get the expression
2615 $NoAccess &&= eval($Accept); # evaluate the expresion
2617 else
2619 my ($Accept, @FilePatternList) = split;
2620 if($Accept eq '*' # Always match
2621 ||$REMOTE_HOST =~ /\Q$Accept\E$/is # REMOTE_HOST matches
2622 || (
2623 $Accept =~ /^[0-9\.]+$/
2624 && $REMOTE_ADDR =~ /^\Q$Accept\E/ # IP address matches
2628 if($FilePatternList[0])
2630 foreach $Pattern (@FilePatternList)
2632 # Check whether this patterns is accepted
2633 $NoAccess &&= ($PATH_INFO !~ m@\Q$Pattern\E@is);
2636 else
2638 $NoAccess = 0; # No file patterns -> Accepted
2642 # Blocked
2643 last unless $NoAccess;
2645 close(CGI_Accept);
2646 if($NoAccess){ dieHandler(4, "No Access: $PATH_INFO\n");};
2650 # REJECTED CLIENTS
2652 # Reject named clients, accept all unnamed clients
2653 if($CGI_Reject)
2655 # Use local variables, REMOTE_HOST becomes '-' if undefined
2656 my $REMOTE_HOST = $ENV{'REMOTE_HOST'} || '-';
2657 my $REMOTE_ADDR = $ENV{'REMOTE_ADDR'};
2658 my $PATH_INFO = $ENV{'PATH_INFO'};
2660 open(CGI_Reject, "<$CGI_Reject") || dieHandler(5, "$CGI_Reject: $!\n");
2661 $NoAccess = 0;
2662 while(<CGI_Reject>)
2664 next unless /\S/; # Skip empty lines
2665 next if /^\s*\#/; # Skip comments
2667 # Full expressions
2668 if(/^-e\s/is)
2670 my $Reject = $'; # Get the expression
2671 $NoAccess ||= eval($Reject); # evaluate the expresion
2673 else
2675 my ($Reject, @FilePatternList) = split;
2676 if($Reject eq '*' # Always match
2677 ||$REMOTE_HOST =~ /\Q$Reject\E$/is # REMOTE_HOST matches
2678 ||($Reject =~ /^[0-9\.]+$/
2679 && $REMOTE_ADDR =~ /^\Q$Reject\E/is # IP address matches
2683 if($FilePatternList[0])
2685 foreach $Pattern (@FilePatternList)
2687 $NoAccess ||= ($PATH_INFO =~ m@\Q$Pattern\E@is);
2690 else
2692 $NoAccess = 1; # No file patterns -> Rejected
2696 last if $NoAccess;
2698 close(CGI_Reject);
2699 if($NoAccess){ dieHandler(6, "Request rejected: $PATH_INFO\n");};
2702 ##########################################################<<<<<<<<<<End Remove
2705 # Get the filename
2707 # Does the filename contain any illegal characters (e.g., |, >, or <)
2708 dieHandler(7, "Illegal request: $ENV{'PATH_INFO'}\n") if $ENV{'PATH_INFO'} =~ /[^$FileAllowedChars]/;
2709 # Does the pathname contain an illegal (blocked) "directory"
2710 dieHandler(8, "Illegal request: $ENV{'PATH_INFO'}\n") if $BlockPathAccess && $ENV{'PATH_INFO'} =~ m@$BlockPathAccess@; # Access is blocked
2711 # Does the pathname contain a direct referencer to BinaryMapFile
2712 dieHandler(9, "Illegal request: $ENV{'PATH_INFO'}\n") if $BinaryMapFile && $ENV{'PATH_INFO'} =~ m@\Q$BinaryMapFile\E@; # Access is blocked
2714 # SECURITY: Is PATH_INFO allowed?
2715 if($FilePattern && $ENV{'PATH_INFO'} && $ENV{'PATH_INFO'} ne '-' &&
2716 ($ENV{'PATH_INFO'} !~ m@($FilePattern)$@is))
2718 # Unsupported file types can be processed by a special raw-file
2719 if($BinaryMapFile)
2721 $ENV{'CGI_BINARY_FILE'} = $ENV{'PATH_INFO'};
2722 $ENV{'PATH_INFO'} = $BinaryMapFile;
2724 else
2726 dieHandler(10, "Illegal file\n");
2732 # End of Security Access Control
2735 ############################################################################
2737 # Get the POST part of the query and add it to the QUERY_STRING.
2740 sub Get_POST_part_of_query
2743 # If POST, Read data from stdin to QUERY_STRING
2744 if($ENV{'REQUEST_METHOD'} =~ /POST/is)
2746 # SECURITY: Check size of Query String
2747 $ENV{'CONTENT_LENGTH'} <= $MaximumQuerySize || dieHandler(11, "Query too long: $ENV{'CONTENT_LENGTH'}\n"); # Query too long
2748 my $QueryRead = 0;
2749 my $SystemRead = $ENV{'CONTENT_LENGTH'};
2750 $ENV{'QUERY_STRING'} .= '&' if length($ENV{'QUERY_STRING'}) > 0;
2751 while($SystemRead > 0)
2753 $QueryRead = sysread(STDIN, $Post, $SystemRead); # Limit length
2754 $ENV{'QUERY_STRING'} .= $Post;
2755 $SystemRead -= $QueryRead;
2757 # Update decoded Query String
2758 $default_values{CGI_Decoded_QS} = YOUR_CGIQUERYDECODE();
2759 $default_values{CGI_Content_Length} =
2760 length($default_values{CGI_Decoded_QS});
2764 # End of getting POST part of query
2767 ############################################################################
2769 # Start (HTML) output and logging
2770 # (if there are irregularities, it can kill the current process)
2773 sub Initialize_output
2775 # Construct the REAL file path (except for STDIN on the command line)
2776 my $file_path = $ENV{'PATH_INFO'} ne '-' ? $SS_PUB . $ENV{'PATH_INFO'} : '-';
2777 $file_path =~ s/\?.*$//; # Remove query
2778 # This is only necessary if your server does not catch ../ directives
2779 $file_path !~ m@\.\./@ || dieHandler(12, "Illegal ../ Construct\n"); # SECURITY: Do not allow ../ constructs
2781 # Block STDIN use (-) if CGIscriptor is servicing a HTTP request
2782 if($file_path eq '-')
2784 dieHandler(13, "STDIN request in On Line system\n") if $BLOCK_STDIN_HTTP_REQUEST
2785 && ($ENV{'SERVER_SOFTWARE'}
2786 || $ENV{'SERVER_NAME'}
2787 || $ENV{'GATEWAY_INTERFACE'}
2788 || $ENV{'SERVER_PROTOCOL'}
2789 || $ENV{'SERVER_PORT'}
2790 || $ENV{'REMOTE_ADDR'}
2791 || $ENV{'HTTP_USER_AGENT'});
2796 if($ClientLog)
2798 open(ClientLog, ">>$ClientLog");
2799 print ClientLog "$LocalTime | ",
2800 ($ENV{REMOTE_USER} || "-"), " ",
2801 ($ENV{REMOTE_IDENT} || "-"), " ",
2802 ($ENV{REMOTE_HOST} || "-"), " ",
2803 $ENV{REMOTE_ADDR}, " ",
2804 $ENV{PATH_INFO}, " ",
2805 $ENV{'CGI_BINARY_FILE'}, " ",
2806 ($default_values{CGI_Content_Length} || "-"),
2807 "\n";
2808 close(ClientLog);
2810 if($QueryLog)
2812 open(QueryLog, ">>$QueryLog");
2813 print QueryLog "$LocalTime\n",
2814 ($ENV{REMOTE_USER} || "-"), " ",
2815 ($ENV{REMOTE_IDENT} || "-"), " ",
2816 ($ENV{REMOTE_HOST} || "-"), " ",
2817 $ENV{REMOTE_ADDR}, ": ",
2818 $ENV{PATH_INFO}, " ",
2819 $ENV{'CGI_BINARY_FILE'}, "\n";
2821 # Write Query to Log file
2822 print QueryLog $default_values{CGI_Decoded_QS}, "\n\n";
2823 close(QueryLog);
2826 # Return the file path
2827 return $file_path;
2830 # End of Initialize output
2833 ############################################################################
2835 # Handle login access
2837 # Access is based on a valid session ticket.
2838 # Session tickets should be dependend on user name
2839 # and IP address. The patterns of URLs for which a
2840 # session ticket is needed and the login URL are stored in
2841 # %TicketRequiredPatterns as:
2842 # 'RegEx pattern' -> 'SessionPath\tPasswordPath\tLogin URL\tExpiration'
2845 sub Log_In_Access # () -> 0 = Access Allowed, Login page if access is not allowed
2847 # No patterns, no login
2848 return 0 unless %TicketRequiredPatterns;
2850 # Get and initialize values (watch out for stuff processed by BinaryMap files)
2851 my ($SessionPath, $PasswordsPath, $Login, $valid_duration) = ("", "", "", 0);
2852 my $PATH_INFO = $ENV{'CGI_BINARY_FILE'} ? $ENV{'CGI_BINARY_FILE'} : $ENV{'PATH_INFO'};
2853 my $REMOTE_ADDR = $ENV{'REMOTE_ADDR'};
2854 return 0 if $REMOTE_ADDR =~ /[^0-9\.]/;
2855 # Extract TICKETs, starting with returned cookies
2856 CGIexecute::defineCGIvariable('LOGINTICKET', "");
2857 CGIexecute::defineCGIvariable('SESSIONTICKET', "");
2858 CGIexecute::defineCGIvariable('CHALLENGETICKET', "");
2859 if($ENV{'COOKIE_JAR'})
2861 my $CurrentCookieJar = $ENV{'COOKIE_JAR'};
2862 $CurrentCookieJar =~ s/\w+\=\-\s*(\;\s*|$)//isg;
2863 if($CurrentCookieJar =~ /\s*CGIscriptorLOGIN\=\s*([^\;]+)/)
2865 ${"CGIexecute::LOGINTICKET"} = $1;
2867 if($CurrentCookieJar =~ /\s*CGIscriptorCHALLENGE\=\s*([^\;]+)/ && $1 ne '-')
2869 ${"CGIexecute::CHALLENGETICKET"} = $1;
2871 if($CurrentCookieJar =~ /\s*CGIscriptorSESSION\=\s*([^\;]+)/ && $1 ne '-')
2873 ${"CGIexecute::SESSIONTICKET"} = $1;
2876 # Get and check the tickets. Tickets are restricted to word-characters (alphanumeric+_+.)
2877 my $LOGINTICKET = ${"CGIexecute::LOGINTICKET"};
2878 return 0 if ($LOGINTICKET && $LOGINTICKET =~ /[^\w\.]/isg);
2879 my $SESSIONTICKET = ${"CGIexecute::SESSIONTICKET"};
2880 return 0 if ($SESSIONTICKET && $SESSIONTICKET =~ /[^\w\.]/isg);
2881 my $CHALLENGETICKET = ${"CGIexecute::CHALLENGETICKET"};
2882 return 0 if ($SESSIONTICKET && $SESSIONTICKET =~ /[^\w\.]/isg);
2883 # Look for a LOGOUT message
2884 my $LOGOUT = $ENV{QUERY_STRING} =~ /(^|\&)LOGOUT([\=\&]|$)/;
2885 # Username and password
2886 CGIexecute::defineCGIvariable('CGIUSERNAME', "");
2887 my $username = lc(${"CGIexecute::CGIUSERNAME"});
2888 return 0 if $username =~ m!^[^\w]!isg || $username =~ m![^\w \-]!isg;
2889 my $userfile = lc($username);
2890 $userfile =~ s/[^\w]/_/isg;
2891 CGIexecute::defineCGIvariable('PASSWORD', "");
2892 my $password = ${"CGIexecute::PASSWORD"};
2893 CGIexecute::defineCGIvariable('NEWUSERNAME', "");
2894 my $newuser = lc(${"CGIexecute::NEWUSERNAME"});
2895 CGIexecute::defineCGIvariable('NEWPASSWORD', "");
2896 my $newpassword = ${"CGIexecute::NEWPASSWORD"};
2898 foreach my $pattern (keys(%TicketRequiredPatterns))
2900 # Check BOTH the real PATH_INFO and the CGI_BINARY_FILE variable
2901 if($ENV{'PATH_INFO'} =~ m#$pattern# || $ENV{'CGI_BINARY_FILE'} =~ m#$pattern#)
2903 # Fall through a sieve of requirements
2904 ($SessionPath, $PasswordsPath, $Login, $validtime) = split(/\t/, $TicketRequiredPatterns{$pattern});
2905 # If a LOGOUT is present, remove everything
2906 if($LOGOUT && !$LOGINTICKET)
2908 unlink "$SessionPath/$LOGINTICKET" if $LOGINTICKET && (-s "$SessionPath/$LOGINTICKET");
2909 $LOGINTICKET = "";
2910 unlink "$SessionPath/$SESSIONTICKET" if $SESSIONTICKET && (-s "$SessionPath/$SESSIONTICKET");
2911 $SESSIONTICKET = "";
2912 unlink "$SessionPath/$CHALLENGETICKET" if $CHALLENGETICKET && (-s "$SessionPath/$CHALLENGETICKET");
2913 $CHALLENGETICKET = "";
2914 unlink "$SessionPath/$REMOTE_ADDR" if (-s "$SessionPath/$REMOTE_ADDR");
2915 $CHALLENGETICKET = "";
2916 goto Login;
2918 # Is there a change password request?
2919 if($newuser && $LOGINTICKET && $username)
2921 goto Login unless (-s "$SessionPath/$LOGINTICKET");
2922 goto Login unless (-s "$PasswordsPath/$userfile");
2923 my $ticket_valid = check_ticket_validity("PASSWORD", "$PasswordsPath/$userfile", $REMOTE_ADDR, $PATH_INFO);
2924 goto Login unless $ticket_valid;
2926 my ($sessiontype, $currentticket) = ("", "");
2927 if($CHALLENGETICKET) {($sessiontype, $currentticket) = ("CHALLENGE", $CHALLENGETICKET);}
2928 elsif($SESSIONTICKET) {($sessiontype, $currentticket) = ("SESSION", $SESSIONTICKET);}
2929 elsif(-s "$SessionPath/$REMOTE_ADDR") {($sessiontype, $currentticket) = ("IPADDRESS", $REMOTE_ADDR);
2931 if($sessiontype)
2933 goto Login unless (-s "$SessionPath/$currentticket");
2934 my $ticket_valid = check_ticket_validity($sessiontype, "$SessionPath/$currentticket", $REMOTE_ADDR, $PATH_INFO);
2935 goto Login unless $ticket_valid;
2937 # Authorize
2938 my $TMPTICKET = authorize_login("$SessionPath/$LOGINTICKET", "$PasswordsPath/$userfile", $password, $SessionPath);
2939 goto Login unless $TMPTICKET;
2941 # Create a new user account
2942 CGIexecute::defineCGIvariable('NEWSESSION', "");
2943 my $newsession = ${"CGIexecute::NEWSESSION"};
2944 my $newaccount = create_newuser("$SessionPath/$LOGINTICKET", "$SessionPath/$currentticket",
2945 "$PasswordsPath/$userfile", $password, $newuser, $newpassword, $newsession);
2946 CGIexecute::defineCGIvariable('NEWACCOUNTTEXT', $newaccount);
2947 ${CGIexecute::NEWACCOUNTTEXT} = $newaccount;
2948 # NEWACCOUNTTEXT is NOT to be set by the query
2949 CGIexecute::ProtectCGIvariable('NEWACCOUNTTEXT');
2952 # Ready
2953 return 0;
2955 # Is there a change password request?
2956 elsif($newpassword && $LOGINTICKET && $username)
2958 goto Login unless (-s "$SessionPath/$LOGINTICKET");
2959 goto Login unless (-s "$PasswordsPath/$userfile");
2960 my $ticket_valid = check_ticket_validity("PASSWORD", "$PasswordsPath/$userfile", $REMOTE_ADDR, $PATH_INFO);
2961 goto Login unless $ticket_valid;
2963 my ($sessiontype, $currentticket) = ("", "");
2964 if($CHALLENGETICKET) {($sessiontype, $currentticket) = ("CHALLENGE", $CHALLENGETICKET);}
2965 elsif($SESSIONTICKET) {($sessiontype, $currentticket) = ("SESSION", $SESSIONTICKET);}
2966 elsif(-s "$SessionPath/$REMOTE_ADDR") {($sessiontype, $currentticket) = ("IPADDRESS", $REMOTE_ADDR);
2968 if($sessiontype)
2970 goto Login unless (-s "$SessionPath/$currentticket");
2971 my $ticket_valid = check_ticket_validity($sessiontype, "$SessionPath/$currentticket", $REMOTE_ADDR, $PATH_INFO);
2972 goto Login unless $ticket_valid;
2974 # Authorize
2975 change_password("$SessionPath/$LOGINTICKET", "$SessionPath/$currentticket", "$PasswordsPath/$userfile", $password, $newpassword);
2976 # After a change of password, you have to login again for a CHALLENGE
2977 if($CHALLENGETICKET){$CHALLENGETICKET = "";};
2978 # Ready
2979 return 0;
2981 # Is there a login ticket of this name?
2982 elsif($LOGINTICKET)
2984 my $tickets_removed = remove_expired_tickets($SessionPath);
2985 goto Login unless (-s "$SessionPath/$LOGINTICKET");
2986 goto Login unless (-s "$PasswordsPath/$userfile");
2987 my $ticket_valid = check_ticket_validity("PASSWORD", "$PasswordsPath/$userfile", $REMOTE_ADDR, $PATH_INFO);
2988 goto Login unless $ticket_valid;
2989 $ticket_valid = check_ticket_validity("LOGIN", "$SessionPath/$LOGINTICKET", $REMOTE_ADDR, ".");
2990 goto Login unless $ticket_valid;
2992 # Remove any lingering tickets
2993 unlink "$SessionPath/$SESSIONTICKET" if $SESSIONTICKET && (-s "$SessionPath/$SESSIONTICKET");
2994 $SESSIONTICKET = "";
2995 unlink "$SessionPath/$CHALLENGETICKET" if $CHALLENGETICKET && (-s "$SessionPath/$CHALLENGETICKET");
2996 $CHALLENGETICKET = "";
2999 # Authorize
3000 my $TMPTICKET = authorize_login("$SessionPath/$LOGINTICKET", "$PasswordsPath/$userfile", $password, $SessionPath);
3001 if($TMPTICKET)
3003 my $authorization = read_ticket("$PasswordsPath/$userfile");
3004 # Session type is read from the userfile
3005 if($authorization->{"Session"} && $authorization->{"Session"}->[0] eq "CHALLENGE")
3007 # Create New Random CHALLENGETICKET
3008 $CHALLENGETICKET = $TMPTICKET;
3009 create_session_file("$SessionPath/$CHALLENGETICKET", "$SessionPath/$LOGINTICKET", "$PasswordsPath/$userfile", $PATH_INFO);
3011 elsif($authorization->{"Session"} && $authorization->{"Session"}->[0] eq "IPADDRESS")
3013 create_session_file("$SessionPath/$REMOTE_ADDR", "$SessionPath/$LOGINTICKET", "$PasswordsPath/$userfile", $PATH_INFO);
3015 else
3017 $SESSIONTICKET = $TMPTICKET;
3018 create_session_file("$SessionPath/$SESSIONTICKET", "$SessionPath/$LOGINTICKET", "$PasswordsPath/$userfile", $PATH_INFO);
3019 $SETCOOKIELIST{"CGIscriptorSESSION"} = "-";
3022 # Login ticket file has been used, remove it
3023 unlink($loginfile);
3025 # Is there a session ticket of this name?
3026 # CHALLENGE
3027 if($CHALLENGETICKET)
3029 goto Login unless (-s "$SessionPath/$CHALLENGETICKET");
3030 my $ticket_valid = check_ticket_validity("CHALLENGE", "$SessionPath/$CHALLENGETICKET", $REMOTE_ADDR, $PATH_INFO);
3031 goto Login unless $ticket_valid;
3033 my $oldchallenge = read_ticket("$SessionPath/$CHALLENGETICKET");
3034 my $userfile = lc($oldchallenge->{"Username"}->[0]);
3035 $userfile =~ s/[^\w]/_/isg;
3036 goto Login unless (-s "$PasswordsPath/$userfile");
3038 $ticket_valid = check_ticket_validity("PASSWORD", "$PasswordsPath/$userfile", $REMOTE_ADDR, $PATH_INFO);
3039 goto Login unless $ticket_valid;
3041 my $NEWCHALLENGETICKET = "";
3042 $NEWCHALLENGETICKET = copy_challenge_file("$SessionPath/$CHALLENGETICKET", "$PasswordsPath/$userfile", $SessionPath);
3043 # Sessionticket is available to scripts, do NOT set the cookie
3044 $ENV{'CHALLENGETICKET'} = $NEWCHALLENGETICKET;
3045 return 0;
3047 # IPADDRESS
3048 elsif(-s "$SessionPath/$REMOTE_ADDR")
3050 my $ticket_valid = check_ticket_validity("IPADDRESS", "$SessionPath/$REMOTE_ADDR", $REMOTE_ADDR, $PATH_INFO);
3051 goto Login unless $ticket_valid;
3052 return 0;
3054 # SESSION
3055 elsif($SESSIONTICKET)
3057 goto Login unless (-s "$SessionPath/$SESSIONTICKET");
3058 my $ticket_valid = check_ticket_validity("SESSION", "$SessionPath/$SESSIONTICKET", $REMOTE_ADDR, $PATH_INFO);
3059 goto Login unless $ticket_valid;
3060 # Sessionticket is available to scripts
3061 $ENV{'SESSIONTICKET'} = $SESSIONTICKET;
3062 return 0;
3065 goto Login;
3066 return 0;
3069 return 0;
3071 Login:
3072 create_login_file($PasswordsPath, $SessionPath, $REMOTE_ADDR);
3073 # Note, cookies are set only ONCE
3074 $SETCOOKIELIST{"CGIscriptorLOGIN"} = "-";
3075 return "$YOUR_HTML_FILES/$Login";
3078 sub authorize_login # ($loginfile, $authorizationfile, $password, $SessionPath) => SESSIONTICKET First two arguments are file paths
3080 my $loginfile = shift || "";
3081 my $authorizationfile = shift || "";
3082 my $password = shift || "";
3083 my $SessionPath = shift || "";
3085 # Get Login session ticket
3086 my $loginticket = read_ticket($loginfile);
3087 # Get User credentials for authorization
3088 my $authorization = read_ticket($authorizationfile);
3090 # Get Randomsalt
3091 my $Randomsalt = $loginticket->{'Randomsalt'}->[0];
3092 return "" unless $Randomsalt;
3094 my $storedpassword = $authorization->{'Password'}->[0];
3095 return "" unless $storedpassword;
3096 my $Hashedpassword = hash_string("$Randomsalt$storedpassword");
3097 chomp($Hashedpassword);
3098 return "" unless $password eq $Hashedpassword;
3100 # Extract Session Ticket
3101 my $loginsession = $loginticket->{'Session'}->[0];
3102 my $sessionticket = hash_string("$loginsession$storedpassword");
3103 chomp($sessionticket);
3104 $sessionticket = "" if -x "$SessionPath/$sessionticket";
3106 return $sessionticket;
3109 sub change_password # ($loginfile, $sessionfile, $authorizationfile, $password, $newpassword) First three arguments are file paths
3111 my $loginfile = shift || "";
3112 my $sessionfile = shift || "";
3113 my $authorizationfile = shift || "";
3114 my $password = shift || "";
3115 my $newpassword = shift || "";
3116 # Get Login session ticket
3117 my $loginticket = read_ticket($loginfile);
3118 # Login ticket file has been used, remove it
3119 unlink($loginfile);
3120 # Get Randomsalt
3121 my $Randomsalt = $loginticket->{'Randomsalt'}->[0];
3123 return "" unless $Randomsalt;
3125 # Get session ticket
3126 my $sessionticket = read_ticket($sessionfile);
3127 # Get User credentials for authorization
3128 my $authorization = read_ticket($authorizationfile);
3129 return "" unless lc($authorization->{'Username'}->[0]) eq lc($sessionticket->{'Username'}->[0]);
3131 my $storedpassword = $authorization->{'Password'}->[0];
3132 my $Hashedpassword = hash_string("$Randomsalt$storedpassword");
3133 chomp($Hashedpassword);
3134 return "" unless $password eq $Hashedpassword;
3136 # Decrypt the $newpassword
3137 my $loginticketid = $loginticket->{'Session'}->[0];
3138 my $passwordkey = hash_string("$loginticketid$storedpassword");
3139 chomp($passwordkey);
3140 my $decryptedPassword = XOR_hex_strings($passwordkey, $newpassword);
3141 return "" unless $decryptedPassword;
3142 # Authorization succeeded, change password
3143 $authorization->{'Password'}->[0] = $decryptedPassword;
3145 open(USERFILE, "<$authorizationfile") || die "<$authorizationfile: $!\n";
3146 my @USERlines = <USERFILE>;
3147 close(USERFILE);
3148 # Change
3149 open(USERFILE, ">$authorizationfile") || die ">$authorizationfile: $!\n";
3150 foreach my $line (@USERlines)
3152 $line =~ s/^Password: ($storedpassword)$/Password: $decryptedPassword/ig;
3153 print USERFILE $line;
3155 close(USERFILE);
3157 return $newpassword;
3160 sub create_newuser # ($loginfile, $sessionfile, $authorizationfile, $password, $newuser, $newpassword, $newsession) First two arguments are file paths
3162 my $loginfile = shift || "";
3163 my $sessionfile = shift || "";
3164 my $authorizationfile = shift || "";
3165 my $password = shift || "";
3166 my $newuser = shift || "";
3167 my $newpassword = shift || "";
3168 my $newsession = shift || "";
3170 # Get Login session ticket
3171 my $loginticket = read_ticket($loginfile);
3172 # Login ticket file has been used, remove it
3173 unlink($loginfile);
3174 # Get Randomsalt
3175 my $Randomsalt = $loginticket->{'Randomsalt'}->[0];
3177 return "" unless $Randomsalt;
3179 # Get session ticket
3180 my $sessionticket = read_ticket($sessionfile);
3181 # Get User credentials for authorization
3182 my $authorization = read_ticket($authorizationfile);
3183 return "" unless lc($authorization->{'Username'}->[0]) eq lc($sessionticket->{'Username'}->[0]);
3184 my $sessionkey = $sessionticket->{'Key'}->[0];
3185 my $sessionRansal = $sessionticket->{'Randomsalt'}->[0];
3186 my $serversalt = $authorization->{'Salt'}->[0];
3187 return "" unless $serversalt;
3189 my $storedpassword = $authorization->{'Password'}->[0];
3190 my $Hashedpassword = hash_string("$Randomsalt$storedpassword");
3191 chomp($Hashedpassword);
3192 return "" unless $password eq $Hashedpassword;
3194 # Decrypt the $newpassword
3195 my $loginticketid = $loginticket->{'Session'}->[0];
3196 my $passwordkey = hash_string("$loginticketid$storedpassword");
3197 my $decryptedPassword = XOR_hex_strings($passwordkey, $newpassword);
3198 return "" unless $decryptedPassword;
3199 # Authorization succeeded, create new account
3200 my $newaccount = {};
3201 $newaccount->{'Type'} = ['PASSWORD'];
3202 $newaccount->{'Username'} = [$newuser];
3203 $newaccount->{'Password'} = [$decryptedPassword];
3204 $newaccount->{'Salt'} = [$serversalt];
3205 $newaccount->{'Session'} = ['SESSION'];
3206 if($newsession eq 'IPADDRESS'){$newaccount->{'Session'} = ['IPADDRESS'];};
3207 if($newsession eq 'CHALLENGE'){$newaccount->{'Session'} = ['CHALLENGE'];};
3209 # Re-encrypt the new password
3210 my $newkey = hash_string("$sessionRansal$storedpassword");
3211 $newaccount->{'Password'}->[0] = XOR_hex_strings($newkey, $newaccount->{'Password'}->[0]);
3213 # AllowedPaths
3214 my $NewAllowedPaths = "";
3215 my $PATH_INFO = $ENV{'CGI_BINARY_FILE'} ? $ENV{'CGI_BINARY_FILE'} : $ENV{'PATH_INFO'};
3216 my $currentRoot = "";
3217 $currentRoot = $1 if $PATH_INFO =~ m!^([\w\-\. /]+)!isg;
3218 $currentRoot =~ s![^/]+$!!isg;
3219 if($currentRoot)
3221 $currentRoot .= '/' unless $currentRoot =~ m!/$!;
3222 $NewAllowedPaths .= 'AllowedPaths: ^'.${currentRoot}.'[\w\-]*\.html?'."\n";
3224 else
3226 # Tricky PATH_INFO, deny all
3227 $NewAllowedPaths .= "DeniedPaths: ^/\n";
3229 # Construct home directory path
3230 my $currentHome = lc($newaccount->{'Username'}->[0]);
3231 $currentHome =~ s/[^\w]/_/isg;
3232 $NewAllowedPaths .= "AllowedPaths: ^${currentRoot}$currentHome/\n";
3233 chomp($NewAllowedPaths);
3235 # Write
3236 my $datetime = gmtime();
3237 my $timesec = time();
3238 my $newaccounttext = << "ENDOFNEWACCOUNTTEXT";
3239 Type: $newaccount->{'Type'}->[0]
3240 Username: $newaccount->{'Username'}->[0]
3241 Password: <span id="newaccount">$newaccount->{'Password'}->[0]</span>
3242 Salt: $newaccount->{'Salt'}->[0]
3243 $NewAllowedPaths
3244 Session: $newaccount->{'Session'}->[0]
3245 Date: $datetime UTC
3246 Time: $timesec
3247 ENDOFNEWACCOUNTTEXT
3248 return $newaccounttext;
3251 sub XOR_hex_strings # (hex1, hex2) -> hex
3253 my $hex1 = shift || "";
3254 my $hex2 = shift || "";
3255 my @hex1list = split('', $hex1);
3256 my @hex2list = split('', $hex2);
3257 my @hexresultlist = ();
3258 for(my $i; $i < scalar(@hex1list); ++$i)
3260 my $d1 = hex($hex1list[$i]);
3261 my $d2 = hex($hex2list[$i]);
3262 my $dresult = ($d1 ^ $d2);
3263 $hexresultlist[$i] = sprintf("%x", $dresult);
3265 $hexresult = join('', @hexresultlist);
3266 return $hexresult;
3269 # Copy a Challenge ticket file to a new name which is the hash of the new $CHALLENGETICKET and the password
3270 sub copy_challenge_file #($oldchallengefile, $authorizationfile, $sessionpath) -> $CHALLENGETICKET
3272 my $oldchallengefile = shift || "";
3273 my $authorizationfile = shift || "";
3274 my $sessionpath = shift || "";
3275 $sessionpath =~ s!/+$!!g;
3277 # Get Login session ticket
3278 my $oldchallenge = read_ticket($oldchallengefile);
3280 # Get Authorization (user) session file
3281 my $authorization = read_ticket($authorizationfile);
3282 my $storedpassword = $authorization->{'Password'}->[0];
3283 return "" unless $storedpassword;
3284 my $challengekey = $oldchallenge->{'Key'}->[0];
3285 return "" unless $challengekey;
3287 # Create Random Hash Salt
3288 my $NEWCHALLENGETICKET = get_random_hex();;
3289 my $newchallengefile = hash_string("$NEWCHALLENGETICKET$challengekey");
3290 return "" unless $newchallengefile;
3292 $ENV{'CHALLENGETICKET'} = $NEWCHALLENGETICKET;
3293 CGIexecute::defineCGIvariable('CHALLENGETICKET', "");
3294 ${"CGIexecute::CHALLENGETICKET"} = $NEWCHALLENGETICKET;
3296 # Write Session Ticket
3297 open(OLDCHALLENGE, "<$oldchallengefile") || die "<$oldchallengefile: $!\n";
3298 my @OldChallengeLines = <OLDCHALLENGE>;
3299 close(OLDCHALLENGE);
3300 # Old file should now be removed
3301 unlink($oldchallengefile);
3303 open(SESSION, ">$sessionpath/$newchallengefile") || die "$sessionpath/$newchallengefile: $!\n";
3304 foreach $line (@OldChallengeLines)
3306 print SESSION $line;
3308 close(SESSION);
3310 return $NEWCHALLENGETICKET;
3313 sub create_login_file #($PasswordDir, $SessionDir, $IPaddress)
3315 my $PasswordDir = shift || "";
3316 my $SessionDir = shift || "";
3317 my $IPaddress = shift || "";
3319 # Create Login Ticket
3320 my $LOGINTICKET= get_random_hex ();
3322 # Create Random Hash Salt
3323 my $RANDOMSALT= get_random_hex();
3325 # Create SALT file if it does not exist
3326 # Remove this, including test account for life system
3327 unless(-d "$SessionDir")
3329 `mkdir -p "$SessionDir"`;
3331 unless(-d "$PasswordDir")
3333 `mkdir -p "$PasswordDir"`;
3335 # Create SERVERSALT and default test account
3336 my $SERVERSALT = "";
3337 unless(-s "$PasswordDir/SALT")
3339 $SERVERSALT= get_random_hex();
3340 open(SALTFILE, ">$PasswordDir/SALT") || die ">$PasswordDir/SALT: $!\n";
3341 print SALTFILE "$SERVERSALT\n";
3342 close(SALTFILE);
3344 # Update test account (should be removed in live system)
3345 my @alltestusers = ("test", "testip", "testchallenge", "admin");
3346 foreach my $testuser (@alltestusers)
3348 if(-s "$PasswordDir/$testuser")
3350 my $plainpassword = $testuser eq 'admin' ? "There is no password like more password" : "test";
3351 my $storedpassword = hash_string("${SERVERSALT}${$plainpassword}${testuser}");
3352 chomp($storedpassword);
3353 open(USERFILE, "<$PasswordDir/$testuser") || die "</Private/.Passwords/$testuser: $!\n";
3354 @USERlines = <USERFILE>;
3355 close(USERFILE);
3357 open(USERFILE, ">$PasswordDir/$testuser") || die ">/Private/.Passwords/$testuser: $!\n";
3358 # Add Password and Salt
3359 foreach my $line (@USERlines)
3361 $line =~ s/^Password: (.*)$/Password: $storedpassword/ig;
3362 $line =~ s/^Salt: (.*)$/Salt: $SERVERSALT/ig;
3364 # Print the line
3365 print USERFILE $line;
3367 # Disable all accounts with an expiration date, ie, admin
3368 print USERFILE "Expires: -1\n" if $line =~ /Expires/;
3370 close(USERFILE);
3376 # Read in site Salt
3377 open(SALTFILE, "<$PasswordDir/SALT") || die "$PasswordDir/SALT: $!\n";
3378 $SERVERSALT=<SALTFILE>;
3379 close(SALTFILE);
3380 chomp($SERVERSALT);
3382 # Create login session ticket
3383 my $datetime = gmtime();
3384 my $timesec = time();
3385 open(LOGINTICKET, ">$SessionDir/$LOGINTICKET") || die "$SessionDir/$LOGINTICKET: $!\n";
3386 print LOGINTICKET << "ENDOFLOGINTICKET";
3387 Type: LOGIN
3388 IPaddress: $IPaddress
3389 Salt: $SERVERSALT
3390 Session: $LOGINTICKET
3391 Randomsalt: $RANDOMSALT
3392 Expires: +600s
3393 Date: $datetime UTC
3394 Time: $timesec
3395 ENDOFLOGINTICKET
3396 close(LOGINTICKET);
3398 # Set global variables
3399 # $SERVERSALT
3400 $ENV{'SERVERSALT'} = $SERVERSALT;
3401 CGIexecute::defineCGIvariable('SERVERSALT', "");
3402 ${"CGIexecute::SERVERSALT"} = $SERVERSALT;
3404 # $SESSIONTICKET
3405 $ENV{'SESSIONTICKET'} = $SESSIONTICKET;
3406 CGIexecute::defineCGIvariable('SESSIONTICKET', "");
3407 ${"CGIexecute::SESSIONTICKET"} = $SESSIONTICKET;
3409 # $RANDOMSALT
3410 $ENV{'RANDOMSALT'} = $RANDOMSALT;
3411 CGIexecute::defineCGIvariable('RANDOMSALT', "");
3412 ${"CGIexecute::RANDOMSALT"} = $RANDOMSALT;
3414 # $LOGINTICKET
3415 $ENV{'LOGINTICKET'} = $LOGINTICKET;
3416 CGIexecute::defineCGIvariable('LOGINTICKET', "");
3417 ${"CGIexecute::LOGINTICKET"} = $LOGINTICKET;
3419 return $ENV{'LOGINTICKET'};
3422 sub create_session_file #($sessionfile, $loginfile, $authorizationfile, $path) -> Is $loginfile deleted? 0/1
3424 my $sessionfile = shift || "";
3425 my $loginfile = shift || "";
3426 my $authorizationfile = shift || "";
3427 my $path = shift || "";
3429 # Get Login session ticket
3430 my $loginticket = read_ticket($loginfile);
3432 # Get Authorization (user) session file
3433 my $authorization = read_ticket($authorizationfile);
3434 # For a Session or a Challenge, we need a stored key
3435 my $sessionkey = "";
3436 if($authorization->{'Session'} && $authorization->{'Session'}->[0] ne 'IPADDRESS')
3438 my $storedpassword = $authorization->{'Password'}->[0];
3439 my $loginticketid = $loginticket->{'Session'}->[0];
3440 $sessionkey = hash_string("$loginticketid$storedpassword");
3441 chomp($sessionkey);
3444 # Convert Authorization content to Session content
3445 my $sessionContent = {};
3446 $sessionContent->{IPaddress} = $loginticket->{'IPaddress'};
3447 $sessionContent->{Randomsalt} = $loginticket->{'Randomsalt'};
3448 $sessionContent->{AllowedPaths} = $authorization->{'AllowedPaths'};
3449 $sessionContent->{DeniedPaths} = $authorization->{'DeniedPaths'};
3450 $sessionContent->{Expires} = $authorization->{'MaxLifetime'};
3451 $sessionContent->{Capabilities} = $authorization->{'Capabilities'};
3452 foreach my $pattern (keys(%TicketRequiredPatterns))
3454 if($path =~ m#$pattern#)
3456 my ($SessionPath, $PasswordsPath, $Login, $validtime) = split(/\t/, $TicketRequiredPatterns{$pattern});
3457 push(@{$sessionContent->{Expires}}, $validtime);
3461 # Write Session Ticket
3462 open(SESSION, ">$sessionfile") || die "$sessionfile: $!\n";
3463 if($authorization->{'Session'} && $authorization->{'Session'}->[0])
3465 print SESSION "Type: ", $authorization->{'Session'}->[0], "\n";
3467 else
3469 print SESSION "Type: SESSION\n";
3471 foreach my $list ('IPaddress', 'AllowedPaths', 'DeniedPaths', 'Expires', 'Capabilities', 'Randomsalt')
3473 foreach my $entry (@{$sessionContent->{$list}})
3475 print SESSION "$list: $entry\n";
3479 # Special lines
3480 print SESSION "Username: ", lc($authorization->{'Username'}->[0]), "\n";
3481 print SESSION "Key: $sessionkey\n" if $sessionkey;
3482 print SESSION "Date: ", gmtime()." UTC\n";
3483 print SESSION "Time: ", time, "\n";
3484 close(SESSION);
3486 # Login file should now be removed
3487 return unlink($loginfile);
3490 sub check_ticket_validity # ($type, $ticketfile, $address, $path)
3492 my $type = shift || "SESSION";
3493 my $ticketfile = shift || "";
3494 my $address = shift || "";
3495 my $path = shift || "";
3497 # Is there a session ticket of this name?
3498 return 0 unless -s "$ticketfile";
3500 # There is a session ticket, is it linked to this IP address?
3501 my $ticket = read_ticket($ticketfile);
3503 # Is this the right type of ticket
3504 return unless $ticket->{"Type"}->[0] eq $type;
3506 # Does the IP address match?
3507 my $IPmatches = 0;
3508 for $IPpattern (@{$ticket->{"IPaddress"}})
3510 ++$IPmatches if $address =~ m#^$IPpattern#ig;
3512 return 0 unless !$ticket->{"IPaddress"} || $IPmatches;
3514 # Is the path denied
3515 my $Pathmatches = 0;
3516 foreach $Pathpattern (@{$ticket->{"DeniedPaths"}})
3518 ++$Pathmatches if $path =~ m#$Pathpattern#ig;
3520 return 0 if @{$ticket->{"DeniedPaths"}} && $Pathmatches;
3522 # Is the path allowed
3523 $Pathmatches = 0;
3524 foreach $Pathpattern (@{$ticket->{"AllowedPaths"}})
3526 ++$Pathmatches if $path =~ m#$Pathpattern#ig;
3528 return 0 unless !@{$ticket->{"AllowedPaths"}} || $Pathmatches;
3530 # Is the ticket expired?
3531 my $Expired = 0;
3532 if($ticket->{"Expires"} && @{$ticket->{"Expires"}})
3534 my $CurrentTime = time();
3535 ++$Expired if($CurrentTime > $ticket->{"Expires"}->[0]);
3537 return 0 if $Expired;
3539 # Make login values available (will also protect against resetting by query)
3540 $ENV{"LOGINUSERNAME"} = lc($ticket->{'Username'}->[0]);
3541 $ENV{"LOGINIPADDRESS"} = $address;
3542 $ENV{"LOGINPATH"} = $path;
3543 $ENV{"SESSIONTYPE"} = $type unless $type eq "PASSWORD";
3545 # Set Capabilities, if present
3546 if($ticket->{'Username'}->[0] && @{$ticket->{'Capabilities'}})
3548 $ENV{'CAPABILITIES'} = $ticket->{'Username'}->[0];
3549 CGIexecute::defineCGIvariableList('CAPABILITIES', "");
3550 @{"CGIexecute::CAPABILITIES"} = @{$ticket->{'Capabilities'}};
3551 # Capabilities should not be changed anymore by CGI query!
3553 # Capabilities are NOT to be set by the query
3554 CGIexecute::ProtectCGIvariable('CAPABILITIES');
3556 return 1;
3560 sub remove_expired_tickets # ($path) -> number of tickets removed
3562 my $path = shift || "";
3563 return 0 unless $path;
3564 $path =~ s!/+$!!g;
3565 my $removed_tickets = 0;
3566 my @ticketlist = glob("$path/*");
3567 foreach my $ticketfile (@ticketlist)
3569 my $ticket = read_ticket($ticketfile);
3570 if(@{$ticket->{'Expires'}} && $ticket->{'Expires'}->[0] < time)
3572 unlink $ticketfile;
3573 ++$removed_tickets;
3576 return $removed_tickets;
3579 sub read_ticket # ($ticketfile) -> &%ticket
3581 my $ticketfile = shift || "";
3582 my $ticket = {};
3583 if($ticketfile && -s $ticketfile)
3585 open(TICKETFILE, "<$ticketfile") || die "$ticketfile: $!\n";
3586 my @alllines = <TICKETFILE>;
3587 close(TICKETFILE);
3588 foreach my $currentline (@alllines)
3590 # Skip empty lines and comments
3591 next unless $currentline =~ /\S/;
3592 next if $currentline =~ /^\s*\#/;
3594 if($currentline =~ /^\s*(\S[^\:]+)\:\s+(.*)\s*$/)
3596 my $Label = $1;
3597 my $Value = $2;
3598 # Recalculate expire date from relative time
3599 if($Label =~ /^Expires$/ig && $Value =~ /^\+/)
3601 # Get SessionTicket file stats
3602 my ($dev,$ino,$mode,$nlink,$uid,$gid,$rdev,$size,$atime,$mtime,$ctime,$blksize,$blocks)
3603 = stat("$ticketfile");
3604 if($Value =~ /^\+(\d+)\s*d(ays)?\s*$/)
3606 $ExpireTime = 24*3600*$1;
3608 elsif($Value =~ /^\+(\d+)\s*m(inutes)?\s*$/)
3610 $ExpireTime = 60*$1;
3612 elsif($Value =~ /^\+(\d+)\s*h(ours)?\s*$/)
3614 $ExpireTime = 3600*$1;
3616 elsif($Value =~ /^\+(\d+)\s*s(econds)?\s*$/)
3618 $ExpireTime = $1;
3620 elsif($Value =~ /^\+(\d+)\s*$/)
3622 $ExpireTime = $1;
3625 my $ActualExpireTime = $ExpireTime + $ctime;
3626 $Value = $ActualExpireTime;
3628 $ticket->{$Label} = () unless exists($ticket->{$Label});
3629 push(@{$ticket->{$Label}}, $Value);
3633 if(exists($ticket->{Expires}))
3635 @{$ticket->{Expires}} = sort(@{$ticket->{Expires}});
3637 return $ticket;
3640 # End of Handle login access
3643 ############################################################################
3645 # Handle foreign interpreters (i.e., scripting languages)
3647 # Insert perl code to execute scripts in foreign scripting languages.
3648 # Actually, the scripts inside the <SCRIPT></SCRIPT> blocks are piped
3649 # into an interpreter.
3650 # The code presented here is fairly confusing because it
3651 # actually writes perl code code to the output.
3653 # A table with the file handles
3654 %SCRIPTINGINPUT = ();
3656 # A function to clean up Client delivered CGI parameter values
3657 # (i.e., quote all odd characters)
3658 %SHRUBcharacterTR =
3660 "\'" => '&#39;',
3661 "\`" => '&#96;',
3662 "\"" => '&quot;',
3663 '&' => '&amper;',
3664 "\\" => '&#92;'
3667 sub shrubCGIparameter # ($String) -> Cleaned string
3669 my $String = shift || "";
3671 # Change all quotes [`'"] into HTML character entities
3672 my ($Char, $Transcript) = ('&', $SHRUBcharacterTR{'&'});
3674 # Protect &
3675 $String =~ s/\Q$Char\E/$Transcript/isg if $Transcript;
3677 while( ($Char, $Transcript) = each %SHRUBcharacterTR)
3679 next if $Char eq '&';
3680 $String =~ s/\Q$Char\E/$Transcript/isg;
3683 # Replace newlines
3684 $String =~ s/[\n]/\\n/g;
3685 # Replace control characters with their backslashed octal ordinal numbers
3686 $String =~ s/([^\S \t])/(sprintf("\\0%o", ord($1)))/eisg; #
3687 $String =~ s/([\x00-\x08\x0A-\x1F])/(sprintf("\\0%o", ord($1)))/eisg; #
3689 return $String;
3693 # The initial open statements: Open a pipe to the foreign script interpreter
3694 sub OpenForeignScript # ($ContentType) -> $DirectivePrefix
3696 my $ContentType = lc(shift) || return "";
3697 my $NewDirective = "";
3699 return $NewDirective if($SCRIPTINGINPUT{$ContentType});
3701 # Construct a unique file handle name
3702 $SCRIPTINGFILEHANDLE = uc($ContentType);
3703 $SCRIPTINGFILEHANDLE =~ s/\W/\_/isg;
3704 $SCRIPTINGINPUT{$ContentType} = $SCRIPTINGFILEHANDLE
3705 unless $SCRIPTINGINPUT{$ContentType};
3707 # Create the relevant script: Open the pipe to the interpreter
3708 $NewDirective .= <<"BLOCKCGISCRIPTOROPEN";
3709 # Open interpreter for '$ContentType'
3710 # Open pipe to interpreter (if it isn't open already)
3711 open($SCRIPTINGINPUT{$ContentType}, "|$ScriptingLanguages{$ContentType}") || main::dieHandler(14, "$ContentType: \$!\\n");
3712 BLOCKCGISCRIPTOROPEN
3714 # Insert Initialization code and CGI variables
3715 $NewDirective .= InitializeForeignScript($ContentType);
3717 # Ready
3718 return $NewDirective;
3722 # The final closing code to stop the interpreter
3723 sub CloseForeignScript # ($ContentType) -> $DirectivePrefix
3725 my $ContentType = lc(shift) || return "";
3726 my $NewDirective = "";
3728 # Do nothing unless the pipe realy IS open
3729 return "" unless $SCRIPTINGINPUT{$ContentType};
3731 # Initial comment
3732 $NewDirective .= "\# Close interpreter for '$ContentType'\n";
3735 # Write the Postfix code
3736 $NewDirective .= CleanupForeignScript($ContentType);
3738 # Create the relevant script: Close the pipe to the interpreter
3739 $NewDirective .= <<"BLOCKCGISCRIPTORCLOSE";
3740 close($SCRIPTINGINPUT{$ContentType}) || main::dieHandler(15, \"$ContentType: \$!\\n\");
3741 select(STDOUT); \$|=1;
3743 BLOCKCGISCRIPTORCLOSE
3745 # Remove the file handler of the foreign script
3746 delete($SCRIPTINGINPUT{$ContentType});
3748 return $NewDirective;
3752 # The initialization code for the foreign script interpreter
3753 sub InitializeForeignScript # ($ContentType) -> $DirectivePrefix
3755 my $ContentType = lc(shift) || return "";
3756 my $NewDirective = "";
3758 # Add initialization code
3759 if($ScriptingInitialization{$ContentType})
3761 $NewDirective .= <<"BLOCKCGISCRIPTORINIT";
3762 # Initialization Code for '$ContentType'
3763 # Select relevant output filehandle
3764 select($SCRIPTINGINPUT{$ContentType}); \$|=1;
3766 # The Initialization code (if any)
3767 print $SCRIPTINGINPUT{$ContentType} <<'${ContentType}INITIALIZATIONCODE';
3768 $ScriptingInitialization{$ContentType}
3769 ${ContentType}INITIALIZATIONCODE
3771 BLOCKCGISCRIPTORINIT
3774 # Add all CGI variables defined
3775 if(exists($ScriptingCGIvariables{$ContentType}))
3777 # Start writing variable definitions to the Interpreter
3778 if($ScriptingCGIvariables{$ContentType})
3780 $NewDirective .= <<"BLOCKCGISCRIPTORVARDEF";
3781 # CGI variables (from the %default_values table)
3782 print $SCRIPTINGINPUT{$ContentType} << '${ContentType}CGIVARIABLES';
3783 BLOCKCGISCRIPTORVARDEF
3786 my ($N, $V);
3787 foreach $N (keys(%default_values))
3789 # Determine whether the parameter has been defined
3790 # (the eval is a workaround to get at the variable value)
3791 next unless eval("defined(\$CGIexecute::$N)");
3793 # Get the value from the EXECUTION environment
3794 $V = eval("\$CGIexecute::$N");
3795 # protect control characters (i.e., convert them to \0.. form)
3796 $V = shrubCGIparameter($V);
3798 # Protect interpolated variables
3799 eval("\$CGIexecute::$N = '$V';") unless $ScriptingCGIvariables{$ContentType};
3801 # Print the actual declaration for this scripting language
3802 if($ScriptingCGIvariables{$ContentType})
3804 $NewDirective .= sprintf($ScriptingCGIvariables{$ContentType}, $N, $V);
3805 $NewDirective .= "\n";
3809 # Stop writing variable definitions to the Interpreter
3810 if($ScriptingCGIvariables{$ContentType})
3812 $NewDirective .= <<"BLOCKCGISCRIPTORVARDEFEND";
3813 ${ContentType}CGIVARIABLES
3814 BLOCKCGISCRIPTORVARDEFEND
3819 $NewDirective .= << "BLOCKCGISCRIPTOREND";
3821 # Select STDOUT filehandle
3822 select(STDOUT); \$|=1;
3824 BLOCKCGISCRIPTOREND
3826 return $NewDirective;
3830 # The cleanup code for the foreign script interpreter
3831 sub CleanupForeignScript # ($ContentType) -> $DirectivePrefix
3833 my $ContentType = lc(shift) || return "";
3834 my $NewDirective = "";
3836 # Return if not needed
3837 return $NewDirective unless $ScriptingCleanup{$ContentType};
3839 # Create the relevant script: Open the pipe to the interpreter
3840 $NewDirective .= <<"BLOCKCGISCRIPTORSTOP";
3841 # Cleanup Code for '$ContentType'
3842 # Select relevant output filehandle
3843 select($SCRIPTINGINPUT{$ContentType}); \$|=1;
3844 # Print Cleanup code to foreign script
3845 print $SCRIPTINGINPUT{$ContentType} <<'${ContentType}SCRIPTSTOP';
3846 $ScriptingCleanup{$ContentType}
3847 ${ContentType}SCRIPTSTOP
3849 # Select STDOUT filehandle
3850 select(STDOUT); \$|=1;
3851 BLOCKCGISCRIPTORSTOP
3853 return $NewDirective;
3857 # The prefix code for each <script></script> block
3858 sub PrefixForeignScript # ($ContentType) -> $DirectivePrefix
3860 my $ContentType = lc(shift) || return "";
3861 my $NewDirective = "";
3863 # Return if not needed
3864 return $NewDirective unless $ScriptingPrefix{$ContentType};
3866 my $Quote = "\'";
3867 # If the CGIvariables parameter is defined, but empty, interpolate
3868 # code string (i.e., $var .= << "END" i.s.o. $var .= << 'END')
3869 $Quote = '"' if exists($ScriptingCGIvariables{$ContentType}) &&
3870 !$ScriptingCGIvariables{$ContentType};
3872 # Add initialization code
3873 $NewDirective .= <<"BLOCKCGISCRIPTORPREFIX";
3874 # Prefix Code for '$ContentType'
3875 # Select relevant output filehandle
3876 select($SCRIPTINGINPUT{$ContentType}); \$|=1;
3878 # The block Prefix code (if any)
3879 print $SCRIPTINGINPUT{$ContentType} <<$Quote${ContentType}PREFIXCODE$Quote;
3880 $ScriptingPrefix{$ContentType}
3881 ${ContentType}PREFIXCODE
3882 # Select STDOUT filehandle
3883 select(STDOUT); \$|=1;
3884 BLOCKCGISCRIPTORPREFIX
3886 return $NewDirective;
3890 # The postfix code for each <script></script> block
3891 sub PostfixForeignScript # ($ContentType) -> $DirectivePrefix
3893 my $ContentType = lc(shift) || return "";
3894 my $NewDirective = "";
3896 # Return if not needed
3897 return $NewDirective unless $ScriptingPostfix{$ContentType};
3899 my $Quote = "\'";
3900 # If the CGIvariables parameter is defined, but empty, interpolate
3901 # code string (i.e., $var .= << "END" i.s.o. $var .= << 'END')
3902 $Quote = '"' if exists($ScriptingCGIvariables{$ContentType}) &&
3903 !$ScriptingCGIvariables{$ContentType};
3905 # Create the relevant script: Open the pipe to the interpreter
3906 $NewDirective .= <<"BLOCKCGISCRIPTORPOSTFIX";
3907 # Postfix Code for '$ContentType'
3908 # Select filehandle to interpreter
3909 select($SCRIPTINGINPUT{$ContentType}); \$|=1;
3910 # Print postfix code to foreign script
3911 print $SCRIPTINGINPUT{$ContentType} <<$Quote${ContentType}SCRIPTPOSTFIX$Quote;
3912 $ScriptingPostfix{$ContentType}
3913 ${ContentType}SCRIPTPOSTFIX
3914 # Select STDOUT filehandle
3915 select(STDOUT); \$|=1;
3916 BLOCKCGISCRIPTORPOSTFIX
3918 return $NewDirective;
3921 sub InsertForeignScript # ($ContentType, $directive, @SRCfile) -> $NewDirective
3923 my $ContentType = lc(shift) || return "";
3924 my $directive = shift || return "";
3925 my @SRCfile = @_;
3926 my $NewDirective = "";
3928 my $Quote = "\'";
3929 # If the CGIvariables parameter is defined, but empty, interpolate
3930 # code string (i.e., $var .= << "END" i.s.o. $var .= << 'END')
3931 $Quote = '"' if exists($ScriptingCGIvariables{$ContentType}) &&
3932 !$ScriptingCGIvariables{$ContentType};
3934 # Create the relevant script
3935 $NewDirective .= <<"BLOCKCGISCRIPTORINSERT";
3936 # Insert Code for '$ContentType'
3937 # Select filehandle to interpreter
3938 select($SCRIPTINGINPUT{$ContentType}); \$|=1;
3939 BLOCKCGISCRIPTORINSERT
3941 # Use SRC feature files
3942 my $ThisSRCfile;
3943 while($ThisSRCfile = shift(@_))
3945 # Handle blocks
3946 if($ThisSRCfile =~ /^\s*\{\s*/)
3948 my $Block = $';
3949 $Block = $` if $Block =~ /\s*\}\s*$/;
3950 $NewDirective .= <<"BLOCKCGISCRIPTORSRCBLOCK";
3951 print $SCRIPTINGINPUT{$ContentType} <<$Quote${ContentType}SRCBLOCKCODE$Quote;
3952 $Block
3953 ${ContentType}SRCBLOCKCODE
3954 BLOCKCGISCRIPTORSRCBLOCK
3956 next;
3959 # Handle files
3960 $NewDirective .= <<"BLOCKCGISCRIPTORSRCFILES";
3961 # Read $ThisSRCfile
3962 open(SCRIPTINGSOURCE, "<$ThisSRCfile") || main::dieHandler(16, "$ThisSRCfILE: \$!");
3963 while(<SCRIPTINGSOURCE>)
3965 print $SCRIPTINGINPUT{$ContentType} \$_;
3967 close(SCRIPTINGSOURCE);
3969 BLOCKCGISCRIPTORSRCFILES
3973 # Add the directive
3974 if($directive)
3976 $NewDirective .= <<"BLOCKCGISCRIPTORINSERT";
3977 print $SCRIPTINGINPUT{$ContentType} <<$Quote${ContentType}DIRECTIVECODE$Quote;
3978 $directive
3979 ${ContentType}DIRECTIVECODE
3980 BLOCKCGISCRIPTORINSERT
3984 $NewDirective .= <<"BLOCKCGISCRIPTORSELECT";
3985 # Select STDOUT filehandle
3986 select(STDOUT); \$|=1;
3987 BLOCKCGISCRIPTORSELECT
3989 # Ready
3990 return $NewDirective;
3993 sub CloseAllForeignScripts # Call CloseForeignScript on all open scripts
3995 my $ContentType;
3996 foreach $ContentType (keys(%SCRIPTINGINPUT))
3998 my $directive = CloseForeignScript($ContentType);
3999 print STDERR "\nDirective $CGI_Date: ", $directive;
4000 CGIexecute->evaluate($directive);
4005 # End of handling foreign (external) scripting languages.
4007 ############################################################################
4009 # A subroutine to handle "nested" quotes, it cuts off the leading
4010 # item or quoted substring
4011 # E.g.,
4012 # ' A_word and more words' -> @('A_word', ' and more words')
4013 # '"quoted string" The rest' -> @('quoted string', ' The rest')
4014 # (this is needed for parsing the <TAGS> and their attributes)
4015 my $SupportedQuotes = "\'\"\`\(\{\[";
4016 my %QuotePairs = ('('=>')','['=>']','{'=>'}'); # Brackets
4017 sub ExtractQuotedItem # ($String) -> @($QuotedString, $RestOfString)
4019 my @Result = ();
4020 my $String = shift || return @Result;
4022 if($String =~ /^\s*([\w\/\-\.]+)/is)
4024 push(@Result, $1, $');
4026 elsif($String =~ /^\s*(\\?)([\Q$SupportedQuotes\E])/is)
4028 my $BackSlash = $1 || "";
4029 my $OpenQuote = $2;
4030 my $CloseQuote = $OpenQuote;
4031 $CloseQuote = $QuotePairs{$OpenQuote} if $QuotePairs{$OpenQuote};
4033 if($BackSlash)
4035 $String =~ /^\s*\\\Q$OpenQuote\E/i;
4036 my $Onset = $';
4037 $Onset =~ /\\\Q$CloseQuote\E/i;
4038 my $Rest = $';
4039 my $Item = $`;
4040 push(@Result, $Item, $Rest);
4043 else
4045 $String =~ /^\s*\Q$OpenQuote\E([^\Q$CloseQuote\E]*)\Q$CloseQuote\E/i;
4046 push(@Result, $1, $');
4049 else
4051 push(@Result, "", $String);
4053 return @Result;
4056 # Now, start with the real work
4058 # Control the output of the Content-type: text/html\n\n message
4059 my $SupressContentType = 0;
4061 # Process a file
4062 sub ProcessFile # ($file_path)
4064 my $file_path = shift || return 0;
4067 # Generate a unique file handle (for recursions)
4068 my @SRClist = ();
4069 my $FileHandle = "file";
4070 my $n = 0;
4071 while(!eof($FileHandle.$n)) {++$n;};
4072 $FileHandle .= $n;
4074 # Start HTML output
4075 # Use the default Content-type if this is NOT a raw file
4076 unless(($RawFilePattern && $ENV{'PATH_INFO'} =~ m@($RawFilePattern)$@i)
4077 || $SupressContentType)
4079 $ENV{'PATH_INFO'} =~ m@($FilePattern)$@i;
4080 my $ContentType = $ContentTypeTable{$1};
4081 print "Content-type: $ContentType\n";
4082 if(%SETCOOKIELIST && keys(%SETCOOKIELIST))
4084 foreach my $name (keys(%SETCOOKIELIST))
4086 my $value = $SETCOOKIELIST{$name};
4087 print "Set-Cookie: $name=$value\n";
4089 # Cookies are set only ONCE
4090 %SETCOOKIELIST = ();
4092 print "\n";
4093 $SupressContentType = 1; # Content type has been printed
4097 # Get access to the actual data. This can be from RAM (by way of an
4098 # environment variable) or by opening a file.
4100 # Handle the use of RAM images (file-data is stored in the
4101 # $CGI_FILE_CONTENTS environment variable)
4102 # Note that this environment variable will be cleared, i.e., it is strictly for
4103 # single-use only!
4104 if($ENV{$CGI_FILE_CONTENTS})
4106 # File has been read already
4107 $_ = $ENV{$CGI_FILE_CONTENTS};
4108 # Sorry, you have to do the reading yourself (dynamic document creation?)
4109 # NOTE: you must read the whole document at once
4110 if($_ eq '-')
4112 $_ = eval("\@_=('$file_path'); do{$ENV{$CGI_DATA_ACCESS_CODE}}");
4114 else # Clear environment variable
4116 $ENV{$CGI_FILE_CONTENTS} = '-';
4119 # Open Only PLAIN TEXT files (or STDIN) and NO executable files (i.e., scripts).
4120 # THIS IS A SECURITY FEATURE!
4121 elsif($file_path eq '-' || (-e "$file_path" && -r _ && -T _ && -f _ && ! (-x _ || -X _) ))
4123 open($FileHandle, $file_path) || dieHandler(17, "<h2>File not found</h2>\n");
4124 push(@OpenFiles, $file_path);
4125 $_ = <$FileHandle>; # Read first line
4127 else
4129 print "<h2>File not found</h2>\n";
4130 dieHandler(18, "$file_path\n");
4133 $| = 1; # Flush output buffers
4135 # Initialize variables
4136 my $METAarguments = ""; # The CGI arguments from the latest META tag
4137 my @METAvalues = (); # The ''-quoted CGI values from the latest META tag
4138 my $ClosedTag = 0; # <TAG> </TAG> versus <TAG/>
4141 # Send document to output
4142 # Process the requested document.
4143 # Do a loop BEFORE reading input again (this catches the RAM/Database
4144 # type of documents).
4145 do {
4148 # Handle translations if needed
4150 performTranslation(\$_) if $TranslationPaths;
4152 # Catch <SCRIPT LANGUAGE="PERL" TYPE="text/ssperl" > directives in $_
4153 # There can be more than 1 <SCRIPT> or META tags on a line
4154 while(/\<\s*(SCRIPT|META|DIV|INS)\s/is)
4156 my $directive = "";
4157 # Store rest of line
4158 my $Before = $`;
4159 my $ScriptTag = $&;
4160 my $After = $';
4161 my $TagType = uc($1);
4162 # The before part can be send to the output
4163 print $Before;
4165 # Read complete Tag from after and/or file
4166 until($After =~ /([^\\])\>/)
4168 $After .= <$FileHandle>;
4169 performTranslation(\$After) if $TranslationPaths;
4172 if($After =~ /([^\\])\>/)
4174 $ScriptTag .= $`.$&; # Keep the Script Tag intact
4175 $After = $';
4177 else
4179 dieHandler(19, "Closing > not found\n");
4182 # The tag could be closed by />, we handle this in the XML way
4183 # and don't process any content (we ignore whitespace)
4184 $ClosedTag = ($ScriptTag =~ m@[^\\]/\s*\>\s*$@) ? 1 : 0;
4187 # TYPE or CLASS?
4188 my $TypeName = ($TagType =~ /META/is) ? "CONTENT" : "TYPE";
4189 $TypeName = "CLASS" if $TagType eq 'DIV' || $TagType eq 'INS';
4191 # Parse <SCRIPT> or <META> directive
4192 # If NOT (TYPE|CONTENT)="text/ssperl" (i.e., $ServerScriptContentType),
4193 # send the line to the output and go to the next loop
4194 my $CurrentContentType = "";
4195 if($ScriptTag =~ /(^|\s)$TypeName\s*=\s*/is)
4197 my ($Type) = ExtractQuotedItem($');
4198 $Type =~ /^\s*([\w\/\-]+)\s*[\,\;]?/;
4199 $CurrentContentType = lc($1); # Note: mime-types are "case-less"
4200 # CSS classes are aliases of $ServerScriptContentType
4201 if($TypeName eq "CLASS" && $CurrentContentType eq $ServerScriptContentClass)
4203 $CurrentContentType = $ServerScriptContentType;
4208 # Not a known server-side content type, print and continue
4209 unless(($CurrentContentType =~
4210 /$ServerScriptContentType|$ShellScriptContentType/is) ||
4211 $ScriptingLanguages{$CurrentContentType})
4213 print $ScriptTag;
4214 $_ = $After;
4215 next;
4219 # A known server-side content type, evaluate
4221 # First, handle \> and \<
4222 $ScriptTag =~ s/\\\>/\>/isg;
4223 $ScriptTag =~ s/\\\</\</isg;
4225 # Extract the CGI, SRC, ID, IF and UNLESS attributes
4226 my %ScriptTagAttributes = ();
4227 while($ScriptTag =~ /(^|\s)(CGI|IF|UNLESS|SRC|ID)\s*=\s*/is)
4229 my $Attribute = $2;
4230 my $Rest = $';
4231 my $Value = "";
4232 ($Value, $ScriptTag) = ExtractQuotedItem($Rest);
4233 $ScriptTagAttributes{uc($Attribute)} = $Value;
4237 # The attribute used to define the CGI variables
4238 # Extract CGI-variables from
4239 # <META CONTENT="text/ssperl; CGI='' SRC=''">
4240 # <SCRIPT TYPE='text/ssperl' CGI='' SRC=''>
4241 # <DIV CLASS='ssperl' CGI='' SRC='' ID=""> tags
4242 # <INS CLASS='ssperl' CGI='' SRC='' ID=""> tags
4243 if($ScriptTagAttributes{'CGI'})
4245 @ARGV = (); # Reset ARGV
4246 $ARGC = 0;
4247 $METAarguments = ""; # Reset the META CGI arguments
4248 @METAvalues = ();
4249 my $Meta_CGI = $ScriptTagAttributes{'CGI'};
4251 # Process default values of variables ($<name> = 'default value')
4252 # Allowed quotes are '', "", ``, (), [], and {}
4253 while($Meta_CGI =~ /(^\s*|[^\\])([\$\@\%]?)([\w\-]+)\s*/is)
4255 my $varType = $2 || '$'; # Variable or list
4256 my $name = $3; # The Name
4257 my $default = "";
4258 $Meta_CGI = $';
4260 if($Meta_CGI =~ /^\s*\=\s*/is)
4262 # Locate (any) default value
4263 ($default, $Meta_CGI) = ExtractQuotedItem($'); # Cut the parameter from the CGI
4265 $RemainingTag = $Meta_CGI;
4268 # Define CGI (or ENV) variable, initalize it from the
4269 # Query string or the default value
4271 # Also construct the @ARGV and @_ arrays. This allows other (SRC=) Perl
4272 # scripts to access the CGI arguments defined in the META tag
4273 # (Not for CGI inside <SCRIPT> tags)
4274 if($varType eq '$')
4276 CGIexecute::defineCGIvariable($name, $default)
4277 || dieHandler(20, "INVALID CGI name/value pair ($name, $default)\n");
4278 push(@METAvalues, "'".${"CGIexecute::$name"}."'");
4279 # Add value to the @ARGV list
4280 push(@ARGV, ${"CGIexecute::$name"});
4281 ++$ARGC;
4283 elsif($varType eq '@')
4285 CGIexecute::defineCGIvariableList($name, $default)
4286 || dieHandler(21, "INVALID CGI name/value list pair ($name, $default)\n");
4287 push(@METAvalues, "'".join("'", @{"CGIexecute::$name"})."'");
4288 # Add value to the @ARGV list
4289 push(@ARGV, @{"CGIexecute::$name"});
4290 $ARGC = scalar(@CGIexecute::ARGV);
4292 elsif($varType eq '%')
4294 CGIexecute::defineCGIvariableHash($name, $default)
4295 || dieHandler(22, "INVALID CGI name/value hash pair ($name, $default)\n");
4296 my @PairList = map {"$_ => ".${"CGIexecute::$name"}{$_}} keys(%{"CGIexecute::$name"});
4297 push(@METAvalues, "'".join("'", @PairList)."'");
4298 # Add value to the @ARGV list
4299 push(@ARGV, %{"CGIexecute::$name"});
4300 $ARGC = scalar(@CGIexecute::ARGV);
4303 # Store the values for internal and later use
4304 $METAarguments .= "$varType".$name.","; # A string of CGI variable names
4306 push(@METAvalues, "\'".eval("\"$varType\{CGIexecute::$name\}\"")."\'"); # ALWAYS add '-quotes around values
4311 # The IF (conditional execution) Attribute
4312 # Evaluate the condition and stop unless it evaluates to true
4313 if($ScriptTagAttributes{'IF'})
4315 my $IFcondition = $ScriptTagAttributes{'IF'};
4317 # Convert SCRIPT calls, ./<script>
4318 $IFcondition =~ s@([\W]|^)\./([\S])@$1$SCRIPT_SUB$2@g;
4320 # Convert FILE calls, ~/<file>
4321 $IFcondition =~ s@([\W])\~/([\S])@$1$HOME_SUB$2@g;
4323 # Block execution if necessary
4324 unless(CGIexecute->evaluate($IFcondition))
4326 %ScriptTagAttributes = ();
4327 $CurrentContentType = "";
4331 # The UNLESS (conditional execution) Attribute
4332 # Evaluate the condition and stop if it evaluates to true
4333 if($ScriptTagAttributes{'UNLESS'})
4335 my $UNLESScondition = $ScriptTagAttributes{'UNLESS'};
4337 # Convert SCRIPT calls, ./<script>
4338 $UNLESScondition =~ s@([\W]|^)\./([\S])@$1$SCRIPT_SUB$2@g;
4340 # Convert FILE calls, ~/<file>
4341 $UNLESScondition =~ s@([\W])\~/([\S])@$1$HOME_SUB$2@g;
4343 # Block execution if necessary
4344 if(CGIexecute->evaluate($UNLESScondition))
4346 %ScriptTagAttributes = ();
4347 $CurrentContentType = "";
4351 # The SRC (Source File) Attribute
4352 # Extract any source script files and add them in
4353 # front of the directive
4354 # The SRC list should be emptied
4355 @SRClist = ();
4356 my $SRCtag = "";
4357 my $Prefix = 1;
4358 my $PrefixDirective = "";
4359 my $PostfixDirective = "";
4360 # There is a SRC attribute
4361 if($ScriptTagAttributes{'SRC'})
4363 $SRCtag = $ScriptTagAttributes{'SRC'};
4364 # Remove "file://" prefixes
4365 $SRCtag =~ s@([^\w\/\\]|^)file\://([^\s\/\@\=])@$1$2@gis;
4366 # Expand script filenames "./Script"
4367 $SRCtag =~ s@([^\w\/\\]|^)\./([^\s\/\@\=])@$1$SCRIPT_SUB/$2@gis;
4368 # Expand script filenames "~/Script"
4369 $SRCtag =~ s@([^\w\/\\]|^)\~/([^\s\/\@\=])@$1$HOME_SUB/$2@gis;
4372 # File source tags
4373 while($SRCtag =~ /\S/is)
4375 my $SRCdirective = "";
4377 # Pseudo file, just a switch to go from PREFIXING to POSTFIXING
4378 # SRC files
4379 if($SRCtag =~ /^[\s\;\,]*(POSTFIX|PREFIX)([^$FileAllowedChars]|$)/is)
4381 my $InsertionPlace = $1;
4382 $SRCtag = $2.$';
4384 $Prefix = $InsertionPlace =~ /POSTFIX/i ? 0 : 1;
4385 # Go to next round
4386 next;
4388 # {}-blocks are just evaluated by "do"
4389 elsif($SRCtag =~ /^[\s\;\,]*\{/is)
4391 my $SRCblock = $';
4392 if($SRCblock =~ /\}[\s\;\,]*([^\}]*)$/is)
4394 $SRCblock = $`;
4395 $SRCtag = $1.$';
4396 # SAFEqx shell script blocks
4397 if($CurrentContentType =~ /$ShellScriptContentType/is)
4399 # Handle ''-quotes inside the script
4400 $SRCblock =~ s/[\']/\\$&/gis;
4402 $SRCblock = "print do { SAFEqx(\'".$SRCblock."\'); };'';";
4403 $SRCdirective .= $SRCblock."\n";
4405 # do { SRCblocks }
4406 elsif($CurrentContentType =~ /$ServerScriptContentType/is)
4408 $SRCblock = "print do { $SRCblock };'';";
4409 $SRCdirective .= $SRCblock."\n";
4411 else # The interpreter should handle this
4413 push(@SRClist, "{ $SRCblock }");
4417 else
4418 { dieHandler(23, "Closing \} missing\n");};
4420 # Files are processed as Text or Executable files
4421 elsif($SRCtag =~ /[\s\;\,]*([$FileAllowedChars]+)[\;\,\s]*/is)
4423 my $SrcFile = $1;
4424 $SRCtag = $';
4426 # We are handling one of the external interpreters
4427 if($ScriptingLanguages{$CurrentContentType})
4429 push(@SRClist, $SrcFile);
4431 # We are at the start of a DIV tag, just load all SRC files and/or URL's
4432 elsif($TagType eq 'DIV' || $TagType eq 'INS') # All files are prepended in DIV's
4434 # $SrcFile is a URL pointing to an HTTP or FTP server
4435 if($SrcFile =~ m!^([a-z]+)\://!)
4437 my $URLoutput = CGIscriptor::read_url($SrcFile);
4438 $SRCdirective .= $URLoutput;
4440 # SRC file is an existing file
4441 elsif(-e "$SrcFile")
4443 open(DIVSOURCE, "<$SrcFile") || dieHandler(24, "<$SrcFile: $!\n");
4444 my $Content;
4445 while(sysread(DIVSOURCE, $Content, 1024) > 0)
4447 $SRCdirective .= $Content;
4449 close(DIVSOURCE);
4452 # Executable files are executed as
4453 # `$SrcFile 'ARGV[0]' 'ARGV[1]'`
4454 elsif(-x "$SrcFile")
4456 $SRCdirective .= "print \`$SrcFile @METAvalues\`;'';\n";
4458 # Handle 'standard' files, using ProcessFile
4459 elsif((-T "$SrcFile" || $ENV{$CGI_FILE_CONTENTS})
4460 && $SrcFile =~ m@($FilePattern)$@) # A recursion
4463 # Do not process still open files because it can lead
4464 # to endless recursions
4465 if(grep(/^$SrcFile$/, @OpenFiles))
4466 { dieHandler(25, "$SrcFile allready opened (endless recursion)\n")};
4467 # Prepare meta arguments
4468 $SRCdirective .= '@ARGV = (' .$METAarguments.");\n" if $METAarguments;
4469 # Process the file
4470 $SRCdirective .= "main::ProcessFile(\'$SrcFile\');'';\n";
4472 elsif($SrcFile =~ m!^([a-z]+)\://!) # URL's are loaded and printed
4474 $SRCdirective .= GET_URL($SrcFile);
4476 elsif(-T "$SrcFile") # Textfiles are "do"-ed (Perl execution)
4478 $SRCdirective .= '@ARGV = (' .$METAarguments.");\n" if $METAarguments;
4479 $SRCdirective .= "do \'$SrcFile\';'';\n";
4481 else # This one could not be resolved (should be handled by BinaryMapFile)
4483 $SRCdirective .= 'print "'.$SrcFile.' cannot be used"'."\n";
4488 # Postfix or Prefix
4489 if($Prefix)
4491 $PrefixDirective .= $SRCdirective;
4493 else
4495 $PostfixDirective .= $SRCdirective;
4498 # The prefix should be handled immediately
4499 $directive .= $PrefixDirective;
4500 $PrefixDirective = "";
4504 # Handle the content of the <SCRIPT></SCRIPT> tags
4505 # Do not process the content of <SCRIPT/>
4506 if($TagType =~ /SCRIPT/is && !$ClosedTag) # The <SCRIPT> TAG
4508 my $EndScriptTag = "";
4510 # Execute SHELL scripts with SAFEqx()
4511 if($CurrentContentType =~ /$ShellScriptContentType/is)
4513 $directive .= "SAFEqx(\'";
4516 # Extract Program
4517 while($After !~ /\<\s*\/SCRIPT[^\>]*\>/is && !eof($FileHandle))
4519 $After .= <$FileHandle>;
4520 performTranslation(\$After) if $TranslationPaths;
4523 if($After =~ /\<\s*\/SCRIPT[^\>]*\>/is)
4525 $directive .= $`;
4526 $EndScriptTag = $&;
4527 $After = $';
4529 else
4531 dieHandler(26, "Missing </SCRIPT> end tag in $ENV{'PATH_INFO'}\n");
4534 # Process only when content should be executed
4535 if($CurrentContentType)
4538 # Remove all comments from Perl scripts
4539 # (NOT from OS shell scripts)
4540 $directive =~ s/[^\\\$]\#[^\n\f\r]*([\n\f\r])/$1/g
4541 if $CurrentContentType =~ /$ServerScriptContentType/i;
4543 # Convert SCRIPT calls, ./<script>
4544 $directive =~ s@([\W]|^)\./([\S])@$1$SCRIPT_SUB$2@g;
4546 # Convert FILE calls, ~/<file>
4547 $directive =~ s@([\W])\~/([\S])@$1$HOME_SUB$2@g;
4549 # Execute SHELL scripts with SAFEqx(), closing bracket
4550 if($CurrentContentType =~ /$ShellScriptContentType/i)
4552 # Handle ''-quotes inside the script
4553 $directive =~ /SAFEqx\(\'/;
4554 $directive = $`.$&;
4555 my $Executable = $';
4556 $Executable =~ s/[\']/\\$&/gs;
4558 $directive .= $Executable."\');"; # Closing bracket
4561 else
4563 $directive = "";
4566 # Handle the content of the <DIV></DIV> tags
4567 # Do not process the content of <DIV/>
4568 elsif(($TagType eq 'DIV' || $TagType eq 'INS') && !$ClosedTag) # The <DIV> TAGs
4570 my $EndScriptTag = "";
4572 # Extract Text
4573 while($After !~ /\<\s*\/$TagType[^\>]*\>/is && !eof($FileHandle))
4575 $After .= <$FileHandle>;
4576 performTranslation(\$After) if $TranslationPaths;
4579 if($After =~ /\<\s*\/$TagType[^\>]*\>/is)
4581 $directive .= $`;
4582 $EndScriptTag = $&;
4583 $After = $';
4585 else
4587 dieHandler(27, "Missing </$TagType> end tag in $ENV{'PATH_INFO'}\n");
4590 # Add the Postfixed directives (but only when it contains something printable)
4591 $directive .= "\n".$PostfixDirective if $PostfixDirective =~ /\S/;
4592 $PostfixDirective = "";
4595 # Process only when content should be handled
4596 if($CurrentContentType)
4599 # Get the name (ID), and clean it (i.e., remove anything that is NOT part of
4600 # a valid Perl name). Names should not contain $, but we can handle it.
4601 my $name = $ScriptTagAttributes{'ID'};
4602 $name =~ /^\s*[\$\@\%]?([\w\-]+)/;
4603 $name = $1;
4605 # Assign DIV contents to $NAME value OUTSIDE the CGI values!
4606 CGIexecute::defineCGIexecuteVariable($name, $directive);
4607 $directive = "";
4610 # Nothing to execute
4611 $directive = "";
4615 # Handle Foreign scripting languages
4616 if($ScriptingLanguages{$CurrentContentType})
4618 my $newDirective = "";
4619 $newDirective .= OpenForeignScript($CurrentContentType); # Only if not already done
4620 $newDirective .= PrefixForeignScript($CurrentContentType);
4621 $newDirective .= InsertForeignScript($CurrentContentType, $directive, @SRClist);
4622 $newDirective .= PostfixForeignScript($CurrentContentType);
4623 $newDirective .= CloseForeignScript($CurrentContentType); # This shouldn't be necessary
4625 $newDirective .= '"";';
4627 $directive = $newDirective;
4631 # Add the Postfixed directives (but only when it contains something printable)
4632 $directive .= "\n".$PostfixDirective if $PostfixDirective =~ /\S/;
4633 $PostfixDirective = "";
4636 # EXECUTE the script and print the results
4638 # Use this to debug the program
4639 # print STDERR "Directive $CGI_Date: \n", $directive, "\n\n";
4641 my $Result = CGIexecute->evaluate($directive) if $directive; # Evaluate as PERL code
4642 $Result =~ s/\n$//g; # Remove final newline
4644 # Print the Result of evaluating the directive
4645 # (this will handle LARGE, >64 kB output)
4646 my $BytesWritten = 1;
4647 while($Result && $BytesWritten)
4649 $BytesWritten = syswrite(STDOUT, $Result, 64);
4650 $Result = substr($Result, $BytesWritten);
4652 # print $Result; # Could be used instead of above code
4654 # Store result if wanted, i.e., if $CGIscriptorResults has been
4655 # defined in a <META> tag.
4656 push(@CGIexecute::CGIscriptorResults, $Result)
4657 if exists($default_values{'CGIscriptorResults'});
4659 # Process the rest of the input line (this could contain
4660 # another directive)
4661 $_ = $After;
4663 print $_;
4664 } while(<$FileHandle>); # Read and Test AFTER first loop!
4666 close ($FileHandle);
4667 dieHandler(28, "Error in recursion\n") unless pop(@OpenFiles) == $file_path;
4671 ###############################################################################
4673 # Call the whole package
4675 sub Handle_Request
4677 my $file_path = "";
4679 # Initialization Code
4680 Initialize_Request();
4682 # SECURITY: ACCESS CONTROL
4683 Access_Control();
4685 # Read the POST part of the query, if there is one
4686 Get_POST_part_of_query();
4688 # Start (HTML) output and logging
4689 $file_path = Initialize_output();
4691 # Check login access or divert to login procedure
4692 $Use_Login = Log_In_Access();
4693 $file_path = $Use_Login if $Use_Login;
4695 # Record which files are still open (to avoid endless recursions)
4696 my @OpenFiles = ();
4698 # Record whether the default HTML ContentType has already been printed
4699 # but only if the SERVER uses HTTP or some other protocol that might interpret
4700 # a content MIME type.
4702 $SupressContentType = !("$ENV{'SERVER_PROTOCOL'}" =~ /($ContentTypeServerProtocols)/i);
4704 # Process the specified file
4705 ProcessFile($file_path) if $file_path ne $SS_PUB;
4707 # Cleanup all open external (foreign) interpreters
4708 CloseAllForeignScripts();
4711 "" # SUCCESS
4714 # Make a single call to handle an (empty) request
4715 Handle_Request();
4718 # END OF PACKAGE MAIN
4721 ####################################################################################
4723 # The CGIEXECUTE PACKAGE
4725 ####################################################################################
4727 # Isolate the evaluation of directives as PERL code from the rest of the program.
4728 # Remember that each package has its own name space.
4729 # Note that only the FIRST argument of execute->evaluate is actually evaluated,
4730 # all other arguments are accessible inside the first argument as $_[0] to $_[$#_].
4732 package CGIexecute;
4734 sub evaluate
4736 my $self = shift;
4737 my $directive = shift;
4738 $directive = eval($directive);
4739 warn $@ if $@; # Write an error message to STDERR
4740 $directive; # Return value of directive
4744 # defineCGIexecuteVariable($name [, $value]) -> 0/1
4746 # Define and intialize variables inside CGIexecute
4747 # Does no sanity checking, for internal use only
4749 sub defineCGIexecuteVariable # ($name [, $value]) -> 0/1
4751 my $name = shift || return 0; # The Name
4752 my $value = shift || ""; # The value
4754 ${$name} = $value;
4756 return 1;
4759 # Protect certain CGI variables values when set internally
4760 my %CGIprotectedVariable = ();
4761 sub ProtectCGIvariable # ($name) -> 0/1
4763 my $name = shift || "";
4764 return 0 unless $name && $name =~ /\w/;
4766 ++$CGIprotectedVariable{$name};
4768 return $CGIprotectedVariable{$name};
4771 # defineCGIvariable($name [, $default]) -> 0/1
4773 # Define and intialize CGI variables
4774 # Tries (in order) $ENV{$name}, the Query string and the
4775 # default value.
4776 # Removes all '-quotes etc.
4778 sub defineCGIvariable # ($name [, $default]) -> 0/1
4780 my $name = shift || return 0; # The Name
4781 my $default = shift || ""; # The default value
4783 # Protect variables set internally
4784 return 1 if !$name || exists($CGIprotectedVariable{$name});
4786 # Remove \-quoted characters
4787 $default =~ s/\\(.)/$1/g;
4788 # Store default values
4789 $::default_values{$name} = $default if $default;
4791 # Process variables
4792 my $temp = undef;
4793 # If there is a user supplied value, it replaces the
4794 # default value.
4796 # Environment values have precedence
4797 if(exists($ENV{$name}))
4799 $temp = $ENV{$name};
4801 # Get name and its value from the query string
4802 elsif($ENV{QUERY_STRING} =~ /$name/) # $name is in the query string
4804 $temp = ::YOUR_CGIPARSE($name);
4806 # Defined values must exist for security
4807 elsif(!exists($::default_values{$name}))
4809 $::default_values{$name} = undef;
4812 # SECURITY, do not allow '- and `-quotes in
4813 # client values.
4814 # Remove all existing '-quotes
4815 $temp =~ s/([\r\f]+\n)/\n/g; # Only \n is allowed
4816 $temp =~ s/[\']/&#8217;/igs; # Remove all single quotes
4817 $temp =~ s/[\`]/&#8216;/igs; # Remove all backtick quotes
4818 # If $temp is empty, use the default value (if it exists)
4819 unless($temp =~ /\S/ || length($temp) > 0) # I.e., $temp is empty
4821 $temp = $::default_values{$name};
4822 # Remove all existing '-quotes
4823 $temp =~ s/([\r\f]+\n)/\n/g; # Only \n is allowed
4824 $temp =~ s/[\']/&#8217;/igs; # Remove all single quotes
4825 $temp =~ s/[\`]/&#8216;/igs; # Remove all backtick quotes
4827 else # Store current CGI values and remove defaults
4829 $::default_values{$name} = $temp;
4831 # Define the CGI variable and its value (in the execute package)
4832 ${$name} = $temp;
4834 # return SUCCES
4835 return 1;
4838 sub defineCGIvariableList # ($name [, $default]) -> 0/1)
4840 my $name = shift || return 0; # The Name
4841 my $default = shift || ""; # The default value
4843 # Protect variables set internally
4844 return 1 if !$name || exists($CGIprotectedVariable{$name});
4846 # Defined values must exist for security
4847 if(!exists($::default_values{$name}))
4849 $::default_values{$name} = $default;
4852 my @temp = ();
4855 # For security:
4856 # Environment values have precedence
4857 if(exists($ENV{$name}))
4859 push(@temp, $ENV{$name});
4861 # Get name and its values from the query string
4862 elsif($ENV{QUERY_STRING} =~ /$name/) # $name is in the query string
4864 push(@temp, ::YOUR_CGIPARSE($name, 1)); # Extract LIST
4866 else
4868 push(@temp, $::default_values{$name});
4872 # SECURITY, do not allow '- and `-quotes in
4873 # client values.
4874 # Remove all existing '-quotes
4875 @temp = map {s/([\r\f]+\n)/\n/g; $_} @temp; # Only \n is allowed
4876 @temp = map {s/[\']/&#8217;/igs; $_} @temp; # Remove all single quotes
4877 @temp = map {s/[\`]/&#8216;/igs; $_} @temp; # Remove all backtick quotes
4879 # Store current CGI values and remove defaults
4880 $::default_values{$name} = $temp[0];
4882 # Define the CGI variable and its value (in the execute package)
4883 @{$name} = @temp;
4885 # return SUCCES
4886 return 1;
4889 sub defineCGIvariableHash # ($name [, $default]) -> 0/1) Note: '$name{""} = $default';
4891 my $name = shift || return 0; # The Name
4892 my $default = shift || ""; # The default value
4894 # Protect variables set internally
4895 return 1 if !$name || exists($CGIprotectedVariable{$name});
4897 # Defined values must exist for security
4898 if(!exists($::default_values{$name}))
4900 $::default_values{$name} = $default;
4903 my %temp = ();
4906 # For security:
4907 # Environment values have precedence
4908 if(exists($ENV{$name}))
4910 $temp{""} = $ENV{$name};
4912 # Get name and its values from the query string
4913 elsif($ENV{QUERY_STRING} =~ /$name/) # $name is in the query string
4915 %temp = ::YOUR_CGIPARSE($name, -1); # Extract HASH table
4917 elsif($::default_values{$name} ne "")
4919 $temp{""} = $::default_values{$name};
4923 # SECURITY, do not allow '- and `-quotes in
4924 # client values.
4925 # Remove all existing '-quotes
4926 my $Key;
4927 foreach $Key (keys(%temp))
4929 $temp{$Key} =~ s/([\r\f]+\n)/\n/g; # Only \n is allowed
4930 $temp{$Key} =~ s/[\']/&#8217;/igs; # Remove all single quotes
4931 $temp{$Key} =~ s/[\`]/&#8216;/igs; # Remove all backtick quotes
4934 # Store current CGI values and remove defaults
4935 $::default_values{$name} = $temp{""};
4937 # Define the CGI variable and its value (in the execute package)
4938 %{$name} = ();
4939 my $tempKey;
4940 foreach $tempKey (keys(%temp))
4942 ${$name}{$tempKey} = $temp{$tempKey};
4945 # return SUCCES
4946 return 1;
4950 # SAFEqx('CommandString')
4952 # A special function that is a safe alternative to backtick quotes (and qx//)
4953 # with client-supplied CGI values. All CGI variables are surrounded by
4954 # single ''-quotes (except between existing \'\'-quotes, don't try to be
4955 # too smart). All variables are then interpolated. Simple (@) lists are
4956 # expanded with join(' ', @List), and simple (%) hash tables expanded
4957 # as a list of "key=value" pairs. Complex variables, e.g., @$var, are
4958 # evaluated in a scalar context (e.g., as scalar(@$var)). All occurrences of
4959 # $@% that should NOT be interpolated must be preceeded by a "\".
4960 # If the first line of the String starts with "#! interpreter", the
4961 # remainder of the string is piped into interpreter (after interpolation), i.e.,
4962 # open(INTERPRETER, "|interpreter");print INTERPRETER remainder;
4963 # just like in UNIX. There are some problems with quotes. Be carefull in
4964 # using them. You do not have access to the output of any piped (#!)
4965 # process! If you want such access, execute
4966 # <SCRIPT TYPE="text/osshell">echo "script"|interpreter</SCRIPT> or
4967 # <SCRIPT TYPE="text/ssperl">$resultvar = SAFEqx('echo "script"|interpreter');
4968 # </SCRIPT>.
4970 # SAFEqx ONLY WORKS WHEN THE STRING ITSELF IS SURROUNDED BY SINGLE QUOTES
4971 # (SO THAT IT IS NOT INTERPOLATED BEFORE IT CAN BE PROTECTED)
4972 sub SAFEqx # ('String') -> result of executing qx/"String"/
4974 my $CommandString = shift;
4975 my $NewCommandString = "";
4977 # Only interpolate when required (check the On/Off switch)
4978 unless($CGIscriptor::NoShellScriptInterpolation)
4981 # Handle existing single quotes around CGI values
4982 while($CommandString =~ /\'[^\']+\'/s)
4984 my $CurrentQuotedString = $&;
4985 $NewCommandString .= $`;
4986 $CommandString = $'; # The remaining string
4987 # Interpolate CGI variables between quotes
4988 # (e.g., '$CGIscriptorResults[-1]')
4989 $CurrentQuotedString =~
4990 s/(^|[^\\])([\$\@])((\w*)([\{\[][\$\@\%]?[\:\w\-]+[\}\]])*)/if(exists($main::default_values{$4})){
4991 "$1".eval("$2$3")}else{"$&"}/egs;
4993 # Combine result with previous result
4994 $NewCommandString .= $CurrentQuotedString;
4996 $CommandString = $NewCommandString.$CommandString;
4998 # Select known CGI variables and surround them with single quotes,
4999 # then interpolate all variables
5000 $CommandString =~
5001 s/(^|[^\\])([\$\@\%]+)((\w*)([\{\[][\w\:\$\"\-]+[\}\]])*)/
5002 if($2 eq '$' && exists($main::default_values{$4}))
5003 {"$1\'".eval("\$$3")."\'";}
5004 elsif($2 eq '@'){$1.join(' ', @{"$3"});}
5005 elsif($2 eq '%'){my $t=$1;map {$t.=" $_=".${"$3"}{$_}}
5006 keys(%{"$3"});$t}
5007 else{$1.eval("${2}$3");
5008 }/egs;
5010 # Remove backslashed [$@%]
5011 $CommandString =~ s/\\([\$\@\%])/$1/gs;
5014 # Debugging
5015 # return $CommandString;
5017 # Handle UNIX style "#! shell command\n" constructs as
5018 # a pipe into the shell command. The output cannot be tapped.
5019 my $ReturnValue = "";
5020 if($CommandString =~ /^\s*\#\!([^\f\n\r]+)[\f\n\r]/is)
5022 my $ShellScripts = $';
5023 my $ShellCommand = $1;
5024 open(INTERPRETER, "|$ShellCommand") || dieHandler(29, "\'$ShellCommand\' PIPE not opened: &!\n");
5025 select(INTERPRETER);$| = 1;
5026 print INTERPRETER $ShellScripts;
5027 close(INTERPRETER);
5028 select(STDOUT);$| = 1;
5030 # Shell scripts which are redirected to an existing named pipe.
5031 # The output cannot be tapped.
5032 elsif($CGIscriptor::ShellScriptPIPE)
5034 CGIscriptor::printSAFEqxPIPE($CommandString);
5036 else # Plain ``-backtick execution
5038 # Execute the commands
5039 $ReturnValue = qx/$CommandString/;
5041 return $ReturnValue;
5044 ####################################################################################
5046 # The CGIscriptor PACKAGE
5048 ####################################################################################
5050 # Isolate the evaluation of CGIscriptor functions, i.e., those prefixed with
5051 # "CGIscriptor::"
5053 package CGIscriptor;
5056 # The Interpolation On/Off switch
5057 my $NoShellScriptInterpolation = undef;
5058 # The ShellScript redirection pipe
5059 my $ShellScriptPIPE = undef;
5061 # Open a named PIPE for SAFEqx to receive ALL shell scripts
5062 sub RedirectShellScript # ('CommandString')
5064 my $CommandString = shift || undef;
5066 if($CommandString)
5068 $ShellScriptPIPE = "ShellScriptNamedPipe";
5069 open($ShellScriptPIPE, "|$CommandString")
5070 || main::dieHandler(30, "\'|$CommandString\' PIPE open failed: $!\n");
5072 else
5074 close($ShellScriptPIPE);
5075 $ShellScriptPIPE = undef;
5077 return $ShellScriptPIPE;
5080 # Print to redirected shell script pipe
5081 sub printSAFEqxPIPE # ("String") -> print return value
5083 my $String = shift || undef;
5085 select($ShellScriptPIPE); $| = 1;
5086 my $returnvalue = print $ShellScriptPIPE ($String);
5087 select(STDOUT); $| = 1;
5089 return $returnvalue;
5092 # a pointer to CGIexecute::SAFEqx
5093 sub SAFEqx # ('String') -> result of qx/"String"/
5095 my $CommandString = shift;
5096 return CGIexecute::SAFEqx($CommandString);
5100 # a pointer to CGIexecute::defineCGIvariable
5101 sub defineCGIvariable # ($name[, $default]) ->0/1
5103 my $name = shift;
5104 my $default = shift;
5105 return CGIexecute::defineCGIvariable($name, $default);
5109 # a pointer to CGIexecute::defineCGIvariable
5110 sub defineCGIvariableList # ($name[, $default]) ->0/1
5112 my $name = shift;
5113 my $default = shift;
5114 return CGIexecute::defineCGIvariableList($name, $default);
5118 # a pointer to CGIexecute::defineCGIvariable
5119 sub defineCGIvariableHash # ($name[, $default]) ->0/1
5121 my $name = shift;
5122 my $default = shift;
5123 return CGIexecute::defineCGIvariableHash($name, $default);
5127 # Decode URL encoded arguments
5128 sub URLdecode # (URL encoded input) -> string
5130 my $output = "";
5131 my $char;
5132 my $Value;
5133 foreach $Value (@_)
5135 my $EncodedValue = $Value; # Do not change the loop variable
5136 # Convert all "+" to " "
5137 $EncodedValue =~ s/\+/ /g;
5138 # Convert all hexadecimal codes (%FF) to their byte values
5139 while($EncodedValue =~ /\%([0-9A-F]{2})/i)
5141 $output .= $`.chr(hex($1));
5142 $EncodedValue = $';
5144 $output .= $EncodedValue; # The remaining part of $Value
5146 $output;
5149 # Encode arguments as URL codes.
5150 sub URLencode # (input) -> URL encoded string
5152 my $output = "";
5153 my $char;
5154 my $Value;
5155 foreach $Value (@_)
5157 my @CharList = split('', $Value);
5158 foreach $char (@CharList)
5160 if($char =~ /\s/)
5161 { $output .= "+";}
5162 elsif($char =~ /\w\-/)
5163 { $output .= $char;}
5164 else
5166 $output .= uc(sprintf("%%%2.2x", ord($char)));
5170 $output;
5173 # Extract the value of a CGI variable from the URL-encoded $string
5174 # Also extracts the data blocks from a multipart request. Does NOT
5175 # decode the multipart blocks
5176 sub CGIparseValue # (ValueName [, URL_encoded_QueryString [, \$QueryReturnReference]]) -> Decoded value
5178 my $ValueName = shift;
5179 my $QueryString = shift || $main::ENV{'QUERY_STRING'};
5180 my $ReturnReference = shift || undef;
5181 my $output = "";
5183 if($QueryString =~ /(^|\&)$ValueName\=([^\&]*)(\&|$)/)
5185 $output = URLdecode($2);
5186 $$ReturnReference = $' if ref($ReturnReference);
5188 # Get multipart POST or PUT methods
5189 elsif($main::ENV{'CONTENT_TYPE'} =~ m@(multipart/([\w\-]+)\;\s+boundary\=([\S]+))@i)
5191 my $MultipartType = $2;
5192 my $BoundaryString = $3;
5193 # Remove the boundary-string
5194 my $temp = $QueryString;
5195 $temp =~ /^\Q--$BoundaryString\E/m;
5196 $temp = $';
5198 # Identify the newline character(s), this is the first character in $temp
5199 my $NewLine = "\r\n"; # Actually, this IS the correct one
5200 unless($temp =~ /^(\-\-|\r\n)/) # However, you never realy can be sure
5202 # Is this correct??? I have to check.
5203 $NewLine = "\r\n" if $temp =~ /^(\r\n)/; # Double (CRLF, the correct one)
5204 $NewLine = "\n\r" if $temp =~ /^(\n\r)/; # Double
5205 $NewLine = "\n" if $temp =~ /^([\n])/; # Single Line Feed
5206 $NewLine = "\r" if $temp =~ /^([\r])/; # Single Return
5209 # search through all data blocks
5210 while($temp =~ /^\Q--$BoundaryString\E/m)
5212 my $DataBlock = $`;
5213 $temp = $';
5214 # Get the empty line after the header
5215 $DataBlock =~ /$NewLine$NewLine/;
5216 $Header = $`;
5217 $output = $';
5218 my $Header = $`;
5219 $output = $';
5221 # Remove newlines from the header
5222 $Header =~ s/$NewLine/ /g;
5224 # Look whether this block is the one you are looking for
5225 # Require the quotes!
5226 if($Header =~ /name\s*=\s*[\"\']$ValueName[\"\']/m)
5228 my $i;
5229 for($i=length($NewLine); $i; --$i)
5231 chop($output);
5233 # OK, get out
5234 last;
5236 # reinitialize the output
5237 $output = "";
5239 $$ReturnReference = $temp if ref($ReturnReference);
5241 elsif($QueryString !~ /(^|\&)$ValueName\=/) # The value simply isn't there
5243 return undef;
5244 $$ReturnReference = undef if ref($ReturnReference);
5246 else
5248 print "ERROR: $ValueName $main::ENV{'CONTENT_TYPE'}\n";
5250 return $output;
5254 # Get a list of values for the same ValueName. Uses CGIparseValue
5256 sub CGIparseValueList # (ValueName [, URL_encoded_QueryString]) -> List of decoded values
5258 my $ValueName = shift;
5259 my $QueryString = shift || $main::ENV{'QUERY_STRING'};
5260 my @output = ();
5261 my $RestQueryString;
5262 my $Value;
5263 while($QueryString &&
5264 (($Value = CGIparseValue($ValueName, $QueryString, \$RestQueryString))
5265 || defined($Value)))
5267 push(@output, $Value);
5268 $QueryString = $RestQueryString; # QueryString is consumed!
5270 # ready, return list with values
5271 return @output;
5274 sub CGIparseValueHash # (ValueName [, URL_encoded_QueryString]) -> Hash table of decoded values
5276 my $ValueName = shift;
5277 my $QueryString = shift || $main::ENV{'QUERY_STRING'};
5278 my $RestQueryString;
5279 my %output = ();
5280 while($QueryString && $QueryString =~ /(^|\&)$ValueName([\w]*)\=/)
5282 my $Key = $2;
5283 my $Value = CGIparseValue("$ValueName$Key", $QueryString, \$RestQueryString);
5284 $output{$Key} = $Value;
5285 $QueryString = $RestQueryString; # QueryString is consumed!
5287 # ready, return list with values
5288 return %output;
5291 sub CGIparseForm # ([URL_encoded_QueryString]) -> Decoded Form (NO multipart)
5293 my $QueryString = shift || $main::ENV{'QUERY_STRING'};
5294 my $output = "";
5296 $QueryString =~ s/\&/\n/g;
5297 $output = URLdecode($QueryString);
5299 $output;
5302 # Extract the header of a multipart CGI variable from the POST input
5303 sub CGIparseHeader # (ValueName [, URL_encoded_QueryString]) -> Decoded value
5305 my $ValueName = shift;
5306 my $QueryString = shift || $main::ENV{'QUERY_STRING'};
5307 my $output = "";
5309 if($main::ENV{'CONTENT_TYPE'} =~ m@(multipart/([\w\-]+)\;\s+boundary\=([\S]+))@i)
5311 my $MultipartType = $2;
5312 my $BoundaryString = $3;
5313 # Remove the boundary-string
5314 my $temp = $QueryString;
5315 $temp =~ /^\Q--$BoundaryString\E/m;
5316 $temp = $';
5318 # Identify the newline character(s), this is the first character in $temp
5319 my $NewLine = "\r\n"; # Actually, this IS the correct one
5320 unless($temp =~ /^(\-\-|\r\n)/) # However, you never realy can be sure
5322 $NewLine = "\n" if $temp =~ /^([\n])/; # Single Line Feed
5323 $NewLine = "\r" if $temp =~ /^([\r])/; # Single Return
5324 $NewLine = "\r\n" if $temp =~ /^(\r\n)/; # Double (CRLF, the correct one)
5325 $NewLine = "\n\r" if $temp =~ /^(\n\r)/; # Double
5328 # search through all data blocks
5329 while($temp =~ /^\Q--$BoundaryString\E/m)
5331 my $DataBlock = $`;
5332 $temp = $';
5333 # Get the empty line after the header
5334 $DataBlock =~ /$NewLine$NewLine/;
5335 $Header = $`;
5336 my $Header = $`;
5338 # Remove newlines from the header
5339 $Header =~ s/$NewLine/ /g;
5341 # Look whether this block is the one you are looking for
5342 # Require the quotes!
5343 if($Header =~ /name\s*=\s*[\"\']$ValueName[\"\']/m)
5345 $output = $Header;
5346 last;
5348 # reinitialize the output
5349 $output = "";
5352 return $output;
5356 # Checking variables for security (e.g., file names and email addresses)
5357 # File names are tested against the $::FileAllowedChars and $::BlockPathAccess variables
5358 sub CGIsafeFileName # FileName -> FileName or ""
5360 my $FileName = shift || "";
5361 return "" if $FileName =~ m?[^$::FileAllowedChars]?;
5362 return "" if $FileName =~ m!(^|/|\:)[\-\.]!;
5363 return "" if $FileName =~ m@\.\.\Q$::DirectorySeparator\E@; # Higher directory not allowed
5364 return "" if $FileName =~ m@\Q$::DirectorySeparator\E\.\.@; # Higher directory not allowed
5365 return "" if $::BlockPathAccess && $FileName =~ m@$::BlockPathAccess@; # Invisible (blocked) file
5367 return $FileName;
5370 sub CGIsafeEmailAddress # email -> email or ""
5372 my $Email = shift || "";
5373 return "" unless $Email =~ m/^[\w\.\-]+[\@][\w\.\-\:]+$/;
5374 return $Email;
5377 # Get a URL from the web. Needs main::GET_URL($URL) function
5378 # (i.e., curl, snarf, or wget)
5379 sub read_url # ($URL) -> page/file
5381 my $URL = shift || return "";
5383 # Get the commands to read the URL, do NOT add a print command
5384 my $URL_command = main::GET_URL($URL, 1);
5385 # execute the commands, i.e., actually read it
5386 my $URLcontent = CGIexecute->evaluate($URL_command);
5388 # Ready, return the content.
5389 return $URLcontent;
5392 ################################################>>>>>>>>>>Start Remove
5394 # BrowseAllDirs(Directory, indexfile)
5396 # usage:
5397 # <SCRIPT TYPE='text/ssperl'>
5398 # CGIscriptor::BrowseAllDirs('Sounds', 'index.html', '\.wav$')
5399 # </SCRIPT>
5401 # Allows to browse all directories. Stops at '/'. If the directory contains
5402 # an indexfile, eg, index.html, that file will be used instead. Files must match
5403 # the $Pattern, if it is given. Default is
5404 # CGIscriptor::BrowseAllDirs('/', 'index.html', '')
5406 sub BrowseAllDirs # (Directory, indexfile, $Pattern) -> Print HTML code
5408 my $Directory = shift || '/';
5409 my $indexfile = shift || 'index.html';
5410 my $Pattern = shift || '';
5411 $Directory =~ s!/$!!g;
5413 # If the index directory exists, use that one
5414 if(-s "$::CGI_HOME$Directory/$indexfile")
5416 return main::ProcessFile("$::CGI_HOME$Directory/$indexfile");
5419 # No indexfile, continue
5420 my @DirectoryList = glob("$::CGI_HOME$Directory");
5421 $CurrentDirectory = shift(@DirectoryList);
5422 $CurrentDirectory = $' if $CurrentDirectory =~ m@(/\.\./)+@;
5423 $CurrentDirectory =~ s@^$::CGI_HOME@@g;
5424 print "<h1>";
5425 print "$CurrentDirectory" if $CurrentDirectory;
5426 print "</h1>\n";
5428 opendir(BROWSE, "$::CGI_HOME$Directory") || main::dieHandler(31, "$::CGI_HOME$Directory $!");
5429 my @AllFiles = sort grep(!/^([\.]+[^\.]|\~)/, readdir(BROWSE));
5431 # Print directories
5432 my $file;
5433 print "<pre><ul TYPE='NONE'>\n";
5434 foreach $file (@AllFiles)
5436 next unless -d "$::CGI_HOME$Directory/$file";
5437 # Check whether this file should be visible
5438 next if $::BlockPathAccess &&
5439 "$Directory/$file/" =~ m@$::BlockPathAccess@;
5440 print "<dt><a href='$Directory/$file'>$file</a></dt>\n";
5442 print "</ul></pre>\n";
5444 # Print files
5445 print "<pre><ul TYPE='CIRCLE'>\n";
5446 my $TotalSize = 0;
5447 foreach $file (@AllFiles)
5449 next if $file =~ /^\./;
5450 next if -d "$::CGI_HOME$Directory/$file";
5451 next if -l "$::CGI_HOME$Directory/$file";
5452 # Check whether this file should be visible
5453 next if $::BlockPathAccess &&
5454 "$Directory/$file" =~ m@$::BlockPathAccess@;
5456 if(!$Pattern || $file =~ m@$Pattern@)
5458 my $Date = localtime($^T - (-M "$::CGI_HOME$Directory/$file")*3600*24);
5459 my $Size = -s "$::CGI_HOME$Directory/$file";
5460 $Size = sprintf("%6.0F kB", $Size/1024);
5461 my $Type = `file $::CGI_HOME$Directory/$file`;
5462 $Type =~ s@\s*$::CGI_HOME$Directory/$file\s*\:\s*@@ig;
5463 chomp($Type);
5465 print "<li>";
5466 print "<a href='$Directory/$file'>";
5467 printf("%-40s", "$file</a>");
5468 print "\t$Size\t$Date\t$Type";
5469 print "</li>\n";
5472 print "</ul></pre>";
5474 return 1;
5478 ################################################
5480 # BrowseDirs(RootDirectory [, Pattern, Start])
5482 # usage:
5483 # <SCRIPT TYPE='text/ssperl'>
5484 # CGIscriptor::BrowseDirs('Sounds', '\.aifc$', 'Speech', 'DIRECTORY')
5485 # </SCRIPT>
5487 # Allows to browse subdirectories. Start should be relative to the RootDirectory,
5488 # e.g., the full path of the directory 'Speech' is '~/Sounds/Speech'.
5489 # Only files which fit /$Pattern/ and directories are displayed.
5490 # Directories down or up the directory tree are supplied with a
5491 # GET request with the name of the CGI variable in the fourth argument (default
5492 # is 'BROWSEDIRS'). So the correct call for a subdirectory could be:
5493 # CGIscriptor::BrowseDirs('Sounds', '\.aifc$', $DIRECTORY, 'DIRECTORY')
5495 sub BrowseDirs # (RootDirectory [, Pattern, Start, CGIvariable, HTTPserver]) -> Print HTML code
5497 my $RootDirectory = shift; # || return 0;
5498 my $Pattern = shift || '\S';
5499 my $Start = shift || "";
5500 my $CGIvariable = shift || "BROWSEDIRS";
5501 my $HTTPserver = shift || '';
5503 $Start = CGIscriptor::URLdecode($Start); # Sometimes, too much has been encoded
5504 $Start =~ s@//+@/@g;
5505 $Start =~ s@[^/]+/\.\.@@ig;
5506 $Start =~ s@^\.\.@@ig;
5507 $Start =~ s@/\.$@@ig;
5508 $Start =~ s!/+$!!g;
5509 $Start .= "/" if $Start;
5511 my @Directory = glob("$::CGI_HOME/$RootDirectory/$Start");
5512 $CurrentDirectory = shift(@Directory);
5513 $CurrentDirectory = $' if $CurrentDirectory =~ m@(/\.\./)+@;
5514 $CurrentDirectory =~ s@^$::CGI_HOME@@g;
5515 print "<h1>";
5516 print "$CurrentDirectory" if $CurrentDirectory;
5517 print "</h1>\n";
5518 opendir(BROWSE, "$::CGI_HOME/$RootDirectory/$Start") || main::dieHandler(31, "$::CGI_HOME/$RootDirectory/$Start $!");
5519 my @AllFiles = sort grep(!/^([\.]+[^\.]|\~)/, readdir(BROWSE));
5521 # Print directories
5522 my $file;
5523 print "<pre><ul TYPE='NONE'>\n";
5524 foreach $file (@AllFiles)
5526 next unless -d "$::CGI_HOME/$RootDirectory/$Start$file";
5527 # Check whether this file should be visible
5528 next if $::BlockPathAccess &&
5529 "/$RootDirectory/$Start$file/" =~ m@$::BlockPathAccess@;
5531 my $NewURL = $Start ? "$Start$file" : $file;
5532 $NewURL = CGIscriptor::URLencode($NewURL);
5533 print "<dt><a href='";
5534 print "$ENV{SCRIPT_NAME}" if $ENV{SCRIPT_NAME} !~ m@[^\w+\-/]@;
5535 print "$ENV{PATH_INFO}?$CGIvariable=$NewURL'>$file</a></dt>\n";
5537 print "</ul></pre>\n";
5539 # Print files
5540 print "<pre><ul TYPE='CIRCLE'>\n";
5541 my $TotalSize = 0;
5542 foreach $file (@AllFiles)
5544 next if $file =~ /^\./;
5545 next if -d "$::CGI_HOME/$RootDirectory/$Start$file";
5546 next if -l "$::CGI_HOME/$RootDirectory/$Start$file";
5547 # Check whether this file should be visible
5548 next if $::BlockPathAccess &&
5549 "$::CGI_HOME/$RootDirectory/$Start$file" =~ m@$::BlockPathAccess@;
5551 if($file =~ m@$Pattern@)
5553 my $Date = localtime($^T - (-M "$::CGI_HOME/$RootDirectory/$Start$file")*3600*24);
5554 my $Size = -s "$::CGI_HOME/$RootDirectory/$Start$file";
5555 $Size = sprintf("%6.0F kB", $Size/1024);
5556 my $Type = `file $::CGI_HOME/$RootDirectory/$Start$file`;
5557 $Type =~ s@\s*$::CGI_HOME/$RootDirectory/$Start$file\s*\:\s*@@ig;
5558 chomp($Type);
5560 print "<li>";
5561 if($HTTPserver =~ /^\s*[\.\~]\s*$/)
5563 print "<a href='$RootDirectory/$Start$file'>";
5565 elsif($HTTPserver)
5567 print "<a href='$HTTPserver/$RootDirectory/$Start$file'>";
5569 printf("%-40s", "$file</a>") if $HTTPserver;
5570 printf("%-40s", "$file") unless $HTTPserver;
5571 print "\t$Size\t$Date\t$Type";
5572 print "</li>\n";
5575 print "</ul></pre>";
5577 return 1;
5581 # ListDocs(Pattern [,ListType])
5583 # usage:
5584 # <SCRIPT TYPE=text/ssperl>
5585 # CGIscriptor::ListDocs("/*", "dl");
5586 # </SCRIPT>
5588 # This subroutine is very usefull to manage collections of independent
5589 # documents. The resulting list will display the tree-like directory
5590 # structure. If this routine is too slow for online use, you can
5591 # store the result and use a link to that stored file.
5593 # List HTML and Text files with title and first header (HTML)
5594 # or filename and first meaningfull line (general text files).
5595 # The listing starts at the ServerRoot directory. Directories are
5596 # listed recursively.
5598 # You can change the list type (default is dl).
5599 # e.g.,
5600 # <dt><a href=<file.html>>title</a>
5601 # <dd>First Header
5602 # <dt><a href=<file.txt>>file.txt</a>
5603 # <dd>First meaningfull line of text
5605 sub ListDocs # ($Pattern [, prefix]) e.g., ("/Books/*", [, "dl"])
5607 my $Pattern = shift;
5608 $Pattern =~ /\*/;
5609 my $ListType = shift || "dl";
5610 my $Prefix = lc($ListType) eq "dl" ? "dt" : "li";
5611 my $URL_root = "http://$::ENV{'SERVER_NAME'}\:$::ENV{'SERVER_PORT'}";
5612 my @FileList = glob("$::CGI_HOME$Pattern");
5613 my ($FileName, $Path, $Link);
5615 # Print List markers
5616 print "<$ListType>\n";
5618 # Glob all files
5619 File: foreach $FileName (@FileList)
5621 # Check whether this file should be visible
5622 next if $::BlockPathAccess && $FileName =~ m@$::BlockPathAccess@;
5624 # Recursively list files in all directories
5625 if(-d $FileName)
5627 $FileName =~ m@([^/]*)$@;
5628 my $DirName = $1;
5629 print "<$Prefix>$DirName\n";
5630 $Pattern =~ m@([^/]*)$@;
5631 &ListDocs("$`$DirName/$1", $ListType);
5632 next;
5634 # Use textfiles
5635 elsif(-T "$FileName")
5637 open(TextFile, $FileName) || next;
5639 # Ignore all other file types
5640 else
5641 { next;};
5643 # Get file path for link
5644 $FileName =~ /$::CGI_HOME/;
5645 print "<$Prefix><a href=$URL_root$'>";
5646 # Initialize all variables
5647 my $Line = "";
5648 my $TitleFound = 0;
5649 my $Caption = "";
5650 my $Title = "";
5651 # Read file and step through
5652 while(<TextFile>)
5654 chop $_;
5655 $Line = $_;
5656 # HTML files
5657 if($FileName =~ /\.ht[a-zA-Z]*$/i)
5659 # Catch Title
5660 while(!$Title)
5662 if($Line =~ m@<title>([^<]*)</title>@i)
5664 $Title = $1;
5665 $Line = $';
5667 else
5669 $Line .= <TextFile> || goto Print;
5670 chop $Line;
5673 # Catch First Header
5674 while(!$Caption)
5676 if($Line =~ m@</h1>@i)
5678 $Caption = $`;
5679 $Line = $';
5680 $Caption =~ m@<h1>@i;
5681 $Caption = $';
5682 $Line = $`.$Caption.$Line;
5684 else
5686 $Line .= <TextFile> || goto Print;
5687 chop $Line;
5691 # Other text files
5692 else
5694 # Title equals file name
5695 $FileName =~ /([^\/]+)$/;
5696 $Title = $1;
5697 # Catch equals First Meaningfull line
5698 while(!$Caption)
5700 if($Line =~ /[A-Z]/ &&
5701 ($Line =~ /subject|title/i || $Line =~ /^[\w,\.\s\?\:]+$/)
5702 && $Line !~ /Newsgroup/ && $Line !~ /\:\s*$/)
5704 $Line =~ s/\<[^\>]+\>//g;
5705 $Caption = $Line;
5707 else
5709 $Line = <TextFile> || goto Print;
5713 Print: # Print title and subject
5714 print "$Title</a>\n";
5715 print "<dd>$Caption\n" if $ListType eq "dl";
5716 $TitleFound = 0;
5717 $Caption = "";
5718 close TextFile;
5719 next File;
5722 # Print Closing List Marker
5723 print "</$ListType>\n";
5724 ""; # Empty return value
5728 # HTMLdocTree(Pattern [,ListType])
5730 # usage:
5731 # <SCRIPT TYPE=text/ssperl>
5732 # CGIscriptor::HTMLdocTree("/Welcome.html", "dl");
5733 # </SCRIPT>
5735 # The following subroutine is very usefull for checking large document
5736 # trees. Starting from the root (s), it reads all files and prints out
5737 # a nested list of links to all attached files. Non-existing or misplaced
5738 # files are flagged. This is quite a file-i/o intensive routine
5739 # so you would not like it to be accessible to everyone. If you want to
5740 # use the result, save the whole resulting page to disk and use a link
5741 # to this file.
5743 # HTMLdocTree takes an HTML file or file pattern and constructs nested lists
5744 # with links to *local* files (i.e., only links to the local server are
5745 # followed). The list entries are the document titles.
5746 # If the list type is <dl>, the first <H1> header is used too.
5747 # For each file matching the pattern, a list is made recursively of all
5748 # HTML documents that are linked from it and are stored in the same directory
5749 # or a sub-directory. Warnings are given for missing files.
5750 # The listing starts for the ServerRoot directory.
5751 # You can change the default list type <dl> (<dl>, <ul>, <ol>).
5753 %LinkUsed = ();
5755 sub HTMLdocTree # ($Pattern [, listtype])
5756 # e.g., ("/Welcome.html", [, "ul"])
5758 my $Pattern = shift;
5759 my $ListType = shift || "dl";
5760 my $Prefix = lc($ListType) eq "dl" ? "dt" : "li";
5761 my $URL_root = "http://$::ENV{'SERVER_NAME'}\:$::ENV{'SERVER_PORT'}";
5762 my ($Filename, $Path, $Link);
5763 my %LocalLinks = {};
5765 # Read files (glob them for expansion of wildcards)
5766 my @FileList = glob("$::CGI_HOME$Pattern");
5767 foreach $Path (@FileList)
5769 # Get URL_path
5770 $Path =~ /$::CGI_HOME/;
5771 my $URL_path = $';
5772 # Check whether this file should be visible
5773 next if $::BlockPathAccess && $URL_path =~ m@$::BlockPathAccess@;
5775 my $Title = $URL_path;
5776 my $Caption = "";
5777 # Current file should not be used again
5778 ++$LinkUsed{$URL_path};
5779 # Open HTML doc
5780 unless(open(TextFile, $Path))
5782 print "<$Prefix>$Title <blink>(not found)</blink><br>\n";
5783 next;
5785 while(<TextFile>)
5787 chop $_;
5788 $Line = $_;
5789 # Catch Title
5790 while($Line =~ m@<title>@i)
5792 if($Line =~ m@<title>([^<]*)</title>@i)
5794 $Title = $1;
5795 $Line = $';
5797 else
5799 $Line .= <TextFile>;
5800 chop $Line;
5803 # Catch First Header
5804 while(!$Caption && $Line =~ m@<h1>@i)
5806 if($Line =~ m@</h[1-9]>@i)
5808 $Caption = $`;
5809 $Line = $';
5810 $Caption =~ m@<h1>@i;
5811 $Caption = $';
5812 $Line = $`.$Caption.$Line;
5814 else
5816 $Line .= <TextFile>;
5817 chop $Line;
5820 # Catch and print Links
5821 while($Line =~ m@<a href\=([^>]*)>@i)
5823 $Link = $1;
5824 $Line = $';
5825 # Remove quotes
5826 $Link =~ s/\"//g;
5827 # Remove extras
5828 $Link =~ s/[\#\?].*$//g;
5829 # Remove Servername
5830 if($Link =~ m@(http://|^)@i)
5832 $Link = $';
5833 # Only build tree for current server
5834 next unless $Link =~ m@$::ENV{'SERVER_NAME'}|^/@;
5835 # Remove server name and port
5836 $Link =~ s@^[^\/]*@@g;
5838 # Store the current link
5839 next if $LinkUsed{$Link} || $Link eq $URL_path;
5840 ++$LinkUsed{$Link};
5841 ++$LocalLinks{$Link};
5845 close TextFile;
5846 print "<$Prefix>";
5847 print "<a href=http://";
5848 print "$::ENV{'SERVER_NAME'}\:$::ENV{'SERVER_PORT'}$URL_path>";
5849 print "$Title</a>\n";
5850 print "<br>$Caption\n"
5851 if $Caption && $Caption ne $Title && $ListType =~ /dl/i;
5852 print "<$ListType>\n";
5853 foreach $Link (keys(%LocalLinks))
5855 &HTMLdocTree($Link, $ListType);
5857 print "</$ListType>\n";
5861 ###########################<<<<<<<<<<End Remove
5863 # Make require happy
5866 =head1 NAME
5868 CGIscriptor -
5870 =head1 DESCRIPTION
5872 A flexible HTML 4 compliant script/module for CGI-aware
5873 embeded Perl, shell-scripts, and other scripting languages,
5874 executed at the server side.
5876 =head1 README
5878 Executes embeded Perl code in HTML pages with easy
5879 access to CGI variables. Also processes embeded shell
5880 scripts and scripts in any other language with an
5881 interactive interpreter (e.g., in-line Python, Tcl,
5882 Ruby, Awk, Lisp, Xlispstat, Prolog, M4, R, REBOL, Praat,
5883 sh, bash, csh, ksh).
5885 CGIscriptor is very flexible and hides all the specifics
5886 and idiosyncrasies of correct output and CGI coding and naming.
5887 CGIscriptor complies with the W3C HTML 4.0 recommendations.
5889 This Perl program will run on any WWW server that runs
5890 Perl scripts, just add a line like the following to your
5891 srm.conf file (Apache example):
5893 ScriptAlias /SHTML/ /real-path/CGIscriptor.pl/
5895 URL's that refer to http://www.your.address/SHTML/... will
5896 now be handled by CGIscriptor.pl, which can use a private
5897 directory tree (default is the DOCUMENT_ROOT directory tree,
5898 but it can be anywhere).
5900 =head1 PREREQUISITES
5903 =head1 COREQUISITES
5906 =pod OSNAMES
5908 Linux, *BSD, *nix, MS WinXP
5910 =pod SCRIPT CATEGORIES
5912 Servers
5916 =cut