This commit was manufactured by cvs2svn to create tag 'r212'.
[python/dscho.git] / Lib / cgi.py
blobe03f4437c95ad91670ad4de26ccabe483a3d2d41
1 #! /usr/local/bin/python
3 # NOTE: the above "/usr/local/bin/python" is NOT a mistake. It is
4 # intentionally NOT "/usr/bin/env python". On many systems
5 # (e.g. Solaris), /usr/local/bin is not in $PATH as passed to CGI
6 # scripts, and /usr/local/bin is the default directory where Python is
7 # installed, so /usr/bin/env would be unable to find python. Granted,
8 # binary installations by Linux vendors often install Python in
9 # /usr/bin. So let those vendors patch cgi.py to match their choice
10 # of installation.
12 """Support module for CGI (Common Gateway Interface) scripts.
14 This module defines a number of utilities for use by CGI scripts
15 written in Python.
16 """
18 # XXX Perhaps there should be a slimmed version that doesn't contain
19 # all those backwards compatible and debugging classes and functions?
21 # History
22 # -------
24 # Michael McLay started this module. Steve Majewski changed the
25 # interface to SvFormContentDict and FormContentDict. The multipart
26 # parsing was inspired by code submitted by Andreas Paepcke. Guido van
27 # Rossum rewrote, reformatted and documented the module and is currently
28 # responsible for its maintenance.
31 __version__ = "2.6"
34 # Imports
35 # =======
37 import sys
38 import os
39 import urllib
40 import mimetools
41 import rfc822
42 import UserDict
43 from StringIO import StringIO
# Public API of this module: the names bound by "from cgi import *".
# The logging helpers (initlog, dolog, nolog, log) and valid_boundary are
# deliberately not listed here.
__all__ = ["MiniFieldStorage", "FieldStorage", "FormContentDict",
           "SvFormContentDict", "InterpFormContentDict", "FormContent",
           "parse", "parse_qs", "parse_qsl", "parse_multipart",
           "parse_header", "print_exception", "print_environ",
           "print_form", "print_directory", "print_arguments",
           "print_environ_usage", "escape"]
52 # Logging support
53 # ===============
# Both globals are read by initlog() the first time log() is called;
# set them before that first call to enable logging.
logfile = ""            # Filename to log to, if not empty
logfp = None            # File object to log to, if not None
def initlog(*allargs):
    """Write a log message, if there is a log file.

    Even though this function is called initlog(), you should always
    use log(); log is a variable that is set either to initlog
    (initially), to dolog (once the log file has been opened), or to
    nolog (when logging is disabled).

    The first argument is a format string; the remaining arguments (if
    any) are arguments to the % operator, so e.g.
        log("%s: %s", "a", "b")
    will write "a: b" to the log file, followed by a newline.

    If the global logfp is not None, it should be a file object to
    which log data is written.

    If the global logfp is None, the global logfile may be a string
    giving a filename to open, in append mode.  This file should be
    world writable!!!  If the file can't be opened, logging is
    silently disabled (since there is no safe place where we could
    send an error message).

    """
    global logfp, log
    if logfile and not logfp:
        try:
            logfp = open(logfile, "a")
        except IOError:
            # Deliberate best-effort: leave logfp unset so that the
            # code below selects nolog.
            pass
    # Rebind the module-level 'log' so later calls skip this setup.
    if not logfp:
        log = nolog
    else:
        log = dolog
    # Forward this first message to whichever logger was selected.
    log(*allargs)
def dolog(fmt, *args):
    """Format a message and append it to the open log file.

    The message is fmt % args followed by a newline; it is written to
    the global logfp.  See initlog() for the full description.
    """
    message = fmt % args
    logfp.write(message + "\n")
def nolog(*allargs):
    """Discard a log message; log is bound to this when logging is off."""
    return None
# Starts out as initlog, which rebinds this name to dolog or nolog on
# its first call.
log = initlog           # The current logging function
104 # Parsing functions
105 # =================
# Maximum input we will accept when REQUEST_METHOD is POST
# 0 ==> unlimited input
# Checked against the declared content length by parse(),
# parse_multipart() and FieldStorage; exceeding it raises ValueError.
maxlen = 0
def parse(fp=None, environ=os.environ, keep_blank_values=0, strict_parsing=0):
    """Parse a query in the environment or from a file (default stdin)

    Arguments, all optional:

    fp              : file pointer; default: sys.stdin

    environ         : environment dictionary; default: os.environ

    keep_blank_values: flag indicating whether blank values in
        URL encoded forms should be treated as blank strings.
        A true value indicates that blanks should be retained as
        blank strings.  The default false value indicates that
        blank values are to be ignored and treated as if they were
        not included.

    strict_parsing: flag indicating what to do with parsing errors.
        If false (the default), errors are silently ignored.
        If true, errors raise a ValueError exception.

    Side effects: environ gains a REQUEST_METHOD of 'GET' when it has
    none, and (except when QUERY_STRING was already present on a
    non-POST request, or the body is multipart) QUERY_STRING is
    overwritten with the string that was actually parsed.
    """
    if not fp:
        fp = sys.stdin
    if not environ.has_key('REQUEST_METHOD'):
        environ['REQUEST_METHOD'] = 'GET'       # For testing stand-alone

    if environ['REQUEST_METHOD'] != 'POST':
        # GET-style request: the query comes from the environment, or
        # from the first command line argument when run by hand.
        if environ.has_key('QUERY_STRING'):
            qs = environ['QUERY_STRING']
        else:
            qs = ""
            if sys.argv[1:]:
                qs = sys.argv[1]
            environ['QUERY_STRING'] = qs        # XXX Shouldn't, really
        return parse_qs(qs, keep_blank_values, strict_parsing)

    # POST request: the body format is given by the content type.
    ctype, pdict = parse_header(environ['CONTENT_TYPE'])
    if ctype == 'multipart/form-data':
        return parse_multipart(fp, pdict)

    qs = ''                                     # Unknown content-type
    if ctype == 'application/x-www-form-urlencoded':
        clength = int(environ['CONTENT_LENGTH'])
        if maxlen and clength > maxlen:
            raise ValueError('Maximum content length exceeded')
        qs = fp.read(clength)

    # A POST may carry a query string as well; append it to the body.
    if environ.has_key('QUERY_STRING'):
        extras = [environ['QUERY_STRING']]
    elif sys.argv[1:]:
        extras = [sys.argv[1]]
    else:
        extras = []
    for extra in extras:
        if qs:
            qs = qs + '&'
        qs = qs + extra
    environ['QUERY_STRING'] = qs                # XXX Shouldn't, really
    return parse_qs(qs, keep_blank_values, strict_parsing)
def parse_qs(qs, keep_blank_values=0, strict_parsing=0):
    """Parse a query given as a string argument.

    Arguments:

    qs: URL-encoded query string to be parsed

    keep_blank_values: flag indicating whether blank values in
        URL encoded queries should be treated as blank strings.
        A true value indicates that blanks should be retained as
        blank strings.  The default false value indicates that
        blank values are to be ignored and treated as if they were
        not included.

    strict_parsing: flag indicating what to do with parsing errors.
        If false (the default), errors are silently ignored.
        If true, errors raise a ValueError exception.

    Returns a dictionary mapping each field name to the list of its
    values, in the order they appear in the query string.
    """
    fields = {}
    for name, value in parse_qsl(qs, keep_blank_values, strict_parsing):
        # First occurrence creates the list; later ones extend it.
        fields.setdefault(name, []).append(value)
    return fields
def parse_qsl(qs, keep_blank_values=0, strict_parsing=0):
    """Parse a query given as a string argument.

    Arguments:

    qs: URL-encoded query string to be parsed

    keep_blank_values: flag indicating whether blank values in
        URL encoded queries should be treated as blank strings.  A
        true value indicates that blanks should be retained as blank
        strings.  The default false value indicates that blank values
        are to be ignored and treated as if they were  not included.

    strict_parsing: flag indicating what to do with parsing errors. If
        false (the default), errors are silently ignored. If true,
        errors raise a ValueError exception.

    Returns a list of (name, value) tuples in query-string order.
    """
    fields = []
    # Fields may be separated by either '&' or ';'.
    for chunk in qs.split('&'):
        for name_value in chunk.split(';'):
            parts = name_value.split('=', 1)
            if len(parts) != 2:
                # No '=' at all: an error only in strict mode.
                if strict_parsing:
                    raise ValueError("bad query field: %s" % repr(name_value))
                continue
            raw_name, raw_value = parts
            if not (raw_value or keep_blank_values):
                continue
            # '+' encodes a space; %XX escapes are decoded afterwards.
            name = urllib.unquote(raw_name.replace('+', ' '))
            value = urllib.unquote(raw_value.replace('+', ' '))
            fields.append((name, value))
    return fields
def parse_multipart(fp, pdict):
    """Parse multipart input.

    Arguments:
    fp   : input file
    pdict: dictionary containing other parameters of content-type header

    Returns a dictionary just like parse_qs(): keys are the field names, each
    value is a list of values for that field.  This is easy to use but not
    much good if you are expecting megabytes to be uploaded -- in that case,
    use the FieldStorage class instead which is much more flexible.  Note
    that content-type is the raw, unparsed contents of the content-type
    header.

    Raises ValueError if the boundary is invalid or if a part declares a
    content-length larger than the global maxlen (when maxlen is non-zero).

    Parts that have no content-disposition header, whose disposition is
    not 'form-data', or that carry no 'name' parameter are skipped.

    XXX This does not parse nested multipart parts -- use FieldStorage for
    that.

    XXX This should really be subsumed by FieldStorage altogether -- no
    point in having two implementations of the same parsing algorithm.

    """
    boundary = ""
    if pdict.has_key('boundary'):
        boundary = pdict['boundary']
    if not valid_boundary(boundary):
        raise ValueError('Invalid boundary in multipart form: %s'
                         % repr(boundary))

    nextpart = "--" + boundary
    lastpart = "--" + boundary + "--"
    partdict = {}
    terminator = ""

    while terminator != lastpart:
        nbytes = -1
        data = None
        if terminator:
            # At start of next part.  Read headers first.
            headers = mimetools.Message(fp)
            clength = headers.getheader('content-length')
            if clength:
                try:
                    nbytes = int(clength)
                except ValueError:
                    # Unparsable length: fall back to line-based reading.
                    pass
            if nbytes > 0:
                if maxlen and nbytes > maxlen:
                    raise ValueError('Maximum content length exceeded')
                data = fp.read(nbytes)
            else:
                data = ""
        # Read lines until end of part.
        lines = []
        while 1:
            line = fp.readline()
            if not line:
                terminator = lastpart # End outer loop
                break
            if line[:2] == "--":
                terminator = line.strip()
                if terminator in (nextpart, lastpart):
                    break
            lines.append(line)
        # Done with part.
        if data is None:
            # Everything before the first boundary is preamble; ignore it.
            continue
        if nbytes < 0:
            if lines:
                # Strip final line terminator
                line = lines[-1]
                if line[-2:] == "\r\n":
                    line = line[:-2]
                elif line[-1:] == "\n":
                    line = line[:-1]
                lines[-1] = line
                data = "".join(lines)
        # getheader() is used rather than headers[...] so that a part
        # without a content-disposition header is skipped below instead
        # of raising KeyError.
        line = headers.getheader('content-disposition')
        if not line:
            continue
        key, params = parse_header(line)
        if key != 'form-data':
            continue
        if params.has_key('name'):
            name = params['name']
        else:
            continue
        if partdict.has_key(name):
            partdict[name].append(data)
        else:
            partdict[name] = [data]

    return partdict
def _split_header_params(line):
    """Split a header value on ';', ignoring ';' inside double quotes.

    Returns the list of fields with surrounding whitespace stripped; the
    list always has at least one element (the main value, possibly '').
    """
    fields = []
    rest = ';' + line
    while rest[:1] == ';':
        rest = rest[1:]
        end = rest.find(';')
        # An odd number of unescaped quotes before the ';' means the
        # semicolon sits inside a quoted string: look for the next one.
        while end > 0 and (rest.count('"', 0, end) -
                           rest.count('\\"', 0, end)) % 2:
            end = rest.find(';', end + 1)
        if end < 0:
            end = len(rest)
        fields.append(rest[:end].strip())
        rest = rest[end:]
    return fields

def parse_header(line):
    """Parse a Content-type like header.

    Return the main content-type and a dictionary of options.

    The main value and the option names are lower-cased; option values
    keep their case and have one pair of surrounding double quotes
    removed.  Fields without an '=' are ignored.  A ';' inside a quoted
    option value (e.g. filename="a;b.txt") does not end the option.

    """
    fields = _split_header_params(line)
    key = fields[0].lower()
    pdict = {}
    for field in fields[1:]:
        i = field.find('=')
        if i >= 0:
            name = field[:i].strip().lower()
            value = field[i+1:].strip()
            if len(value) >= 2 and value[0] == value[-1] == '"':
                value = value[1:-1]
            pdict[name] = value
    return key, pdict
340 # Classes for field storage
341 # =========================
class MiniFieldStorage:

    """Like FieldStorage, for use when no file uploads are possible.

    Instances carry only a name and a string value; every other
    FieldStorage attribute is present as a class-level placeholder.
    """

    # Dummy attributes (shared by all instances; treat as read-only)
    filename = list = type = file = disposition = None
    type_options = {}
    disposition_options = {}
    headers = {}

    def __init__(self, name, value):
        """Constructor from field name and value."""
        self.name, self.value = name, value
        # self.file = StringIO(value)

    def __repr__(self):
        """Return printable representation."""
        return "MiniFieldStorage(%r, %r)" % (self.name, self.value)
class FieldStorage:

    """Store a sequence of fields, reading multipart/form-data.

    This class provides naming, typing, files stored on disk, and
    more.  At the top level, it is accessible like a dictionary, whose
    keys are the field names.  (Note: None can occur as a field name.)
    The items are either a Python list (if there's multiple values) or
    another FieldStorage or MiniFieldStorage object.  If it's a single
    object, it has the following attributes:

    name: the field name, if specified; otherwise None

    filename: the filename, if specified; otherwise None; this is the
        client side filename, *not* the file name on which it is
        stored (that's a temporary file you don't deal with)

    value: the value as a *string*; for file uploads, this
        transparently reads the file every time you request the value

    file: the file(-like) object from which you can read the data;
        None if the data is stored a simple string

    type: the content-type, or None if not specified

    type_options: dictionary of options specified on the content-type
        line

    disposition: content-disposition, or None if not specified

    disposition_options: dictionary of corresponding options

    headers: a dictionary(-like) object (sometimes rfc822.Message or a
        subclass thereof) containing *all* headers

    The class is subclassable, mostly for the purpose of overriding
    the make_file() method, which is called internally to come up with
    a file open for reading and writing.  This makes it possible to
    override the default choice of storing all files in a temporary
    directory and unlinking them as soon as they have been opened.

    """

    def __init__(self, fp=None, headers=None, outerboundary="",
                 environ=os.environ, keep_blank_values=0, strict_parsing=0):
        """Constructor.  Read multipart/* until last part.

        Arguments, all optional:

        fp              : file pointer; default: sys.stdin
            (not used when the request method is GET)

        headers         : header dictionary-like object; default:
            taken from environ as per CGI spec

        outerboundary   : terminating multipart boundary
            (for internal use only)

        environ         : environment dictionary; default: os.environ

        keep_blank_values: flag indicating whether blank values in
            URL encoded forms should be treated as blank strings.
            A true value indicates that blanks should be retained as
            blank strings.  The default false value indicates that
            blank values are to be ignored and treated as if they were
            not included.

        strict_parsing: flag indicating what to do with parsing errors.
            If false (the default), errors are silently ignored.
            If true, errors raise a ValueError exception.

        Raises ValueError when the declared content length exceeds the
        global maxlen (if maxlen is non-zero).

        """
        method = 'GET'
        self.keep_blank_values = keep_blank_values
        self.strict_parsing = strict_parsing
        if environ.has_key('REQUEST_METHOD'):
            method = environ['REQUEST_METHOD'].upper()
        if method == 'GET' or method == 'HEAD':
            # The form data is the query string; wrap it in a file-like
            # object so the rest of the code can read it uniformly.
            if environ.has_key('QUERY_STRING'):
                qs = environ['QUERY_STRING']
            elif sys.argv[1:]:
                qs = sys.argv[1]
            else:
                qs = ""
            fp = StringIO(qs)
            if headers is None:
                headers = {'content-type':
                           "application/x-www-form-urlencoded"}
        if headers is None:
            headers = {}
            if method == 'POST':
                # Set default content-type for POST to what's traditional
                headers['content-type'] = "application/x-www-form-urlencoded"
            if environ.has_key('CONTENT_TYPE'):
                headers['content-type'] = environ['CONTENT_TYPE']
            if environ.has_key('CONTENT_LENGTH'):
                headers['content-length'] = environ['CONTENT_LENGTH']
        self.fp = fp or sys.stdin
        self.headers = headers
        self.outerboundary = outerboundary

        # Process content-disposition header
        cdisp, pdict = "", {}
        if self.headers.has_key('content-disposition'):
            cdisp, pdict = parse_header(self.headers['content-disposition'])
        self.disposition = cdisp
        self.disposition_options = pdict
        self.name = None
        if pdict.has_key('name'):
            self.name = pdict['name']
        self.filename = None
        if pdict.has_key('filename'):
            self.filename = pdict['filename']

        # Process content-type header
        #
        # Honor any existing content-type header.  But if there is no
        # content-type header, use some sensible defaults.  Assume
        # outerboundary is "" at the outer level, but something non-false
        # inside a multi-part.  The default for an inner part is text/plain,
        # but for an outer part it should be urlencoded.  This should catch
        # bogus clients which erroneously forget to include a content-type
        # header.
        #
        # See below for what we do if there does exist a content-type header,
        # but it happens to be something we don't understand.
        if self.headers.has_key('content-type'):
            ctype, pdict = parse_header(self.headers['content-type'])
        elif self.outerboundary or method != 'POST':
            ctype, pdict = "text/plain", {}
        else:
            ctype, pdict = 'application/x-www-form-urlencoded', {}
        self.type = ctype
        self.type_options = pdict
        self.innerboundary = ""
        if pdict.has_key('boundary'):
            self.innerboundary = pdict['boundary']
        clen = -1
        if self.headers.has_key('content-length'):
            try:
                clen = int(self.headers['content-length'])
            except (TypeError, ValueError):
                # Unparsable length: treat it as unknown (-1), but do
                # not swallow unrelated exceptions.
                pass
            if maxlen and clen > maxlen:
                raise ValueError('Maximum content length exceeded')
        self.length = clen

        self.list = self.file = None
        self.done = 0
        # Anything that is neither urlencoded nor multipart is read as
        # a single opaque part.
        if ctype == 'application/x-www-form-urlencoded':
            self.read_urlencoded()
        elif ctype[:10] == 'multipart/':
            self.read_multi(environ, keep_blank_values, strict_parsing)
        else:
            self.read_single()

    def __repr__(self):
        """Return a printable representation."""
        return "FieldStorage(%s, %s, %s)" % (
                repr(self.name), repr(self.filename), repr(self.value))

    def __getattr__(self, name):
        """Compute the 'value' attribute on demand.

        Only called for attributes not found normally.  For 'value',
        returns the file's full contents (the file is rewound before
        and after), else the list of sub-fields, else None.  Any other
        name raises AttributeError.
        """
        if name != 'value':
            raise AttributeError(name)
        if self.file:
            self.file.seek(0)
            value = self.file.read()
            self.file.seek(0)
        elif self.list is not None:
            value = self.list
        else:
            value = None
        return value

    def __getitem__(self, key):
        """Dictionary style indexing.

        Returns the single matching field, or a list of fields when
        several share the name.  Raises TypeError if this object holds
        no field list, KeyError if no field has that name.
        """
        if self.list is None:
            raise TypeError("not indexable")
        found = []
        for item in self.list:
            if item.name == key: found.append(item)
        if not found:
            raise KeyError(key)
        if len(found) == 1:
            return found[0]
        else:
            return found

    def getvalue(self, key, default=None):
        """Dictionary style get() method, including 'value' lookup."""
        if self.has_key(key):
            value = self[key]
            if type(value) is type([]):
                return [item.value for item in value]
            else:
                return value.value
        else:
            return default

    def keys(self):
        """Dictionary style keys() method."""
        if self.list is None:
            raise TypeError("not indexable")
        keys = []
        for item in self.list:
            if item.name not in keys: keys.append(item.name)
        return keys

    def has_key(self, key):
        """Dictionary style has_key() method."""
        if self.list is None:
            raise TypeError("not indexable")
        for item in self.list:
            if item.name == key: return 1
        return 0

    def __len__(self):
        """Dictionary style len(x) support."""
        return len(self.keys())

    def read_urlencoded(self):
        """Internal: read data in query string format."""
        qs = self.fp.read(self.length)
        self.list = fields = []
        for key, value in parse_qsl(qs, self.keep_blank_values,
                                    self.strict_parsing):
            fields.append(MiniFieldStorage(key, value))
        self.skip_lines()

    # Class used for the parts of a multipart message; None means
    # "same class as self".
    FieldStorageClass = None

    def read_multi(self, environ, keep_blank_values, strict_parsing):
        """Internal: read a part that is itself multipart."""
        ib = self.innerboundary
        if not valid_boundary(ib):
            raise ValueError('Invalid boundary in multipart form: %s'
                             % repr(ib))
        self.list = []
        klass = self.FieldStorageClass or self.__class__
        part = klass(self.fp, {}, ib,
                     environ, keep_blank_values, strict_parsing)
        # Throw first part away
        while not part.done:
            headers = rfc822.Message(self.fp)
            part = klass(self.fp, headers, ib,
                         environ, keep_blank_values, strict_parsing)
            self.list.append(part)
        self.skip_lines()

    def read_single(self):
        """Internal: read an atomic part."""
        if self.length >= 0:
            self.read_binary()
            self.skip_lines()
        else:
            self.read_lines()
        self.file.seek(0)

    bufsize = 8*1024            # I/O buffering size for copy to file

    def read_binary(self):
        """Internal: read binary data."""
        self.file = self.make_file('b')
        todo = self.length
        if todo >= 0:
            while todo > 0:
                data = self.fp.read(min(todo, self.bufsize))
                if not data:
                    # Input ended before the declared length was read.
                    self.done = -1
                    break
                self.file.write(data)
                todo = todo - len(data)

    def read_lines(self):
        """Internal: read lines until EOF or outerboundary."""
        # Start in memory; __write() switches to make_file() once the
        # data grows beyond its size threshold.
        self.file = self.__file = StringIO()
        if self.outerboundary:
            self.read_lines_to_outerboundary()
        else:
            self.read_lines_to_eof()

    def __write(self, line):
        """Internal: append line, spilling from memory to a real file."""
        if self.__file is not None:
            if self.__file.tell() + len(line) > 1000:
                self.file = self.make_file('')
                self.file.write(self.__file.getvalue())
                self.__file = None
        self.file.write(line)

    def read_lines_to_eof(self):
        """Internal: read lines until EOF."""
        while 1:
            line = self.fp.readline()
            if not line:
                self.done = -1
                break
            self.__write(line)

    def read_lines_to_outerboundary(self):
        """Internal: read lines until outerboundary."""
        next = "--" + self.outerboundary
        last = next + "--"
        delim = ""
        while 1:
            line = self.fp.readline()
            if not line:
                self.done = -1
                break
            if line[:2] == "--":
                strippedline = line.strip()
                if strippedline == next:
                    break
                if strippedline == last:
                    self.done = 1
                    break
            # Write each line's terminator only when the following line
            # arrives, so the terminator just before the boundary is
            # not stored as part of the data.
            odelim = delim
            if line[-2:] == "\r\n":
                delim = "\r\n"
                line = line[:-2]
            elif line[-1] == "\n":
                delim = "\n"
                line = line[:-1]
            else:
                delim = ""
            self.__write(odelim + line)

    def skip_lines(self):
        """Internal: skip lines until outer boundary if defined."""
        if not self.outerboundary or self.done:
            return
        next = "--" + self.outerboundary
        last = next + "--"
        while 1:
            line = self.fp.readline()
            if not line:
                self.done = -1
                break
            if line[:2] == "--":
                strippedline = line.strip()
                if strippedline == next:
                    break
                if strippedline == last:
                    self.done = 1
                    break

    def make_file(self, binary=None):
        """Overridable: return a readable & writable file.

        The file will be used as follows:
        - data is written to it
        - seek(0)
        - data is read from it

        The 'binary' argument is unused -- the file is always opened
        in binary mode.

        This version opens a temporary file for reading and writing,
        and immediately deletes (unlinks) it.  The trick (on Unix!) is
        that the file can still be used, but it can't be opened by
        another process, and it will automatically be deleted when it
        is closed or when the current process terminates.

        If you want a more permanent file, you derive a class which
        overrides this method.  If you want a visible temporary file
        that is nevertheless automatically deleted when the script
        terminates, try defining a __del__ method in a derived class
        which unlinks the temporary files you have created.

        """
        import tempfile
        return tempfile.TemporaryFile("w+b")
742 # Backwards Compatibility Classes
743 # ===============================
class FormContentDict(UserDict.UserDict):
    """Form content as dictionary with a list of values per field.

    form = FormContentDict()

    form[key] -> [value, value, ...]
    form.has_key(key) -> Boolean
    form.keys() -> [key, key, ...]
    form.values() -> [[val, val, ...], [val, val, ...], ...]
    form.items() ->  [(key, [val, val, ...]), (key, [val, val, ...]), ...]
    form.dict == {key: [val, val, ...], ...}

    """
    def __init__(self, environ=os.environ):
        # parse() stores the query string it used back into environ,
        # which is why QUERY_STRING can be read unconditionally below.
        fields = parse(environ=environ)
        self.data = fields
        self.dict = fields
        self.query_string = environ['QUERY_STRING']
class SvFormContentDict(FormContentDict):
    """Form content as dictionary expecting a single value per field.

    If you only expect a single value for each field, then form[key]
    will return that single value.  It will raise an IndexError if
    that expectation is not true.  If you expect a field to have
    possible multiple values, then you can use form.getlist(key) to
    get all of the values.  values() and items() are a compromise:
    they return single strings where there is a single value, and
    lists of strings otherwise.

    """
    def __getitem__(self, key):
        found = self.dict[key]
        if len(found) > 1:
            raise IndexError('expecting a single value')
        return found[0]
    def getlist(self, key):
        return self.dict[key]
    def values(self):
        result = []
        for found in self.dict.values():
            if len(found) != 1:
                result.append(found)
            else:
                result.append(found[0])
        return result
    def items(self):
        result = []
        for key, found in self.dict.items():
            if len(found) != 1:
                result.append((key, found))
            else:
                result.append((key, found[0]))
        return result
class InterpFormContentDict(SvFormContentDict):
    """This class is present for backwards compatibility only.

    Like SvFormContentDict, except that a value which looks numeric is
    returned as an int or a float, and any other value is returned
    with surrounding whitespace stripped.
    """
    def __getitem__(self, key):
        text = SvFormContentDict.__getitem__(self, key)
        if text[0] in '0123456789+-.':
            # Looks numeric: try the narrower conversion first.
            for convert in (int, float):
                try:
                    return convert(text)
                except ValueError:
                    pass
        return text.strip()
    def values(self):
        result = []
        for key in self.keys():
            try:
                entry = self[key]
            except IndexError:
                # More than one value: fall back to the raw list.
                entry = self.dict[key]
            result.append(entry)
        return result
    def items(self):
        result = []
        for key in self.keys():
            try:
                entry = (key, self[key])
            except IndexError:
                # More than one value: fall back to the raw list.
                entry = (key, self.dict[key])
            result.append(entry)
        return result
class FormContent(FormContentDict):
    """This class is present for backwards compatibility only.

    Lookup methods return None for an unknown key, except length(),
    which raises KeyError.
    """
    def values(self, key):
        if not self.dict.has_key(key):
            return None
        return self.dict[key]
    def indexed_value(self, key, location):
        if not self.dict.has_key(key):
            return None
        found = self.dict[key]
        if len(found) > location:
            return found[location]
        return None
    def value(self, key):
        if not self.dict.has_key(key):
            return None
        return self.dict[key][0]
    def length(self, key):
        return len(self.dict[key])
    def stripped(self, key):
        if not self.dict.has_key(key):
            return None
        return self.dict[key][0].strip()
    def pars(self):
        return self.dict
848 # Test/debug code
849 # ===============
def test(environ=os.environ):
    """Robust test CGI script, usable as main program.

    Write minimal HTTP headers and dump all information provided to
    the script in HTML form.

    The dump is produced twice: once as-is, followed by a deliberately
    provoked exception to exercise print_exception(), and once more
    after setting the global maxlen to 50.  Note that maxlen is left
    at 50 afterwards and sys.stderr is left pointing at sys.stdout.

    """
    global maxlen
    emit = sys.stdout.write
    emit("Content-type: text/html\n")
    emit("\n")
    # Send tracebacks to the browser rather than the server's error log.
    sys.stderr = sys.stdout
    try:
        form = FieldStorage()   # Replace with other classes to test those
        print_directory()
        print_arguments()
        print_form(form)
        print_environ(environ)
        print_environ_usage()
        def f():
            # Not valid Python on purpose: raises SyntaxError so that
            # the handler below has something to display.
            exec("testing print_exception() -- <I>italics?</I>")
        def g(f=f):
            f()
        emit("<H3>What follows is a test, not an actual exception:</H3>\n")
        g()
    except:
        # Deliberately catch everything: any failure should be shown
        # as HTML instead of aborting the script.
        print_exception()

    emit("<H1>Second try with a small maxlen...</H1>\n")

    maxlen = 50
    try:
        form = FieldStorage()   # Replace with other classes to test those
        print_directory()
        print_arguments()
        print_form(form)
        print_environ(environ)
    except:
        print_exception()
def print_exception(type=None, value=None, tb=None, limit=None):
    """Print a traceback as HTML.

    With no type given, the exception currently being handled is used.
    The stack entries go in a <PRE> block, with the final exception
    line in bold; all text is HTML-escaped.
    """
    if type is None:
        type, value, tb = sys.exc_info()
    import traceback
    emit = sys.stdout.write
    emit("\n")
    emit("<H3>Traceback (most recent call last):</H3>\n")
    report = traceback.format_tb(tb, limit)
    report = report + traceback.format_exception_only(type, value)
    stack_text = escape("".join(report[:-1]))
    final_line = escape(report[-1])
    emit("<PRE>%s<B>%s</B></PRE>\n" % (stack_text, final_line))
    # Drop the traceback reference so it does not keep frames alive.
    del tb
def print_environ(environ=os.environ):
    """Dump the shell environment as HTML."""
    emit = sys.stdout.write
    names = environ.keys()
    names.sort()
    emit("\n")
    emit("<H3>Shell Environment:</H3>\n")
    emit("<DL>\n")
    for name in names:
        emit("<DT> %s <DD> %s\n" % (escape(name), escape(environ[name])))
    emit("</DL>\n")
    emit("\n")
def print_form(form):
    """Dump the contents of a form as HTML."""
    emit = sys.stdout.write
    names = form.keys()
    names.sort()
    emit("\n")
    emit("<H3>Form Contents:</H3>\n")
    if not names:
        emit("<P>No form fields.\n")
    emit("<DL>\n")
    for name in names:
        emit("<DT>" + escape(name) + ":")
        value = form[name]
        # Show the item's type next to its name, then its repr.
        emit(" <i>" + escape(repr(type(value))) + "</i>\n")
        emit("<DD>" + escape(repr(value)) + "\n")
    emit("</DL>\n")
    emit("\n")
def print_directory():
    """Dump the current directory as HTML."""
    emit = sys.stdout.write
    emit("\n")
    emit("<H3>Current Working Directory:</H3>\n")
    try:
        pwd = os.getcwd()
    except os.error:
        # Report the failure in the page instead of raising.
        msg = sys.exc_info()[1]
        emit("os.error: %s\n" % escape(str(msg)))
    else:
        emit("%s\n" % escape(pwd))
    emit("\n")
def print_arguments():
    """Dump the command line arguments (sys.argv) under an HTML heading."""
    emit = sys.stdout.write
    emit("\n")
    emit("<H3>Command Line Arguments:</H3>\n")
    emit("\n")
    emit("%s\n" % (sys.argv,))
    emit("\n")
def print_environ_usage():
    """Dump a list of environment variables used by CGI as HTML."""
    cgi_names = [
        "AUTH_TYPE", "CONTENT_LENGTH", "CONTENT_TYPE", "DATE_GMT",
        "DATE_LOCAL", "DOCUMENT_NAME", "DOCUMENT_ROOT", "DOCUMENT_URI",
        "GATEWAY_INTERFACE", "LAST_MODIFIED", "PATH", "PATH_INFO",
        "PATH_TRANSLATED", "QUERY_STRING", "REMOTE_ADDR", "REMOTE_HOST",
        "REMOTE_IDENT", "REMOTE_USER", "REQUEST_METHOD", "SCRIPT_NAME",
        "SERVER_NAME", "SERVER_PORT", "SERVER_PROTOCOL", "SERVER_ROOT",
        "SERVER_SOFTWARE",
        ]
    http_names = [
        "HTTP_ACCEPT", "HTTP_CONNECTION", "HTTP_HOST", "HTTP_PRAGMA",
        "HTTP_REFERER", "HTTP_USER_AGENT",
        ]
    emit = sys.stdout.write
    emit("\n<H3>These environment variables could have been set:</H3>\n")
    emit("<UL>\n")
    for name in cgi_names:
        emit("<LI>" + name + "\n")
    emit("</UL>\n")
    emit("In addition, HTTP headers sent by the server may be passed in the\n")
    emit("environment as well. Here are some common variable names:\n")
    emit("<UL>\n")
    for name in http_names:
        emit("<LI>" + name + "\n")
    emit("</UL>\n")
    # Blank line that terminates the block.
    emit("\n")
997 # Utilities
998 # =========
def escape(s, quote=None):
    """Replace special characters '&', '<' and '>' by SGML entities.

    If the optional flag quote is true, the double quote character (")
    is replaced as well.
    """
    # '&' must come first, or the '&' of the entities produced by the
    # later replacements would be escaped again.
    replacements = [("&", "&amp;"), ("<", "&lt;"), (">", "&gt;")]
    if quote:
        replacements.append(('"', "&quot;"))
    for char, entity in replacements:
        s = s.replace(char, entity)
    return s
def valid_boundary(s, _vb_pattern="^[ -~]{0,200}[!-~]$"):
    """Check a multipart boundary string.

    Returns a match object (true) when s consists of printable ASCII
    characters and ends in a non-space one, and None otherwise; the
    pattern allows at most 201 characters.
    """
    import re
    matcher = re.compile(_vb_pattern)
    return matcher.match(s)
1013 # Invoke mainline
1014 # ===============
# Call test() when this file is run as a script (not imported as a module)
# test() writes an HTML dump of the request to standard output.
if __name__ == '__main__':
    test()