--- C:\DOCUME~1\PROPRI~1\LOCALS~1\Temp\cgi.py-revBASE.svn007.tmp.py	dim. janv.  9 12:45:18 2011
+++ C:\python-dev\cgi.py	dim. janv.  9 12:45:10 2011
@@ -31,7 +31,7 @@
 # Imports
 # =======
 
-from io import StringIO
+from io import StringIO, BytesIO, TextIOBase
 import sys
 import os
 import urllib.parse
@@ -109,7 +109,7 @@
 
         Arguments, all optional:
 
-        fp              : file pointer; default: sys.stdin
+        fp              : file pointer read as bytes; default: sys.stdin.buffer
 
         environ         : environment dictionary; default: os.environ
 
@@ -126,6 +126,28 @@
     """
     if fp is None:
         fp = sys.stdin
+    if fp is sys.stdin:
+        # Windows needs stdio set for binary mode. This will be useless
+        # for Python 3.2+ : binary mode will be the default
+        try: 
+            import msvcrt
+            msvcrt.setmode (0, os.O_BINARY) # stdin  = 0
+            msvcrt.setmode (1, os.O_BINARY) # stdout = 1
+            msvcrt.setmode (2, os.O_BINARY) # stderr = 2
+        except ImportError:
+            pass # no msvcrt module: nothing to switch
+
+    # field keys and values (except for files) are returned as strings:
+    # an encoding is required to decode the bytes read from fp
+    if hasattr(fp,'encoding'):
+        encoding = fp.encoding
+    else:
+        encoding = 'latin-1' # fallback when fp has no encoding attribute
+
+    # fp.read() must return bytes: use the binary buffer of a text stream
+    if isinstance(fp,TextIOBase):
+        fp = fp.buffer
+    
     if not 'REQUEST_METHOD' in environ:
         environ['REQUEST_METHOD'] = 'GET'       # For testing stand-alone
     if environ['REQUEST_METHOD'] == 'POST':
@@ -136,7 +158,7 @@
             clength = int(environ['CONTENT_LENGTH'])
             if maxlen and clength > maxlen:
                 raise ValueError('Maximum content length exceeded')
-            qs = fp.read(clength)
+            qs = fp.read(clength).decode(encoding) # bytes decoded to str
         else:
             qs = ''                     # Unknown content-type
         if 'QUERY_STRING' in environ:
@@ -352,9 +374,10 @@
 
     value: the value as a *string*; for file uploads, this
         transparently reads the file every time you request the value
+        and returns *bytes*
 
-    file: the file(-like) object from which you can read the data;
-        None if the data is stored a simple string
+    file: the file(-like) object from which you can read the data *as
+        bytes*; None if the data is stored as a simple string
 
     type: the content-type, or None if not specified
 
@@ -375,14 +398,15 @@
     directory and unlinking them as soon as they have been opened.
 
     """
-
     def __init__(self, fp=None, headers=None, outerboundary="",
-                 environ=os.environ, keep_blank_values=0, strict_parsing=0):
+                 environ=os.environ, keep_blank_values=0, strict_parsing=0,
+                 limit=None):
         """Constructor.  Read multipart/* until last part.
 
         Arguments, all optional:
 
-        fp              : file pointer; default: sys.stdin
+        fp              : file pointer; must read *bytes*, a text stream
+            is replaced by its .buffer; default: sys.stdin.buffer
             (not used when the request method is GET)
 
         headers         : header dictionary-like object; default:
@@ -404,6 +428,10 @@
             If false (the default), errors are silently ignored.
             If true, errors raise a ValueError exception.
 
+        limit           : used internally when reading the parts of a
+            multipart/form-data form: the reading loop exits once this many
+            bytes have been read. It is the form content-length minus the
+            number of bytes already read
         """
         method = 'GET'
         self.keep_blank_values = keep_blank_values
@@ -418,7 +446,7 @@
                 qs = sys.argv[1]
             else:
                 qs = ""
-            fp = StringIO(qs)
+            fp = BytesIO(qs.encode('latin-1')) # decoded back as latin-1
             if headers is None:
                 headers = {'content-type':
                            "application/x-www-form-urlencoded"}
@@ -433,9 +461,36 @@
                 self.qs_on_post = environ['QUERY_STRING']
             if 'CONTENT_LENGTH' in environ:
                 headers['content-length'] = environ['CONTENT_LENGTH']
-        self.fp = fp or sys.stdin
+        if fp is None:
+            fp = sys.stdin
+        if fp is sys.stdin:
+            # Windows needs stdio set for binary mode. This will be useless
+            # for Python 3.2+ : binary mode will be the default
+            try: 
+                import msvcrt
+                msvcrt.setmode (0, os.O_BINARY) # stdin  = 0
+                msvcrt.setmode (1, os.O_BINARY) # stdout = 1
+                msvcrt.setmode (2, os.O_BINARY) # stderr = 2
+            except ImportError:
+                pass # no msvcrt module: nothing to switch
+        # self.fp.read() must return bytes: use the buffer of a text stream
+        if isinstance(fp,TextIOBase):
+            self.fp = fp.buffer
+        else:
+            self.fp = fp
+
+        # field keys and values (except for files) are returned as strings:
+        # the encoding used to decode them is stored on self.fp itself
+        if hasattr(fp,'encoding'):
+            self.fp.encoding = fp.encoding
+        else:
+            self.fp.encoding = 'latin-1' # fallback: fp has no encoding
+
         self.headers = headers
         self.outerboundary = outerboundary
+        
+        self.bytes_read = 0 # bytes consumed from self.fp so far
+        self.limit = limit
 
         # Process content-disposition header
         cdisp, pdict = "", {}
@@ -482,6 +537,8 @@
             if maxlen and clen > maxlen:
                 raise ValueError('Maximum content length exceeded')
         self.length = clen
+        if self.limit is None and clen: # no limit passed by the caller
+            self.limit = clen # NOTE(review): also when clen < 0 - confirm
 
         self.list = self.file = None
         self.done = 0
@@ -531,7 +588,7 @@
         """Dictionary style get() method, including 'value' lookup."""
         if key in self:
             value = self[key]
-            if type(value) is type([]):
+            if isinstance(value,list): # several items: return all values
                 return [x.value for x in value]
             else:
                 return value.value
@@ -542,7 +599,7 @@
         """ Return the first value received."""
         if key in self:
             value = self[key]
-            if type(value) is type([]):
+            if isinstance(value,list): # several items: keep the first
                 return value[0].value
             else:
                 return value.value
@@ -553,7 +610,7 @@
         """ Return list of received values."""
         if key in self:
             value = self[key]
-            if type(value) is type([]):
+            if isinstance(value,list): # several items: return all values
                 return [x.value for x in value]
             else:
                 return [value.value]
@@ -581,13 +638,13 @@
 
     def read_urlencoded(self):
         """Internal: read data in query string format."""
-        qs = self.fp.read(self.length)
+        qs = self.fp.read(self.length).decode(self.fp.encoding) # bytes -> str
         if self.qs_on_post:
             qs += '&' + self.qs_on_post
-        self.list = list = []
+        self.list = [] # one MiniFieldStorage per parsed key/value pair
         for key, value in urllib.parse.parse_qsl(qs, self.keep_blank_values,
                                 self.strict_parsing):
-            list.append(MiniFieldStorage(key, value))
+            self.list.append(MiniFieldStorage(key, value))
         self.skip_lines()
 
     FieldStorageClass = None
@@ -600,23 +657,35 @@
         self.list = []
         if self.qs_on_post:
             for key, value in urllib.parse.parse_qsl(self.qs_on_post,
-                                    self.keep_blank_values, self.strict_parsing):
+                                self.keep_blank_values, self.strict_parsing):
                 self.list.append(MiniFieldStorage(key, value))
             FieldStorageClass = None
 
         klass = self.FieldStorageClass or self.__class__
-        parser = email.parser.FeedParser()
-        # Create bogus content-type header for proper multipart parsing
-        parser.feed('Content-Type: %s; boundary=%s\r\n\r\n' % (self.type, ib))
-        parser.feed(self.fp.read())
-        full_msg = parser.close()
-        # Get subparts
-        msgs = full_msg.get_payload()
-        for msg in msgs:
-            fp = StringIO(msg.get_payload())
-            part = klass(fp, msg, ib, environ, keep_blank_values,
-                         strict_parsing)
+        first_line = self.fp.readline() # bytes
+        self.bytes_read += len(first_line)
+        # the first line holds the opening boundary; it is not checked
+        # (it could be compared with "--"+ib after decoding and stripping)
+        while True:
+            parser = email.parser.FeedParser()
+            hdr_text = b"" # raw header lines of the next part
+            while True:
+                data = self.fp.readline()
+                hdr_text += data
+                if not data.strip(): # blank line (or EOF) ends the headers
+                    break
+            if not hdr_text: # nothing left to read
+                break
+            # parser takes strings, not bytes
+            self.bytes_read += len(hdr_text)
+            parser.feed(hdr_text.decode(self.fp.encoding))
+            headers = parser.close()
+            part = klass(self.fp, headers, ib, environ, keep_blank_values,
+                         strict_parsing,self.limit-self.bytes_read) # NOTE(review): assumes limit is not None
+            self.bytes_read += part.bytes_read # count what the part consumed
             self.list.append(part)
+            if self.bytes_read >= self.length: # NOTE(review): always true if length < 0 - confirm
+                break
         self.skip_lines()
 
     def read_single(self):
@@ -636,7 +705,8 @@
         todo = self.length
         if todo >= 0:
             while todo > 0:
-                data = self.fp.read(min(todo, self.bufsize))
+                data = self.fp.read(min(todo, self.bufsize)) # bytes
+                self.bytes_read += len(data) # running count of bytes consumed
                 if not data:
                     self.done = -1
                     break
@@ -645,42 +715,57 @@
 
     def read_lines(self):
         """Internal: read lines until EOF or outerboundary."""
-        self.file = self.__file = StringIO()
+        if self.filename is not None:
+            self.file = self.__file = BytesIO() # store data as bytes for files
+        else:
+            self.file = self.__file = StringIO() # as strings for other fields
         if self.outerboundary:
             self.read_lines_to_outerboundary()
         else:
             self.read_lines_to_eof()
 
     def __write(self, line):
+        """Internal: store line (always bytes); decoded unless a file."""
         if self.__file is not None:
             if self.__file.tell() + len(line) > 1000:
                 self.file = self.make_file()
                 data = self.__file.getvalue()
                 self.file.write(data)
                 self.__file = None
-        self.file.write(line)
-
+        if self.filename is not None:
+            self.file.write(line) # keep bytes
+        else:
+            self.file.write(line.decode(self.fp.encoding)) # decode to string
+
     def read_lines_to_eof(self):
         """Internal: read lines until EOF."""
-        while 1:
-            line = self.fp.readline(1<<16)
+        while True:
+            line = self.fp.readline(1<<16) # bytes
+            self.bytes_read += len(line)
             if not line:
                 self.done = -1
                 break
             self.__write(line)
 
     def read_lines_to_outerboundary(self):
-        """Internal: read lines until outerboundary."""
-        next = "--" + self.outerboundary
-        last = next + "--"
-        delim = ""
+        """Internal: read lines until outerboundary or self.limit bytes.
+        Data is read as bytes: boundaries and line ends are bytes too.
+        A limit of None means no byte limit."""
+        next = b"--" + self.outerboundary.encode(self.fp.encoding)
+        last = next + b"--"
+        delim = b""
         last_line_lfend = True
-        while 1:
-            line = self.fp.readline(1<<16)
+        _read = 0
+        while True:
+            if self.limit is not None and _read >= self.limit:
+                break
+            line = self.fp.readline(1<<16) # bytes
+            self.bytes_read += len(line)
+            _read += len(line)
             if not line:
                 self.done = -1
                 break
-            if line[:2] == "--" and last_line_lfend:
+            if line[:2] == b"--" and last_line_lfend:
                 strippedline = line.strip()
                 if strippedline == next:
                     break
@@ -688,16 +773,16 @@
                     self.done = 1
                     break
             odelim = delim
-            if line[-2:] == "\r\n":
-                delim = "\r\n"
+            if line.endswith(b"\r\n"):
+                delim = b"\r\n" # held back: written with the next line
                 line = line[:-2]
                 last_line_lfend = True
-            elif line[-1] == "\n":
-                delim = "\n"
+            elif line.endswith(b"\n"):
+                delim = b"\n" # held back: written with the next line
                 line = line[:-1]
                 last_line_lfend = True
             else:
-                delim = ""
+                delim = b"" # no line end: partial line
                 last_line_lfend = False
             self.__write(odelim + line)
 
@@ -705,22 +790,23 @@
         """Internal: skip lines until outer boundary if defined."""
         if not self.outerboundary or self.done:
             return
-        next = "--" + self.outerboundary
-        last = next + "--"
+        next = b"--" + self.outerboundary.encode(self.fp.encoding) # bytes
+        last = next + b"--"
         last_line_lfend = True
-        while 1:
+        while True:
             line = self.fp.readline(1<<16)
+            self.bytes_read += len(line) # skipped bytes count as read
             if not line:
                 self.done = -1
                 break
-            if line[:2] == "--" and last_line_lfend:
+            if line.startswith(b"--") and last_line_lfend:
                 strippedline = line.strip()
                 if strippedline == next:
                     break
                 if strippedline == last:
                     self.done = 1
                     break
-            last_line_lfend = line.endswith('\n')
+            last_line_lfend = line.endswith(b'\n')
 
     def make_file(self):
         """Overridable: return a readable & writable file.
@@ -730,7 +816,8 @@
         - seek(0)
         - data is read from it
 
-        The file is always opened in text mode.
+        The file is opened in binary mode for file uploads, in text mode
+        for other fields.
 
         This version opens a temporary file for reading and writing,
         and immediately deletes (unlinks) it.  The trick (on Unix!) is
@@ -746,7 +833,10 @@
 
         """
         import tempfile
-        return tempfile.TemporaryFile("w+", encoding="utf-8", newline="\n")
+        if self.filename is not None:
+            return tempfile.TemporaryFile("wb+") # raw bytes of the upload
+        else: # text: fixed codec and no newline translation
+            return tempfile.TemporaryFile("w+", encoding="utf-8", newline="\n")
 
 
 # Test/debug code