--- PyXML-0.8.4/xml/parsers/xmlproc/xmlutils.py.orig 2009-12-30 11:43:21.000000000 +0100 +++ PyXML-0.8.4/xml/parsers/xmlproc/xmlutils.py 2009-12-30 11:44:12.000000000 +0100 @@ -720,6 +720,7 @@ # to the recoding. try: self.data = self.charset_converter(self.data) + self.datasize = len(self.data) except UnicodeError, e: self._handle_decoding_error(self.data, e) self.input_encoding = enc1