mirror of https://github.com/python/cpython.git
Patch #590913: PEP 263 support.
This commit is contained in:
parent
5428fff111
commit
eade4a1580
|
@ -1,4 +1,8 @@
|
||||||
import os
|
import os
|
||||||
|
import types
|
||||||
|
import sys
|
||||||
|
import codecs
|
||||||
|
import re
|
||||||
import tempfile
|
import tempfile
|
||||||
import tkFileDialog
|
import tkFileDialog
|
||||||
import tkMessageBox
|
import tkMessageBox
|
||||||
|
@ -24,6 +28,71 @@
|
||||||
#$ win <Control-p>
|
#$ win <Control-p>
|
||||||
#$ unix <Control-x><Control-p>
|
#$ unix <Control-x><Control-p>
|
||||||
|
|
||||||
|
# codecs.BOM_UTF8 is only available since Python 2.3; on an older
# interpreter spell out the three bytes of the UTF-8 signature instead.
BOM_UTF8 = getattr(codecs, 'BOM_UTF8', '\xef\xbb\xbf')
|
||||||
|
|
||||||
|
# Try setting the locale, so that we can find out
# what encoding to use
try:
    import locale
except ImportError:
    # No locale support at all; _detect_encoding() then answers "ascii".
    locale = None
else:
    try:
        locale.setlocale(locale.LC_CTYPE, "")
    except locale.Error:
        # The environment asks for a locale the C library rejects.
        # Keep the current locale rather than failing the whole import.
        pass


def _usable_encoding(name):
    """Return name lower-cased if Python has a codec for it, else None.

    None and the empty string count as unusable, so a locale function
    that reports no encoding is treated like one reporting an unknown one.
    """
    if not name:
        return None
    try:
        codecs.lookup(name)
    except LookupError:
        return None
    return name.lower()


def _detect_encoding():
    """Return the lower-cased name of the locale's encoding.

    Every candidate is validated with codecs.lookup() *before* it is
    accepted, so the result is always an encoding known to Python;
    "ascii" is returned when nothing usable can be determined.
    """
    if locale is None:
        return "ascii"

    if sys.platform != 'win32':
        # Different things can fail here: locale may not offer
        # nl_langinfo, or CODESET, or the resulting codeset may be
        # unknown to Python.  All of these fall through to the next try.
        try:
            name = _usable_encoding(locale.nl_langinfo(locale.CODESET))
        except AttributeError:
            name = None
        if name:
            return name

    # On Windows, we could use "mbcs". However, to give the user
    # a portable encoding name, we need to find the code page.
    # Elsewhere this is the second attempt: getdefaultlocale parses
    # environment variables, which may give a clue.  Unfortunately,
    # getdefaultlocale has bugs that can cause ValueError.
    try:
        name = _usable_encoding(locale.getdefaultlocale()[1])
    except (AttributeError, ValueError):
        name = None
    return name or "ascii"


encoding = _detect_encoding()
|
||||||
|
|
||||||
|
# PEP 263 only recognises a declaration inside a comment, so the pattern
# is anchored to a line whose first non-blank character is '#'.
coding_re = re.compile(r"^[ \t\f]*#.*?coding[:=][ \t]*([-_.a-zA-Z0-9]+)")
# A line that is empty or contains nothing but a comment.
_blank_re = re.compile(r"^[ \t\f]*(?:[#\r\n]|$)")

def coding_spec(str):
    """Return the encoding declaration according to PEP 263.

    Only the first two lines of the text are examined, and the
    declaration must appear in a comment.  A declaration on the second
    line counts only if the first line is blank or a comment.

    The parameter keeps its historical name "str" (shadowing the builtin
    inside this function) so existing callers are unaffected.

    Returns the declared encoding name, or None if there is no
    declaration.

    Raise LookupError if the encoding is declared but unknown."""
    match = None
    # Only consider the first two lines
    for line in str.split("\n", 2)[:2]:
        match = coding_re.match(line)
        if match:
            break
        if not _blank_re.match(line):
            # Real code before any declaration: stop looking.
            return None
    if not match:
        return None
    name = match.group(1)
    # Check whether the encoding is known
    try:
        codecs.lookup(name)
    except LookupError:
        # The standard encoding error does not indicate the encoding
        raise LookupError("Unknown encoding " + name)
    return name
|
||||||
|
|
||||||
class IOBinding:
|
class IOBinding:
|
||||||
|
|
||||||
|
@ -37,6 +106,7 @@ def __init__(self, editwin):
|
||||||
self.__id_savecopy = self.text.bind("<<save-copy-of-window-as-file>>",
|
self.__id_savecopy = self.text.bind("<<save-copy-of-window-as-file>>",
|
||||||
self.save_a_copy)
|
self.save_a_copy)
|
||||||
self.__id_print = self.text.bind("<<print-window>>", self.print_window)
|
self.__id_print = self.text.bind("<<print-window>>", self.print_window)
|
||||||
|
self.fileencoding = None
|
||||||
|
|
||||||
def close(self):
|
def close(self):
|
||||||
# Undo command bindings
|
# Undo command bindings
|
||||||
|
@ -101,6 +171,9 @@ def loadfile(self, filename):
|
||||||
except IOError, msg:
|
except IOError, msg:
|
||||||
tkMessageBox.showerror("I/O Error", str(msg), master=self.text)
|
tkMessageBox.showerror("I/O Error", str(msg), master=self.text)
|
||||||
return False
|
return False
|
||||||
|
|
||||||
|
chars = self.decode(chars)
|
||||||
|
|
||||||
self.text.delete("1.0", "end")
|
self.text.delete("1.0", "end")
|
||||||
self.set_filename(None)
|
self.set_filename(None)
|
||||||
self.text.insert("1.0", chars)
|
self.text.insert("1.0", chars)
|
||||||
|
@ -110,6 +183,54 @@ def loadfile(self, filename):
|
||||||
self.text.see("insert")
|
self.text.see("insert")
|
||||||
return True
|
return True
|
||||||
|
|
||||||
|
def decode(self, chars):
|
||||||
|
# Try to create a Unicode string. If that fails, let Tcl try
|
||||||
|
# its best
|
||||||
|
|
||||||
|
# Check presence of a UTF-8 signature first
|
||||||
|
if chars.startswith(BOM_UTF8):
|
||||||
|
try:
|
||||||
|
chars = chars[3:].decode("utf-8")
|
||||||
|
except UnicodeError:
|
||||||
|
# has UTF-8 signature, but fails to decode...
|
||||||
|
return chars
|
||||||
|
else:
|
||||||
|
# Indicates that this file originally had a BOM
|
||||||
|
self.fileencoding = BOM_UTF8
|
||||||
|
return chars
|
||||||
|
|
||||||
|
# Next look for coding specification
|
||||||
|
try:
|
||||||
|
enc = coding_spec(chars)
|
||||||
|
except LookupError, name:
|
||||||
|
tkMessageBox.showerror(
|
||||||
|
title="Error loading the file",
|
||||||
|
message="The encoding '%s' is not known to this Python "\
|
||||||
|
"installation. The file may not display correctly" % name,
|
||||||
|
master = self.text)
|
||||||
|
enc = None
|
||||||
|
|
||||||
|
if enc:
|
||||||
|
try:
|
||||||
|
return unicode(chars, enc)
|
||||||
|
except UnicodeError:
|
||||||
|
pass
|
||||||
|
|
||||||
|
# If it is ASCII, we need not to record anything
|
||||||
|
try:
|
||||||
|
return unicode(chars, 'ascii')
|
||||||
|
except UnicodeError:
|
||||||
|
pass
|
||||||
|
|
||||||
|
# Finally, try the locale's encoding. This is deprecated;
|
||||||
|
# the user should declare a non-ASCII encoding
|
||||||
|
try:
|
||||||
|
chars = unicode(chars, encoding)
|
||||||
|
self.fileencoding = encoding
|
||||||
|
except UnicodeError:
|
||||||
|
pass
|
||||||
|
return chars
|
||||||
|
|
||||||
def maybesave(self):
|
def maybesave(self):
|
||||||
if self.get_saved():
|
if self.get_saved():
|
||||||
return "yes"
|
return "yes"
|
||||||
|
@ -180,7 +301,7 @@ def print_window(self, event):
|
||||||
|
|
||||||
def writefile(self, filename):
|
def writefile(self, filename):
|
||||||
self.fixlastline()
|
self.fixlastline()
|
||||||
chars = str(self.text.get("1.0", "end-1c"))
|
chars = self.encode(self.text.get("1.0", "end-1c"))
|
||||||
try:
|
try:
|
||||||
f = open(filename, "w")
|
f = open(filename, "w")
|
||||||
f.write(chars)
|
f.write(chars)
|
||||||
|
@ -192,6 +313,68 @@ def writefile(self, filename):
|
||||||
master=self.text)
|
master=self.text)
|
||||||
return False
|
return False
|
||||||
|
|
||||||
|
def encode(self, chars):
|
||||||
|
if isinstance(chars, types.StringType):
|
||||||
|
# This is either plain ASCII, or Tk was returning mixed-encoding
|
||||||
|
# text to us. Don't try to guess further.
|
||||||
|
return chars
|
||||||
|
|
||||||
|
# See whether there is anything non-ASCII in it.
|
||||||
|
# If not, no need to figure out the encoding.
|
||||||
|
try:
|
||||||
|
return chars.encode('ascii')
|
||||||
|
except UnicodeError:
|
||||||
|
pass
|
||||||
|
|
||||||
|
# If there is an encoding declared, try this first.
|
||||||
|
try:
|
||||||
|
enc = coding_spec(chars)
|
||||||
|
failed = None
|
||||||
|
except LookupError, msg:
|
||||||
|
failed = msg
|
||||||
|
enc = None
|
||||||
|
if enc:
|
||||||
|
try:
|
||||||
|
return chars.encode(enc)
|
||||||
|
except UnicodeError:
|
||||||
|
failed = "Invalid encoding '%s'" % enc
|
||||||
|
|
||||||
|
if failed:
|
||||||
|
tkMessageBox.showerror(
|
||||||
|
"I/O Error",
|
||||||
|
"%s. Saving as UTF-8" % failed,
|
||||||
|
master = self.text)
|
||||||
|
|
||||||
|
# If there was a UTF-8 signature, use that. This should not fail
|
||||||
|
if self.fileencoding == BOM_UTF8 or failed:
|
||||||
|
return BOM_UTF8 + chars.encode("utf-8")
|
||||||
|
|
||||||
|
# Try the original file encoding next, if any
|
||||||
|
if self.fileencoding:
|
||||||
|
try:
|
||||||
|
return chars.encode(self.fileencoding)
|
||||||
|
except UnicodeError:
|
||||||
|
tkMessageBox.showerror(
|
||||||
|
"I/O Error",
|
||||||
|
"Cannot save this as '%s' anymore. Saving as UTF-8" % self.fileencoding,
|
||||||
|
master = self.text)
|
||||||
|
return BOM_UTF8 + chars.encode("utf-8")
|
||||||
|
|
||||||
|
# Nothing was declared, and we had not determined an encoding
|
||||||
|
# on loading. Recommend an encoding line.
|
||||||
|
try:
|
||||||
|
chars = chars.encode(encoding)
|
||||||
|
enc = encoding
|
||||||
|
except UnicodeError:
|
||||||
|
chars = BOM_UTF8 + chars.encode("utf-8")
|
||||||
|
enc = "utf-8"
|
||||||
|
tkMessageBox.showerror(
|
||||||
|
"I/O Error",
|
||||||
|
"Non-ASCII found, yet no encoding declared. Add a line like\n"
|
||||||
|
"# -*- coding: %s -*- \nto your file" % enc,
|
||||||
|
master = self.text)
|
||||||
|
return chars
|
||||||
|
|
||||||
def fixlastline(self):
|
def fixlastline(self):
|
||||||
c = self.text.get("end-2c")
|
c = self.text.get("end-2c")
|
||||||
if c != '\n':
|
if c != '\n':
|
||||||
|
|
|
@ -6,6 +6,7 @@
|
||||||
import getopt
|
import getopt
|
||||||
import re
|
import re
|
||||||
import warnings
|
import warnings
|
||||||
|
import types
|
||||||
|
|
||||||
import linecache
|
import linecache
|
||||||
from code import InteractiveInterpreter
|
from code import InteractiveInterpreter
|
||||||
|
@ -188,6 +189,9 @@ def runsource(self, source):
|
||||||
self.more = 0
|
self.more = 0
|
||||||
self.save_warnings_filters = warnings.filters[:]
|
self.save_warnings_filters = warnings.filters[:]
|
||||||
warnings.filterwarnings(action="error", category=SyntaxWarning)
|
warnings.filterwarnings(action="error", category=SyntaxWarning)
|
||||||
|
if isinstance(source, types.UnicodeType):
|
||||||
|
import IOBinding
|
||||||
|
source = source.encode(IOBinding.encoding)
|
||||||
try:
|
try:
|
||||||
return InteractiveInterpreter.runsource(self, source, filename)
|
return InteractiveInterpreter.runsource(self, source, filename)
|
||||||
finally:
|
finally:
|
||||||
|
|
Loading…
Reference in New Issue