From 948cfd3b7b40ae419c21c1688122f9c51a0e869f Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Jos=C3=A9=20Matox?= <jamatos@lyx.org>
Date: Tue, 24 Jul 2007 14:58:41 +0000
Subject: [PATCH] Backport lyx2lyx from 1.5.0

git-svn-id: svn://svn.lyx.org/lyx/lyx-devel/branches/BRANCH_1_4_X@19183 a592a061-630c-0410-9148-cb99ea01b6c8
---
 lib/ChangeLog                                 |    4 +
 lib/lyx2lyx/ChangeLog                         |    9 +-
 lib/lyx2lyx/LyX.py                            |  174 +-
 lib/lyx2lyx/Makefile.am                       |   15 +-
 lib/lyx2lyx/lyx2lyx                           |   26 +-
 lib/lyx2lyx/lyx2lyx_lang.py                   |  102 +
 .../{lyx_1_0_1.py => lyx2lyx_version.py}      |   10 +-
 lib/lyx2lyx/lyx_0_06.py                       |   28 +
 lib/lyx2lyx/lyx_0_08.py                       |   34 +
 lib/lyx2lyx/lyx_0_10.py                       |  138 ++
 lib/lyx2lyx/lyx_0_12.py                       |  161 +-
 lib/lyx2lyx/{lyx_1_0_0.py => lyx_1_0.py}      |   35 +-
 lib/lyx2lyx/{lyx_1_1_4.py => lyx_1_1.py}      |    7 +-
 lib/lyx2lyx/lyx_1_1_5.py                      |  129 +-
 lib/lyx2lyx/{lyx_1_1_6.py => lyx_1_1_6_0.py}  |   38 +-
 .../{lyx_1_1_6fix3.py => lyx_1_1_6_3.py}      |   35 +-
 lib/lyx2lyx/lyx_1_2.py                        |  218 +-
 lib/lyx2lyx/lyx_1_3.py                        |   35 +-
 lib/lyx2lyx/lyx_1_4.py                        | 1573 +++++++------
 lib/lyx2lyx/lyx_1_5.py                        | 2080 +++++++++++++++++
 lib/lyx2lyx/parser_tools.py                   |  253 +-
 lib/lyx2lyx/profiling.py                      |    4 +-
 lib/unicodesymbols                            | 1399 +++++++++++
 23 files changed, 5310 insertions(+), 1197 deletions(-)
 create mode 100644 lib/lyx2lyx/lyx2lyx_lang.py
 rename lib/lyx2lyx/{lyx_1_0_1.py => lyx2lyx_version.py} (83%)
 create mode 100644 lib/lyx2lyx/lyx_0_06.py
 create mode 100644 lib/lyx2lyx/lyx_0_08.py
 create mode 100644 lib/lyx2lyx/lyx_0_10.py
 rename lib/lyx2lyx/{lyx_1_0_0.py => lyx_1_0.py} (71%)
 rename lib/lyx2lyx/{lyx_1_1_4.py => lyx_1_1.py} (78%)
 rename lib/lyx2lyx/{lyx_1_1_6.py => lyx_1_1_6_0.py} (91%)
 rename lib/lyx2lyx/{lyx_1_1_6fix3.py => lyx_1_1_6_3.py} (80%)
 create mode 100644 lib/lyx2lyx/lyx_1_5.py
 create mode 100644 lib/unicodesymbols

diff --git a/lib/ChangeLog b/lib/ChangeLog
index 115ca58c28..1449591be8 100644
--- a/lib/ChangeLog
+++ b/lib/ChangeLog
@@ -1,3 +1,7 @@
+2007-07-24  José Matos  <jamatos@lyx.org>
+
+	* unicodesymbols: new file to read documents from 1.5.x
+
 2007-07-12  Jean-Pierre Chrétien  <chretien@cert.fr>
 
 	* layouts/beamer.layout: reorder layouts (bug 3141).
diff --git a/lib/lyx2lyx/ChangeLog b/lib/lyx2lyx/ChangeLog
index 9a9c311646..64a1a6e6fa 100644
--- a/lib/lyx2lyx/ChangeLog
+++ b/lib/lyx2lyx/ChangeLog
@@ -1,3 +1,8 @@
+2007-07-24  José Matos  <jamatos@lyx.org>
+
+	* (several) Backport lyx2lyx from 1.5.0 (modulo some files used
+	for testing).
+
 2006-08-09  Jean-Marc Lasgouttes  <lasgouttes@lyx.org>
 
 	* Makefile.am (dist_lyx2lyx_DATA): rename to dist_lyx2lyx_PYTHON;
@@ -5,9 +10,11 @@
 	(install-data-hook): new target: sets executable bit on lyx2lyx.
 
 2006-07-15  Bo Peng     <ben.bob@gmail.com>
+
 	* replace all tab in .py files by spaces
 
-2006-04-10  José Matos  <jamatos@lyx.org>	
+2006-04-10  José Matos  <jamatos@lyx.org>
+
 	* parser_tools.py (find_tokens_exact, find_tokens): replace range
 	with xrange.
 
diff --git a/lib/lyx2lyx/LyX.py b/lib/lyx2lyx/LyX.py
index a23c68e590..9f907f35c6 100644
--- a/lib/lyx2lyx/LyX.py
+++ b/lib/lyx2lyx/LyX.py
@@ -1,6 +1,7 @@
 # This file is part of lyx2lyx
-# -*- coding: iso-8859-1 -*-
-# Copyright (C) 2002-2004 Dekel Tsur <dekel@lyx.org>, José Matos <jamatos@lyx.org>
+# -*- coding: utf-8 -*-
+# Copyright (C) 2002-2004 Dekel Tsur <dekel@lyx.org>
+# Copyright (C) 2002-2006 José Matos <jamatos@lyx.org>
 #
 # This program is free software; you can redistribute it and/or
 # modify it under the terms of the GNU General Public License
@@ -17,36 +18,66 @@
 # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
 
 from parser_tools import get_value, check_token, find_token,\
-     find_tokens, find_end_of, find_end_of_inset
+     find_tokens, find_end_of
 import os.path
 import gzip
+import locale
 import sys
 import re
-import string
 import time
 
-version_lyx2lyx = "1.4.1"
+try:
+    import lyx2lyx_version
+    version_lyx2lyx = lyx2lyx_version.version
+except: # we are running from build directory so assume the last version
+    version_lyx2lyx = '1.4.5'
+
 default_debug_level = 2
 
+####################################################################
+# Private helper functions
+
+def find_end_of_inset(lines, i):
+    " Find end of inset, where lines[i] is included."
+    return find_end_of(lines, i, "\\begin_inset", "\\end_inset")
+
+def generate_minor_versions(major, last_minor_version):
+    """ Generate minor versions, using major as prefix and minor
+    versions from 0 until last_minor_version, plus the generic version.
+
+    Example:
+
+      generate_minor_versions("1.2", 4) ->
+      [ "1.2", "1.2.0", "1.2.1", "1.2.2", "1.2.3", "1.2.4"]
+    """
+    return [major] + [major + ".%d" % i for i in range(last_minor_version + 1)]
+
+
+# End of helper functions
+####################################################################
+
+
 # Regular expressions used
 format_re = re.compile(r"(\d)[\.,]?(\d\d)")
 fileformat = re.compile(r"\\lyxformat\s*(\S*)")
-original_version = re.compile(r"\#LyX (\S*)")
+original_version = re.compile(r".*?LyX ([\d.]*)")
 
 ##
 # file format information:
 #  file, supported formats, stable release versions
-format_relation = [("0_10",  [210], ["0.10.7","0.10"]),
-                   ("0_12",  [215], ["0.12","0.12.1","0.12"]),
-                   ("1_0_0", [215], ["1.0.0","1.0"]),
-                   ("1_0_1", [215], ["1.0.1","1.0.2","1.0.3","1.0.4", "1.1.2","1.1"]),
-                   ("1_1_4", [215], ["1.1.4","1.1"]),
-                   ("1_1_5", [216], ["1.1.5","1.1.5fix1","1.1.5fix2","1.1"]),
-                   ("1_1_6", [217], ["1.1.6","1.1.6fix1","1.1.6fix2","1.1"]),
-                   ("1_1_6fix3", [218], ["1.1.6fix3","1.1.6fix4","1.1"]),
-                   ("1_2", [220], ["1.2.0","1.2.1","1.2.3","1.2.4","1.2"]),
-                   ("1_3", [221], ["1.3.0","1.3.1","1.3.2","1.3.3","1.3.4","1.3.5","1.3.6","1.3"]),
-                   ("1_4", range(222,246), ["1.4.0cvs","1.4"])]
+format_relation = [("0_06",    [200], generate_minor_versions("0.6" , 4)),
+                   ("0_08",    [210], generate_minor_versions("0.8" , 6) + ["0.7"]),
+                   ("0_10",    [210], generate_minor_versions("0.10", 7) + ["0.9"]),
+                   ("0_12",    [215], generate_minor_versions("0.12", 1) + ["0.11"]),
+                   ("1_0",     [215], generate_minor_versions("1.0" , 4)),
+                   ("1_1",     [215], generate_minor_versions("1.1" , 4)),
+                   ("1_1_5",   [216], ["1.1.5","1.1.5.1","1.1.5.2","1.1"]),
+                   ("1_1_6_0", [217], ["1.1.6","1.1.6.1","1.1.6.2","1.1"]),
+                   ("1_1_6_3", [218], ["1.1.6.3","1.1.6.4","1.1"]),
+                   ("1_2",     [220], generate_minor_versions("1.2" , 4)),
+                   ("1_3",     [221], generate_minor_versions("1.3" , 7)),
+                   ("1_4", range(222,246), generate_minor_versions("1.4" , 5)),
+                   ("1_5", range(246,277), generate_minor_versions("1.5" , 0))]
 
 
 def formats_list():
@@ -81,12 +112,37 @@ def trim_eol(line):
         return line[:-1]
 
 
+def get_encoding(language, inputencoding, format, cjk_encoding):
+    if format > 248:
+        return "utf8"
+    # CJK-LyX encodes files using the current locale encoding.
+    # This means that files created by CJK-LyX can only be converted using
+    # the correct locale settings unless the encoding is given as commandline
+    # argument.
+    if cjk_encoding == 'auto':
+        return locale.getpreferredencoding()
+    elif cjk_encoding != '':
+        return cjk_encoding
+    from lyx2lyx_lang import lang
+    if inputencoding == "auto" or inputencoding == "default":
+        return lang[language][3]
+    if inputencoding == "":
+        return "latin1"
+    # python does not know the alias latin9
+    if inputencoding == "latin9":
+        return "iso-8859-15"
+    return inputencoding
+
 ##
 # Class
 #
 class LyX_Base:
     """This class carries all the information of the LyX file."""
-    def __init__(self, end_format = 0, input = "", output = "", error = "", debug = default_debug_level, try_hard = 0):
+    
+    def __init__(self, end_format = 0, input = "", output = "", error
+                 = "", debug = default_debug_level, try_hard = 0, cjk_encoding = '',
+                 language = "english", encoding = "auto"):
+
         """Arguments:
         end_format: final format that the file should be converted. (integer)
         input: the name of the input source, if empty resort to standard input.
@@ -103,6 +159,7 @@ class LyX_Base:
 
         self.debug = debug
         self.try_hard = try_hard
+        self.cjk_encoding = cjk_encoding
 
         if end_format:
             self.end_format = self.lyxformat(end_format)
@@ -119,6 +176,8 @@ class LyX_Base:
         self.preamble = []
         self.body = []
         self.status = 0
+        self.encoding = encoding
+        self.language = language
 
 
     def warning(self, message, debug_level= default_debug_level):
@@ -156,7 +215,7 @@ class LyX_Base:
                     if check_token(line, '\\end_preamble'):
                         break
                     
-                    if string.split(line)[:0] in ("\\layout", "\\begin_layout", "\\begin_body"):
+                    if line.split()[:0] in ("\\layout", "\\begin_layout", "\\begin_body"):
                         self.warning("Malformed LyX file: Missing '\\end_preamble'.")
                         self.warning("Adding it now and hoping for the best.")
 
@@ -165,35 +224,45 @@ class LyX_Base:
             if check_token(line, '\\end_preamble'):
                 continue
 
-            line = string.strip(line)
+            line = line.strip()
             if not line:
                 continue
 
-            if string.split(line)[0] in ("\\layout", "\\begin_layout", "\\begin_body"):
+            if line.split()[0] in ("\\layout", "\\begin_layout", "\\begin_body", "\\begin_deeper"):
                 self.body.append(line)
                 break
 
             self.header.append(line)
 
-        while 1:
-            line = self.input.readline()
-            if not line:
-                break
-            self.body.append(trim_eol(line))
-
         self.textclass = get_value(self.header, "\\textclass", 0)
         self.backend = get_backend(self.textclass)
         self.format  = self.read_format()
-        self.language = get_value(self.header, "\\language", 0)
-        if self.language == "":
-            self.language = "english"
+        self.language = get_value(self.header, "\\language", 0, default = "english")
+        self.inputencoding = get_value(self.header, "\\inputencoding", 0, default = "auto")
+        self.encoding = get_encoding(self.language, self.inputencoding, self.format, self.cjk_encoding)
         self.initial_version = self.read_version()
 
+        # Second pass over header and preamble, now we know the file encoding
+        for i in range(len(self.header)):
+            self.header[i] = self.header[i].decode(self.encoding)
+        for i in range(len(self.preamble)):
+            self.preamble[i] = self.preamble[i].decode(self.encoding)
+
+        # Read document body
+        while 1:
+            line = self.input.readline().decode(self.encoding)
+            if not line:
+                break
+            self.body.append(trim_eol(line))
+
 
     def write(self):
         " Writes the LyX file to self.output."
         self.set_version()
         self.set_format()
+        self.set_textclass()
+        if self.encoding == "auto":
+            self.encoding = get_encoding(self.language, self.encoding, self.format, self.cjk_encoding)
 
         if self.preamble:
             i = find_token(self.header, '\\textclass', 0) + 1
@@ -206,7 +275,7 @@ class LyX_Base:
             header = self.header
 
         for line in header + [''] + self.body:
-            self.output.write(line+"\n")
+            self.output.write(line.encode(self.encoding)+"\n")
 
 
     def choose_io(self, input, output):
@@ -227,6 +296,7 @@ class LyX_Base:
             except:
                 self.input = open(input)
         else:
+            self.dir = ''
             self.input = sys.stdin
 
 
@@ -235,6 +305,8 @@ class LyX_Base:
         result = format_re.match(format)
         if result:
             format = int(result.group(1) + result.group(2))
+        elif format == '2':
+            format = 200
         else:
             self.error(str(format) + ": " + "Invalid LyX file.")
 
@@ -252,9 +324,19 @@ class LyX_Base:
             if line[0] != "#":
                 return None
 
+            line = line.replace("fix",".")
             result = original_version.match(line)
             if result:
-                return result.group(1)
+                # Special known cases: reLyX and KLyX
+                if line.find("reLyX") != -1 or line.find("KLyX") != -1:
+                    return "0.12"
+
+                res = result.group(1)
+                if not res:
+                    self.warning(line)
+                #self.warning("Version %s" % result.group(1))
+                return res
+        self.warning(str(self.header[:2]))
         return None
 
 
@@ -286,6 +368,11 @@ class LyX_Base:
         self.header[i] = "\\lyxformat %s" % format
 
 
+    def set_textclass(self):
+        i = find_token(self.header, "\\textclass", 0)
+        self.header[i] = "\\textclass %s" % self.textclass
+
+
     def set_parameter(self, param, value):
         " Set the value of the header parameter."
         i = find_token(self.header, '\\' + param, 0)
@@ -359,7 +446,7 @@ class LyX_Base:
 
         if not correct_version:
             if format <= 215:
-                self.warning("Version does not match file format, discarding it.")
+                self.warning("Version does not match file format, discarding it. (Version %s, format %d)" %(self.initial_version, self.format))
             for rel in format_relation:
                 if format in rel[1]:
                     initial_step = rel[0]
@@ -426,7 +513,7 @@ class LyX_Base:
                 self.warning('Incomplete file.', 0)
                 break
 
-            section = string.split(self.body[i])[1]
+            section = self.body[i].split()[1]
             if section[-1] == '*':
                 section = section[:-1]
 
@@ -434,12 +521,12 @@ class LyX_Base:
 
             k = i + 1
             # skip paragraph parameters
-            while not string.strip(self.body[k]) or string.split(self.body[k])[0] in allowed_parameters:
+            while not self.body[k].strip() or self.body[k].split()[0] in allowed_parameters:
                 k = k +1
 
             while k < j:
                 if check_token(self.body[k], '\\begin_inset'):
-                    inset = string.split(self.body[k])[1]
+                    inset = self.body[k].split()[1]
                     end = find_end_of_inset(self.body, k)
                     if end == -1 or end > j:
                         self.warning('Malformed file.', 0)
@@ -452,7 +539,7 @@ class LyX_Base:
                     k = k + 1
 
             # trim empty lines in the end.
-            while string.strip(par[-1]) == '' and par:
+            while par[-1].strip() == '' and par:
                 par.pop()
 
             toc_par.append(Paragraph(section, par))
@@ -464,8 +551,8 @@ class LyX_Base:
 
 class File(LyX_Base):
     " This class reads existing LyX files."
-    def __init__(self, end_format = 0, input = "", output = "", error = "", debug = default_debug_level, try_hard = 0):
-        LyX_Base.__init__(self, end_format, input, output, error, debug, try_hard)
+    def __init__(self, end_format = 0, input = "", output = "", error = "", debug = default_debug_level, try_hard = 0, cjk_encoding = ''):
+        LyX_Base.__init__(self, end_format, input, output, error, debug, try_hard, cjk_encoding)
         self.read()
 
 
@@ -481,7 +568,14 @@ class NewFile(LyX_Base):
             "\\textclass article",
             "\\language english",
             "\\inputencoding auto",
-            "\\fontscheme default",
+            "\\font_roman default",
+            "\\font_sans default",
+            "\\font_typewriter default",
+            "\\font_default_family default",
+            "\\font_sc false",
+            "\\font_osf false",
+            "\\font_sf_scale 100",
+            "\\font_tt_scale 100",
             "\\graphics default",
             "\\paperfontsize default",
             "\\papersize default",
diff --git a/lib/lyx2lyx/Makefile.am b/lib/lyx2lyx/Makefile.am
index 4de3c2c374..3c3aeb5e0d 100644
--- a/lib/lyx2lyx/Makefile.am
+++ b/lib/lyx2lyx/Makefile.am
@@ -7,18 +7,23 @@ CHMOD = chmod
 lyx2lyxdir = $(pkgdatadir)/lyx2lyx
 dist_lyx2lyx_PYTHON = \
 	lyx2lyx \
+	lyx2lyx_version.py \
+	lyx2lyx_lang.py \
 	parser_tools.py \
 	LyX.py \
+	lyx_0_06.py \
+	lyx_0_08.py \
+	lyx_0_10.py \
 	lyx_0_12.py \
-	lyx_1_0_0.py \
-	lyx_1_0_1.py \
-	lyx_1_1_4.py \
+	lyx_1_0.py \
+	lyx_1_1.py \
 	lyx_1_1_5.py \
-	lyx_1_1_6.py \
-	lyx_1_1_6fix3.py \
+	lyx_1_1_6_0.py \
+	lyx_1_1_6_3.py \
 	lyx_1_2.py \
 	lyx_1_3.py \
 	lyx_1_4.py \
+	lyx_1_5.py \
 	profiling.py
 
 install-data-hook:
diff --git a/lib/lyx2lyx/lyx2lyx b/lib/lyx2lyx/lyx2lyx
index ce0e45278d..8c7b98b263 100755
--- a/lib/lyx2lyx/lyx2lyx
+++ b/lib/lyx2lyx/lyx2lyx
@@ -1,6 +1,6 @@
 #! /usr/bin/env python
-# -*- coding: iso-8859-1 -*-
-# Copyright (C) 2002-2004 José Matos <jamatos@lyx.org>
+# -*- coding: utf-8 -*-
+# Copyright (C) 2002-2004 José Matos <jamatos@lyx.org>
 #
 # This program is free software; you can redistribute it and/or
 # modify it under the terms of the GNU General Public License
@@ -36,25 +36,30 @@ Options:
     -t, --to version		final version (optional)
     -o, --output name		name of the output file or else goes to stdout
     -n, --try-hard		try hard (ignore any convertion errors)
+    -c, --cjk [encoding]	files in format 248 and lower are read and
+				written in the format of CJK-LyX.
+				If encoding is not given or 'auto' the encoding
+				is determined from the locale.
     -q, --quiet			same as --debug=0"""
 
 
 def parse_options(argv):
-    _options =  ["help", "version", "list", "debug=", "err=", "from=", "to=", "output=", "try-hard", "quiet"]
+    _options =  ["help", "version", "list", "debug=", "err=", "from=", "to=", "output=", "try-hard", "cjk", "quiet"]
     try:
-       opts, args = getopt.getopt(argv[1:], "d:e:f:hlno:qt:v", _options)
+       opts, args = getopt.getopt(argv[1:], "c:d:e:f:hlno:qt:v", _options)
     except getopt.error:
         usage()
         sys.exit(2)
 
     end_format, input, output, error, debug, try_hard = 0, "", "", "", LyX.default_debug_level, 0
+    cjk_encoding = ''
     for o, a in opts:
         if o in ("-h", "--help"):
             usage()
             sys.exit()
         if o in ("-v", "--version"):
             print "lyx2lyx, version %s" %(LyX.version_lyx2lyx)
-            print "Copyright (C) 2002-2004 José Matos and Dekel Tsur"
+            print "Copyright (C) 2002-2004 JosĂŠ Matos and Dekel Tsur"
             sys.exit()
         if o in ("-d", "--debug"):
             debug = int(a)
@@ -71,15 +76,20 @@ def parse_options(argv):
             error = a
         if o in ("-n", "--try-hard"):
             try_hard = 1
+        if o in ("-c", "--cjk"):
+            if a == '':
+                cjk_encoding = 'auto'
+            else:
+                cjk_encoding = a
     if args:
         input = args[0]
 
-    return end_format, input, output, error, debug, try_hard
+    return end_format, input, output, error, debug, try_hard, cjk_encoding
 
 
 def main(argv):
-    end_format, input, output, error, debug, try_hard = parse_options(argv)
-    file = LyX.File(end_format, input, output, error, debug, try_hard)
+    end_format, input, output, error, debug, try_hard, cjk_encoding = parse_options(argv)
+    file = LyX.File(end_format, input, output, error, debug, try_hard, cjk_encoding)
 
     file.convert()
     file.write()
diff --git a/lib/lyx2lyx/lyx2lyx_lang.py b/lib/lyx2lyx/lyx2lyx_lang.py
new file mode 100644
index 0000000000..d5b76d2d03
--- /dev/null
+++ b/lib/lyx2lyx/lyx2lyx_lang.py
@@ -0,0 +1,102 @@
+# This file is generated by generate_incoding_info.py from lib/languages file.
+# Do not change this file directly.
+
+lang = {'afrikaans': ['afrikaans', 'Afrikaans', 'false', 'iso8859-1', 'af_ZA', ''],
+ 'american': ['american', 'American', 'false', 'iso8859-1', 'en_US', ''],
+ 'arabic': ['arabic', 'Arabic', 'true', 'iso8859-6', 'ar_SA', ''],
+ 'austrian': ['austrian', 'Austrian', 'false', 'iso8859-1', 'de_AT', ''],
+ 'bahasa': ['bahasa', 'Bahasa', 'false', 'iso8859-1', 'in_ID', ''],
+ 'basque': ['basque', 'Basque', 'false', 'iso8859-1', 'eu_ES', ''],
+ 'belarusian': ['belarusian', 'Belarusian', 'false', 'cp1251', 'be_BY', ''],
+ 'brazil': ['brazil',
+            'Portuguese (Brazil)',
+            'false',
+            'iso8859-1',
+            'pt_BR',
+            ''],
+ 'breton': ['breton', 'Breton', 'false', 'iso8859-1', 'br_FR', ''],
+ 'british': ['british', 'British', 'false', 'iso8859-1', 'en_GB', ''],
+ 'bulgarian': ['bulgarian', 'Bulgarian', 'false', 'cp1251', 'bg_BG', ''],
+ 'canadian': ['canadian', 'Canadian', 'false', 'iso8859-1', 'en_CA', ''],
+ 'canadien': ['canadien',
+              'French Canadian',
+              'false',
+              'iso8859-1',
+              'fr_CA',
+              ''],
+ 'catalan': ['catalan', 'Catalan', 'false', 'iso8859-1', 'ca_ES', ''],
+ 'croatian': ['croatian', 'Croatian', 'false', 'iso8859-2', 'hr_HR', ''],
+ 'czech': ['czech', 'Czech', 'false', 'iso8859-2', 'cs_CZ', ''],
+ 'danish': ['danish', 'Danish', 'false', 'iso8859-1', 'da_DK', ''],
+ 'dutch': ['dutch', 'Dutch', 'false', 'iso8859-1', 'nl_NL', ''],
+ 'english': ['english', 'English', 'false', 'iso8859-1', 'en_US', ''],
+ 'esperanto': ['esperanto', 'Esperanto', 'false', 'iso8859-3', 'eo', ''],
+ 'estonian': ['estonian', 'Estonian', 'false', 'iso8859-1', 'et_EE', ''],
+ 'finnish': ['finnish', 'Finnish', 'false', 'iso8859-1', 'fi_FI', ''],
+ 'french': ['french',
+            'French',
+            'false',
+            'iso8859-1',
+            'fr_FR',
+            '\\addto\\extrasfrench{\\providecommand{\\og}{\\leavevmode\\flqq~}\\providecommand{\\fg}{\\ifdim\\lastskip>\\z@\\unskip\\fi~\\frqq}}'],
+ 'frenchb': ['french', 'French', 'false', 'iso8859-1', 'fr_FR', ''], # for compatibility reasons
+ 'galician': ['galician', 'Galician', 'false', 'iso8859-1', 'gl_ES', ''],
+ 'german': ['german', 'German', 'false', 'iso8859-1', 'de_DE', ''],
+ 'greek': ['greek', 'Greek', 'false', 'iso8859-7', 'el_GR', ''],
+ 'hebrew': ['hebrew', 'Hebrew', 'true', 'cp1255', 'he_IL', ''],
+ 'icelandic': ['icelandic', 'Icelandic', 'false', 'iso8859-1', 'is_IS', ''],
+ 'irish': ['irish', 'Irish', 'false', 'iso8859-1', 'ga_IE', ''],
+ 'italian': ['italian', 'Italian', 'false', 'iso8859-1', 'it_IT', ''],
+ 'kazakh': ['kazakh', 'Kazakh', 'false', 'pt154', 'kk_KZ', ''],
+ 'latvian': ['latvian', 'Latvian', 'false', 'iso8859-13', 'lv_LV', ''],
+ 'lithuanian': ['lithuanian',
+                'Lithuanian',
+                'false',
+                'iso8859-13',
+                'lt_LT',
+                ''],
+ 'magyar': ['magyar', 'Magyar', 'false', 'iso8859-2', 'hu_HU', ''],
+ 'naustrian': ['naustrian',
+               'Austrian (new spelling)',
+               'false',
+               'iso8859-1',
+               'de_AT',
+               ''],
+ 'ngerman': ['ngerman',
+             'German (new spelling)',
+             'false',
+             'iso8859-1',
+             'de_DE',
+             ''],
+ 'norsk': ['norsk', 'Norsk', 'false', 'iso8859-1', 'no_NO', ''],
+ 'nynorsk': ['nynorsk', 'Nynorsk', 'false', 'iso8859-1', 'nn_NO', ''],
+ 'polish': ['polish', 'Polish', 'false', 'iso8859-2', 'pl_PL', ''],
+ 'portuges': ['portuges', 'Portugese', 'false', 'iso8859-1', 'pt_PT', ''],
+ 'romanian': ['romanian', 'Romanian', 'false', 'iso8859-2', 'ro_RO', ''],
+ 'russian': ['russian', 'Russian', 'false', 'koi8', 'ru_RU', ''],
+ 'scottish': ['scottish', 'Scottish', 'false', 'iso8859-1', 'gd_GB', ''],
+ 'serbian': ['croatian', 'Serbian', 'false', 'iso8859-5', 'sr_HR', ''],
+ 'serbocroatian': ['croatian',
+                   'Serbo-Croatian',
+                   'false',
+                   'iso8859-2',
+                   'sh_HR',
+                   ''],
+ 'slovak': ['slovak', 'Slovak', 'false', 'iso8859-2', 'sk_SK', ''],
+ 'slovene': ['slovene', 'Slovene', 'false', 'iso8859-2', 'sl_SI', ''],
+ 'spanish': ['spanish',
+             'Spanish',
+             'false',
+             'iso8859-1',
+             'es_ES',
+             '\\deactivatetilden'],
+ 'swedish': ['swedish', 'Swedish', 'false', 'iso8859-1', 'sv_SE', ''],
+ 'thai': ['thai',
+          'Thai',
+          'false',
+          'tis620-0',
+          'th_TH',
+          '\\usepackage{thswitch}'],
+ 'turkish': ['turkish', 'Turkish', 'false', 'iso8859-9', 'tr_TR', ''],
+ 'ukrainian': ['ukrainian', 'Ukrainian', 'false', 'koi8-u', 'uk_UA', ''],
+ 'welsh': ['welsh', 'Welsh', 'false', 'iso8859-1', 'cy_GB', '']}
diff --git a/lib/lyx2lyx/lyx_1_0_1.py b/lib/lyx2lyx/lyx2lyx_version.py
similarity index 83%
rename from lib/lyx2lyx/lyx_1_0_1.py
rename to lib/lyx2lyx/lyx2lyx_version.py
index 199fb3022a..35378747c3 100644
--- a/lib/lyx2lyx/lyx_1_0_1.py
+++ b/lib/lyx2lyx/lyx2lyx_version.py
@@ -1,6 +1,6 @@
-# This file is part of lyx2lyx
-# -*- coding: iso-8859-1 -*-
-# Copyright (C) 2004 José Matos <jamatos@lyx.org>
+# This file is part of lyx2lyx -*- python -*-
+# -*- coding: utf-8 -*-
+# Copyright (C) 2006 José Matos <jamatos@lyx.org>
 #
 # This program is free software; you can redistribute it and/or
 # modify it under the terms of the GNU General Public License
@@ -16,9 +16,7 @@
 # along with this program; if not, write to the Free Software
 # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
 
-convert = [[215, []]]
-revert  = []
-
+version = "1.4.5"
 
 if __name__ == "__main__":
     pass
diff --git a/lib/lyx2lyx/lyx_0_06.py b/lib/lyx2lyx/lyx_0_06.py
new file mode 100644
index 0000000000..f518cbcde6
--- /dev/null
+++ b/lib/lyx2lyx/lyx_0_06.py
@@ -0,0 +1,28 @@
+# This file is part of lyx2lyx
+# -*- coding: utf-8 -*-
+# Copyright (C) 2006 José Matos <jamatos@lyx.org>
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+
+""" Convert files to the file format generated by lyx 0.6"""
+
+supported_versions = ["0.6.%d" % i for i in range(5)] + ["0.6"]
+convert = [[200, []]]
+revert  = []
+
+
+if __name__ == "__main__":
+    pass
+
diff --git a/lib/lyx2lyx/lyx_0_08.py b/lib/lyx2lyx/lyx_0_08.py
new file mode 100644
index 0000000000..0186decbf2
--- /dev/null
+++ b/lib/lyx2lyx/lyx_0_08.py
@@ -0,0 +1,34 @@
+# This file is part of lyx2lyx
+# -*- coding: utf-8 -*-
+# Copyright (C) 2006 José Matos <jamatos@lyx.org>
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+
+""" Convert files to the file format generated by lyx 0.8"""
+
+def add_inputencoding(document):
+    " Add the input encoding, latin1"
+    document.header.append('\\inputencoding latin1')
+    document.inputencoding = "latin1"
+
+
+supported_versions = ["0.8.%d" % i for i in range(7)] + ["0.8"]
+convert = [[210, [add_inputencoding]]]
+revert  = []
+
+
+if __name__ == "__main__":
+    pass
+
diff --git a/lib/lyx2lyx/lyx_0_10.py b/lib/lyx2lyx/lyx_0_10.py
new file mode 100644
index 0000000000..ebbbf0fc46
--- /dev/null
+++ b/lib/lyx2lyx/lyx_0_10.py
@@ -0,0 +1,138 @@
+# This file is part of lyx2lyx
+# -*- coding: utf-8 -*-
+# Copyright (C) 2006 José Matos <jamatos@lyx.org>
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+
+""" Convert files to the file format generated by lyx 0.10"""
+
+def regularise_header(document):
+    " Put each entry in header into a separate line. "
+    i = 0
+    while i < len(document.header):
+        line = document.header[i]
+        if len(line.split('\\')) > 1:
+            tmp = [ '\\'+ token.strip() for token in line.split('\\')][1:]
+            document.header[i: i+1] = tmp
+            i += len(tmp)
+        i += 1
+
+
+def find_next_space(line, j):
+    """ Return position of next space or backslash, whichever comes
+    first, starting from position j; if neither exists, return the
+    length of the line."""
+    l = line.find(' ', j)
+    if l == -1:
+        l = len(line)
+    k = line.find('\\', j)
+    if k == -1:
+        k = len(line)
+
+    if k < l:
+        return k
+    return l
+
+
+def regularise_body(document):
+    """ Place tokens starting with a backslash into a separate line. """
+
+    getline_tokens = ["added_space_bottom", "added_space_top",
+                      "align", "layout", "fill_bottom", "fill_top",
+                      "labelwidthstring", "pagebreak_top",
+                      "pagebreak_bottom", "noindent"]
+
+    noargs_tokens = ["backslash", "begin_deeper", "end_deeper",
+                     "end_float", "end_inset", "hfill", "newline",
+                     "protected_separator"]
+
+    onearg_tokens = ["bar", "begin_float", "family", "latex", "shape",
+                     "size", "series", "cursor"]
+
+    i = 0
+    while i < len(document.body):
+        line = document.body[i]
+        j = 0
+        tmp = []
+        while j < len(line):
+            k = line.find('\\', j)
+
+            if k == -1:
+                tmp += [line[j:]]
+                break
+
+            if k != j:
+                tmp += [line[j: k]]
+                j = k
+
+            k = find_next_space(line, j+1)
+
+            # These tokens take the rest of the line
+            token = line[j+1:k]
+            if token in getline_tokens:
+                tmp += [line[j:]]
+                break
+
+            # These tokens take no arguments
+            if token in noargs_tokens:
+                tmp += [line[j:k]]
+                j = k
+                continue
+
+            # These tokens take one argument
+            if token in onearg_tokens:
+                k = find_next_space(line, k + 1)
+                tmp += [line[j:k]]
+                j = k
+                continue
+
+            # Special treatment for insets
+            if token in ["begin_inset"]:
+                l = find_next_space(line, k + 1)
+                inset = line[k+1: l]
+
+                if inset == "Latex":
+                    tmp += [line[j:l]]
+                    j = l
+                    continue
+
+                if inset in ["LatexCommand", "LatexDel"]:
+                    tmp += [line[j:]]
+                    break
+
+                if inset == "Quotes":
+                    l = find_next_space(line, l + 1)
+                    tmp += [line[j:l]]
+                    j = l
+                    continue
+
+                document.warning("unkown inset %s" % line)
+                assert(False)
+
+            # We are inside a latex inset, pass the text verbatim
+            tmp += [line[j:]]
+            break
+
+        document.body[i: i+1] = tmp
+        i += len(tmp)
+
+
+supported_versions = ["0.10.%d" % i for i in range(8)] + ["0.10"]
+convert = [[210, [regularise_header, regularise_body]]]
+revert  = []
+
+
+if __name__ == "__main__":
+    pass
diff --git a/lib/lyx2lyx/lyx_0_12.py b/lib/lyx2lyx/lyx_0_12.py
index 8b07ac493d..f381eb817d 100644
--- a/lib/lyx2lyx/lyx_0_12.py
+++ b/lib/lyx2lyx/lyx_0_12.py
@@ -1,6 +1,6 @@
 # This file is part of lyx2lyx
-# -*- coding: iso-8859-1 -*-
-# Copyright (C) 2003-2004 José Matos <jamatos@lyx.org>
+# -*- coding: utf-8 -*-
+# Copyright (C) 2003-2004 José Matos <jamatos@lyx.org>
 #
 # This program is free software; you can redistribute it and/or
 # modify it under the terms of the GNU General Public License
@@ -16,41 +16,46 @@
 # along with this program; if not, write to the Free Software
 # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
 
+""" Convert files to the file format generated by lyx 0.12"""
+
 import re
-import string
 from parser_tools import find_token, find_re, check_token
 
 
-def space_before_layout(file):
-    lines = file.body
+def space_before_layout(document):
+    " Remove empty line before \\layout. "
+    lines = document.body
     i = 2 # skip first layout
     while 1:
         i = find_token(lines, '\\layout', i)
         if i == -1:
             break
 
-        if lines[i - 1] == '' and string.find(lines[i-2],'\\protected_separator') == -1:
+        prot_space = lines[i-2].find('\\protected_separator')
+        if lines[i - 1] == '' and prot_space == -1:
             del lines[i-1]
         i = i + 1
 
 
-def formula_inset_space_eat(file):
-    lines = file.body
-    i=0
+def formula_inset_space_eat(document):
+    " Remove space after inset formula."
+    lines = document.body
+    i = 0
     while 1:
         i = find_token(lines, "\\begin_inset Formula", i)
-        if i == -1: break
+        if i == -1:
+            break
 
         if len(lines[i]) > 22 and lines[i][21] == ' ':
             lines[i] = lines[i][:20] + lines[i][21:]
         i = i + 1
 
 
-# Update from tabular format 1 or 2 to 4
-def update_tabular(file):
-    lines = file.body
+def update_tabular(document):
+    " Update from tabular format 1 or 2 to 4."
+    lines = document.body
     lyxtable_re = re.compile(r".*\\LyXTable$")
-    i=0
+    i = 0
     while 1:
         i = find_re(lines, lyxtable_re, i)
         if i == -1:
@@ -58,10 +63,10 @@ def update_tabular(file):
         i = i + 1
         format = lines[i][8:]
 
-        lines[i]='multicol4'
+        lines[i] = 'multicol4'
         i = i + 1
-        rows = int(string.split(lines[i])[0])
-        columns = int(string.split(lines[i])[1])
+        rows = int(lines[i].split()[0])
+        columns = int(lines[i].split()[1])
 
         lines[i] = lines[i] + ' 0 0 -1 -1 -1 -1'
         i = i + 1
@@ -74,27 +79,34 @@ def update_tabular(file):
             lines[i] = lines[i] + ' '
             i = i + 1
 
-        while string.strip(lines[i]):
+        while lines[i].strip():
             if not format:
                 lines[i] = lines[i] + ' 1 1'
             lines[i] = lines[i] + ' 0 0 0'
             i = i + 1
 
-        lines[i] = string.strip(lines[i])
+        lines[i] = lines[i].strip()
 
-def final_dot(file):
-    lines = file.body
+
+def final_dot(document):
+    " Merge lines if the dot is the final character."
+    lines = document.body
     i = 0
     while i < len(lines):
-        if lines[i][-1:] == '.' and lines[i+1][:1] != '\\' and  lines[i+1][:1] != ' ' and len(lines[i]) + len(lines[i+1])<= 72 and lines[i+1] != '':
+        
+        if lines[i][-1:] == '.' and lines[i+1][:1] != '\\' and \
+               lines[i+1][:1] != ' ' and len(lines[i]) + len(lines[i+1])<= 72 \
+               and lines[i+1] != '':
+
             lines[i] = lines[i] + lines[i+1]
             del lines[i+1]
         else:
             i = i + 1
 
 
-def update_inset_label(file):
-    lines = file.body
+def update_inset_label(document):
+    " Update inset Label."
+    lines = document.body
     i = 0
     while 1:
         i = find_token(lines, '\\begin_inset Label', i)
@@ -104,26 +116,32 @@ def update_inset_label(file):
         i = i + 1
 
 
-def update_latexdel(file):
-    lines = file.body
+def update_latexdel(document):
+    " Update inset LatexDel."
+    lines = document.body
     i = 0
     while 1:
         i = find_token(lines, '\\begin_inset LatexDel', i)
         if i == -1:
             return
-        lines[i] = string.replace(lines[i],'\\begin_inset LatexDel', '\\begin_inset LatexCommand')
+        lines[i] = lines[i].replace('\\begin_inset LatexDel',
+                                    '\\begin_inset LatexCommand')
         i = i + 1
 
 
-def update_vfill(file):
-    lines = file.body
+def update_vfill(document):
+    " Update fill_top and fill_bottom."
+    lines = document.body
     for i in range(len(lines)):
-        lines[i] = string.replace(lines[i],'\\fill_top','\\added_space_top vfill')
-        lines[i] = string.replace(lines[i],'\\fill_bottom','\\added_space_bottom vfill')
+        lines[i] = lines[i].replace('\\fill_top',
+                                    '\\added_space_top vfill')
+        lines[i] = lines[i].replace('\\fill_bottom',
+                                    '\\added_space_bottom vfill')
 
 
-def update_space_units(file):
-    lines = file.body
+def update_space_units(document):
+    " Update space units."
+    lines = document.body
     added_space_bottom = re.compile(r'\\added_space_bottom ([^ ]*)')
     added_space_top    = re.compile(r'\\added_space_top ([^ ]*)')
     for i in range(len(lines)):
@@ -131,17 +149,18 @@ def update_space_units(file):
         if result:
             old = '\\added_space_bottom ' + result.group(1)
             new = '\\added_space_bottom ' + str(float(result.group(1))) + 'cm'
-            lines[i] = string.replace(lines[i], old, new)
+            lines[i] = lines[i].replace(old, new)
 
         result = added_space_top.search(lines[i])
         if result:
             old = '\\added_space_top ' + result.group(1)
             new = '\\added_space_top ' + str(float(result.group(1))) + 'cm'
-            lines[i] = string.replace(lines[i], old, new)
+            lines[i] = lines[i].replace(old, new)
 
 
-def remove_cursor(file):
-    lines = file.body
+def remove_cursor(document):
+    " Remove cursor, it is not saved on the file anymore."
+    lines = document.body
     i = 0
     cursor_re = re.compile(r'.*(\\cursor \d*)')
     while 1:
@@ -149,15 +168,16 @@ def remove_cursor(file):
         if i == -1:
             break
         cursor = cursor_re.search(lines[i]).group(1)
-        lines[i]= string.replace(lines[i], cursor, '')
+        lines[i] = lines[i].replace(cursor, '')
         i = i + 1
 
 
-def remove_empty_insets(file):
-    lines = file.body
+def remove_empty_insets(document):
+    " Remove empty insets."
+    lines = document.body
     i = 0
     while 1:
-        i = find_token(lines, '\\begin_inset ',i)
+        i = find_token(lines, '\\begin_inset ', i)
         if i == -1:
             break
         if lines[i] == '\\begin_inset ' and lines[i+1] == '\\end_inset ':
@@ -166,8 +186,9 @@ def remove_empty_insets(file):
         i = i + 1
 
 
-def remove_formula_latex(file):
-    lines = file.body
+def remove_formula_latex(document):
+    " Remove formula latex."
+    lines = document.body
     i = 0
     while 1:
         i = find_token(lines, '\\latex formula_latex ', i)
@@ -181,15 +202,17 @@ def remove_formula_latex(file):
         del lines[i]
 
 
-def add_end_document(file):
-    lines = file.body
+def add_end_document(document):
+    " Add \\the_end to the end of the document."
+    lines = document.body
     i = find_token(lines, '\\the_end', 0)
     if i == -1:
         lines.append('\\the_end')
 
 
-def header_update(file):
-    lines = file.header
+def header_update(document):
+    " Update document header."
+    lines = document.header
     i = 0
     l = len(lines)
     while i < l:
@@ -197,12 +220,12 @@ def header_update(file):
             lines[i] = lines[i][:-1]
 
         if check_token(lines[i], '\\epsfig'):
-            lines[i] = string.replace(lines[i], '\\epsfig', '\\graphics')
+            lines[i] = lines[i].replace('\\epsfig', '\\graphics')
             i = i + 1
             continue
 
         if check_token(lines[i], '\\papersize'):
-            size = string.split(lines[i])[1]
+            size = lines[i].split()[1]
             new_size = size
             paperpackage = ""
 
@@ -225,7 +248,7 @@ def header_update(file):
 
 
         if check_token(lines[i], '\\baselinestretch'):
-            size = string.split(lines[i])[1]
+            size = lines[i].split()[1]
             if size == '1.00':
                 name = 'single'
             elif size == '1.50':
@@ -241,17 +264,18 @@ def header_update(file):
         i = i + 1
 
 
-def update_latexaccents(file):
-    body = file.body
+def update_latexaccents(document):
+    " Update latex accent insets."
+    body = document.body
     i = 1
     while 1:
         i = find_token(body, '\\i ', i)
         if i == -1:
             return
 
-        contents = string.strip(body[i][2:])
+        contents = body[i][2:].strip()
 
-        if string.find(contents, '{') != -1 and string.find(contents, '}') != -1:
+        if contents.find('{') != -1 and contents.find('}') != -1:
             i = i + 1
             continue
 
@@ -269,26 +293,47 @@ def update_latexaccents(file):
         i = i + 1
 
 
-def obsolete_latex_title(file):
-    body = file.body
+def obsolete_latex_title(document):
+    " Replace layout Latex_Title with Title."
+    body = document.body
     i = 0
     while 1:
         i = find_token(body, '\\layout', i)
         if i == -1:
             return
 
-        if string.find(string.lower(body[i]),'latex_title') != -1:
+        if body[i].lower().find('latex_title') != -1:
             body[i] = '\\layout Title'
 
         i = i + 1
 
 
+def remove_inset_latex(document):
+    "Replace inset latex with layout LaTeX"
+    body = document.body
+
+    i = 0
+    while 1:
+        i = find_token(body, '\\begin_inset Latex', i)
+        if i == -1:
+            return
+
+        body[i] = body[i].replace('\\begin_inset Latex', '\\layout LaTeX')
+        i = find_token(body, '\\end_inset', i)
+        if i == -1:
+            #this should not happen
+            return
+        del body[i]
+        
+    
+supported_versions = ["0.12.0","0.12.1","0.12"]
 convert = [[215, [header_update, add_end_document, remove_cursor,
                   final_dot, update_inset_label, update_latexdel,
                   update_space_units, space_before_layout,
                   formula_inset_space_eat, update_tabular,
                   update_vfill, remove_empty_insets,
-                  remove_formula_latex, update_latexaccents, obsolete_latex_title]]]
+                  remove_formula_latex, update_latexaccents,
+                  obsolete_latex_title, remove_inset_latex]]]
 revert  = []
 
 
diff --git a/lib/lyx2lyx/lyx_1_0_0.py b/lib/lyx2lyx/lyx_1_0.py
similarity index 71%
rename from lib/lyx2lyx/lyx_1_0_0.py
rename to lib/lyx2lyx/lyx_1_0.py
index 6ca27628b4..7862b61d96 100644
--- a/lib/lyx2lyx/lyx_1_0_0.py
+++ b/lib/lyx2lyx/lyx_1_0.py
@@ -1,6 +1,6 @@
 # This file is part of lyx2lyx
-# -*- coding: iso-8859-1 -*-
-# Copyright (C) 2004 José Matos <jamatos@lyx.org>
+# -*- coding: utf-8 -*-
+# Copyright (C) 2004 José Matos <jamatos@lyx.org>
 #
 # This program is free software; you can redistribute it and/or
 # modify it under the terms of the GNU General Public License
@@ -16,29 +16,33 @@
 # along with this program; if not, write to the Free Software
 # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
 
+""" Convert files to the file format generated by lyx 1.0"""
+
 import re
-import string
 from parser_tools import find_token, find_re
 
-def obsolete_latex_title(file):
-    body = file.body
+def obsolete_latex_title(document):
+    " Replace LatexTitle layout with Title. "
+
+    body = document.body
     i = 0
     while 1:
         i = find_token(body, '\\layout', i)
         if i == -1:
             return
 
-        if string.find(string.lower(body[i]),'latex title') != -1:
+        if body[i].lower().find('latex title') != -1:
             body[i] = '\\layout Title'
 
         i = i + 1
 
 
-# Update from tabular format 3 to 4 if necessary
-def update_tabular(file):
-    lines = file.body
+def update_tabular(document):
+    " Update from tabular format 3 to 4 if necessary."
+
+    lines = document.body
     lyxtable_re = re.compile(r".*\\LyXTable$")
-    i=0
+    i = 0
     while 1:
         i = find_re(lines, lyxtable_re, i)
         if i == -1:
@@ -49,10 +53,10 @@ def update_tabular(file):
         if format != '3':
             continue
 
-        lines[i]='multicol4'
+        lines[i] = 'multicol4'
         i = i + 1
-        rows = int(string.split(lines[i])[0])
-        columns = int(string.split(lines[i])[1])
+        rows = int(lines[i].split()[0])
+        columns = int(lines[i].split()[1])
 
         lines[i] = lines[i] + ' 0 0 -1 -1 -1 -1'
         i = i + 1
@@ -65,13 +69,14 @@ def update_tabular(file):
             lines[i] = lines[i] + ' '
             i = i + 1
 
-        while string.strip(lines[i]):
+        while lines[i].strip():
             lines[i] = lines[i] + ' 0 0 0'
             i = i + 1
 
-        lines[i] = string.strip(lines[i])
+        lines[i] = lines[i].strip()
 
 
+supported_versions = ["1.0.%d" % i for i in range(5)] + ["1.0"]
 convert = [[215, [obsolete_latex_title, update_tabular]]]
 revert  = []
 
diff --git a/lib/lyx2lyx/lyx_1_1_4.py b/lib/lyx2lyx/lyx_1_1.py
similarity index 78%
rename from lib/lyx2lyx/lyx_1_1_4.py
rename to lib/lyx2lyx/lyx_1_1.py
index 199fb3022a..5927c0f37e 100644
--- a/lib/lyx2lyx/lyx_1_1_4.py
+++ b/lib/lyx2lyx/lyx_1_1.py
@@ -1,6 +1,6 @@
 # This file is part of lyx2lyx
-# -*- coding: iso-8859-1 -*-
-# Copyright (C) 2004 José Matos <jamatos@lyx.org>
+# -*- coding: utf-8 -*-
+# Copyright (C) 2004 José Matos <jamatos@lyx.org>
 #
 # This program is free software; you can redistribute it and/or
 # modify it under the terms of the GNU General Public License
@@ -16,6 +16,9 @@
 # along with this program; if not, write to the Free Software
 # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
 
+""" Convert files to the file format generated by lyx 1.1 series, until 1.1.4"""
+
+supported_versions = ["1.1.%d" % i for i in range(5)] + ["1.1"]
 convert = [[215, []]]
 revert  = []
 
diff --git a/lib/lyx2lyx/lyx_1_1_5.py b/lib/lyx2lyx/lyx_1_1_5.py
index d8dc59006e..8720cfcefb 100644
--- a/lib/lyx2lyx/lyx_1_1_5.py
+++ b/lib/lyx2lyx/lyx_1_1_5.py
@@ -1,6 +1,6 @@
-# This file is part of lyx2lyx
-# -*- coding: iso-8859-1 -*-
-# Copyright (C) 2002-2004 José Matos <jamatos@lyx.org>
+# This file is part of lyx2lyx
+# -*- coding: utf-8 -*-
+# Copyright (C) 2002-2004 José Matos <jamatos@lyx.org>
 #
 # This program is free software; you can redistribute it and/or
 # modify it under the terms of the GNU General Public License
@@ -16,15 +16,29 @@
 # along with this program; if not, write to the Free Software
 # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
 
-import re
-import string
-from parser_tools import find_token, find_token_backwards, find_re, get_layout
+""" Convert files to the file format generated by lyx 1.1.5"""
 
+import re
+from parser_tools import find_token, find_token_backwards, find_re
+
+####################################################################
+# Private helper functions
+
+def get_layout(line, default_layout):
+    " Get the line layout, beware of the empty layout."
+    tokens = line.split()
+    if len(tokens) > 1:
+        return tokens[1]
+    return default_layout
+
+
+####################################################################
 
 math_env = ["\\[","\\begin{eqnarray*}","\\begin{eqnarray}","\\begin{equation}"]
 
-def replace_protected_separator(file):
-    lines = file.body
+def replace_protected_separator(document):
+    " Replace protected separator. "
+    lines = document.body
     i=0
     while 1:
         i = find_token(lines, "\\protected_separator", i)
@@ -32,7 +46,7 @@ def replace_protected_separator(file):
             break
         j = find_token_backwards(lines, "\\layout", i)
         #if j == -1: print error
-        layout = get_layout(lines[j], file.default_layout)
+        layout = get_layout(lines[j], document.default_layout)
 
         if layout == "LyX-Code":
             result = ""
@@ -47,8 +61,9 @@ def replace_protected_separator(file):
         del lines[i]
 
 
-def merge_formula_inset(file):
-    lines = file.body
+def merge_formula_inset(document):
+    " Merge formula insets. "
+    lines = document.body
     i=0
     while 1:
         i = find_token(lines, "\\begin_inset Formula", i)
@@ -59,9 +74,9 @@ def merge_formula_inset(file):
         i = i + 1
 
 
-# Update from tabular format 4 to 5 if necessary
-def update_tabular(file):
-    lines = file.body
+def update_tabular(document):
+    " Update from tabular format 4 to 5 if necessary. "
+    lines = document.body
     lyxtable_re = re.compile(r".*\\LyXTable$")
     i=0
     while 1:
@@ -75,16 +90,16 @@ def update_tabular(file):
 
         lines[i]='multicol5'
         i = i + 1
-        rows = int(string.split(lines[i])[0])
-        columns = int(string.split(lines[i])[1])
+        rows = int(lines[i].split()[0])
+        columns = int(lines[i].split()[1])
 
         i = i + rows + 1
         for j in range(columns):
-            col_info = string.split(lines[i])
+            col_info = lines[i].split()
             if len(col_info) == 3:
                 lines[i] = lines[i] + '"" ""'
             else:
-                lines[i] = string.join(col_info[:3]) + ' "%s" ""' % col_info[3]
+                lines[i] = " ".join(col_info[:3]) + ' "%s" ""' % col_info[3]
             i = i + 1
 
         while lines[i]:
@@ -92,26 +107,30 @@ def update_tabular(file):
             i = i + 1
 
 
-def update_toc(file):
-    lines = file.body
+def update_toc(document):
+    " Update table of contents. "
+    lines = document.body
     i = 0
     while 1:
-        i = find_token(lines, '\\begin_inset LatexCommand \\tableofcontents', i)
+        i = find_token(lines,
+                       '\\begin_inset LatexCommand \\tableofcontents', i)
         if i == -1:
             break
         lines[i] = lines[i] + '{}'
         i = i + 1
 
 
-def remove_cursor(file):
-    lines = file.body
+def remove_cursor(document):
+    " Remove cursor. "
+    lines = document.body
     i = find_token(lines, '\\cursor', 0)
     if i != -1:
         del lines[i]
 
 
-def remove_vcid(file):
-    lines = file.header
+def remove_vcid(document):
+    " Remove \\lyxvcid and \\lyxrcsid. "
+    lines = document.header
     i = find_token(lines, '\\lyxvcid', 0)
     if i != -1:
         del lines[i]
@@ -120,16 +139,18 @@ def remove_vcid(file):
         del lines[i]
 
 
-def first_layout(file):
-    lines = file.body
+def first_layout(document):
+    " Fix first layout, if empty use the default layout."
+    lines = document.body
     while (lines[0] == ""):
         del lines[0]
     if lines[0][:7] != "\\layout":
-        lines[:0] = ['\\layout %s' % file.default_layout, '']
+        lines[:0] = ['\\layout %s' % document.default_layout, '']
 
 
-def remove_space_in_units(file):
-    lines = file.header
+def remove_space_in_units(document):
+    " Remove space in units. "
+    lines = document.header
     margins = ["\\topmargin","\\rightmargin",
                "\\leftmargin","\\bottommargin"]
 
@@ -148,8 +169,9 @@ def remove_space_in_units(file):
             i = i + 1
 
 
-def latexdel_getargs(file, i):
-    lines = file.body
+def latexdel_getargs(document, i):
+    " Get arguments from latexdel insets. "
+    lines = document.body
 
     # play safe, clean empty lines
     while 1:
@@ -162,10 +184,10 @@ def latexdel_getargs(file, i):
     if i == j:
         del lines[i]
     else:
-        file.warning("Unexpected end of inset.")
+        document.warning("Unexpected end of inset.")
     j = find_token(lines, '\\begin_inset LatexDel }{', i)
 
-    ref = string.join(lines[i:j])
+    ref = " ".join(lines[i:j])
     del lines[i:j + 1]
 
     # play safe, clean empty lines
@@ -178,57 +200,64 @@ def latexdel_getargs(file, i):
     if i == j:
         del lines[i]
     else:
-        file.warning("Unexpected end of inset.")
+        document.warning("Unexpected end of inset.")
     j = find_token(lines, '\\begin_inset LatexDel }', i)
-    label = string.join(lines[i:j])
+    label = " ".join(lines[i:j])
     del lines[i:j + 1]
 
     return ref, label
 
 
-def update_ref(file):
-    lines = file.body
+def update_ref(document):
+    " Update reference inset. "
+    lines = document.body
     i = 0
     while 1:
         i = find_token(lines, '\\begin_inset LatexCommand', i)
         if i == -1:
             return
 
-        if string.split(lines[i])[-1] == "\\ref{":
+        if lines[i].split()[-1] == "\\ref{":
             i = i + 1
-            ref, label = latexdel_getargs(file, i)
+            ref, label = latexdel_getargs(document, i)
             lines[i - 1] = "%s[%s]{%s}" % (lines[i - 1][:-1], ref, label)
 
         i = i + 1
 
 
-def update_latexdel(file):
-    lines = file.body
+def update_latexdel(document):
+    " Remove latexdel insets. "
+    lines = document.body
     i = 0
     latexdel_re = re.compile(r".*\\begin_inset LatexDel")
     while 1:
         i = find_re(lines, latexdel_re, i)
         if i == -1:
             return
-        lines[i] = string.replace(lines[i],'\\begin_inset LatexDel', '\\begin_inset LatexCommand')
+        lines[i] = lines[i].replace('\\begin_inset LatexDel',
+                                    '\\begin_inset LatexCommand')
 
-        j = string.find(lines[i],'\\begin_inset')
+        j = lines[i].find('\\begin_inset')
         lines.insert(i+1, lines[i][j:])
-        lines[i] = string.strip(lines[i][:j])
+        lines[i] = lines[i][:j].strip()
         i = i + 1
 
-        if string.split(lines[i])[-1] in ("\\url{", "\\htmlurl{"):
+        if lines[i].split()[-1] in ("\\url{", "\\htmlurl{"):
             i = i + 1
 
-            ref, label = latexdel_getargs(file, i)
+            ref, label = latexdel_getargs(document, i)
             lines[i -1] = "%s[%s]{%s}" % (lines[i-1][:-1], label, ref)
 
         i = i + 1
 
 
-convert = [[216, [first_layout, remove_vcid, remove_cursor, update_toc,
-                  replace_protected_separator, merge_formula_inset,
-                  update_tabular, remove_space_in_units, update_ref, update_latexdel]]]
+supported_versions = ["1.1.5","1.1.5fix1","1.1.5fix2","1.1"]
+convert = [[216, [first_layout, remove_vcid, remove_cursor,
+                  update_toc, replace_protected_separator,
+                  merge_formula_inset, update_tabular,
+                  remove_space_in_units, update_ref,
+                  update_latexdel]]]
+
 revert  = []
 
 if __name__ == "__main__":
diff --git a/lib/lyx2lyx/lyx_1_1_6.py b/lib/lyx2lyx/lyx_1_1_6_0.py
similarity index 91%
rename from lib/lyx2lyx/lyx_1_1_6.py
rename to lib/lyx2lyx/lyx_1_1_6_0.py
index 8d9773235f..56de363325 100644
--- a/lib/lyx2lyx/lyx_1_1_6.py
+++ b/lib/lyx2lyx/lyx_1_1_6_0.py
@@ -1,6 +1,6 @@
 # This file is part of lyx2lyx
-# -*- coding: iso-8859-1 -*-
-# Copyright (C) 2002-2004 José Matos <jamatos@lyx.org>
+# -*- coding: utf-8 -*-
+# Copyright (C) 2002-2004 José Matos <jamatos@lyx.org>
 #
 # This program is free software; you can redistribute it and/or
 # modify it under the terms of the GNU General Public License
@@ -16,14 +16,15 @@
 # along with this program; if not, write to the Free Software
 # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
 
+""" Convert files to the file format generated by lyx 1.1.6, until fix2"""
+
 import re
-import string
 from parser_tools import find_re, find_tokens, find_token, check_token
 
-
 lyxtable_re = re.compile(r".*\\LyXTable$")
-def update_tabular(file):
-    lines = file.body
+def update_tabular(document):
+    " Update tabular to version 1 (xml like syntax). "
+    lines = document.body
     i=0
     while 1:
         i = find_re(lines, lyxtable_re, i)
@@ -41,7 +42,7 @@ def update_tabular(file):
         i = i + 1
         lines[i] = "\\begin_inset  Tabular"
         i = i + 1
-        head = string.split(lines[i])
+        head = lines[i].split()
         rows = int(head[0])
         columns = int(head[1])
 
@@ -54,8 +55,8 @@ def update_tabular(file):
         row_info = []
         cont_row = []
         for j in range(rows):
-            row_info.append(string.split(lines[i]))
-            if string.split(lines[i])[2] == '1':
+            row_info.append(lines[i].split())
+            if lines[i].split()[2] == '1':
                 cont_row.append(j)
             del lines[i]
 
@@ -100,13 +101,13 @@ def update_tabular(file):
                     continue
 
                 if l == ncells -1:
-                    # the end variable refers to cell end, not to file end.
+                    # the end variable refers to cell end, not to document end.
                     end = find_tokens(lines, ['\\layout','\\the_end','\\end_deeper','\\end_float'], i)
                 else:
                     end = find_token(lines, '\\newline', i)
 
                 if end == -1:
-                    file.error("Malformed LyX file.")
+                    document.error("Malformed LyX file.")
 
                 end = end - i
                 while end > 0:
@@ -114,7 +115,7 @@ def update_tabular(file):
                     del lines[i]
                     end = end -1
 
-                if string.find(lines[i],'\\newline') != -1:
+                if lines[i].find('\\newline') != -1:
                     del lines[i]
                 l = l + 1
 
@@ -146,7 +147,7 @@ def update_tabular(file):
                 tmp.append('<Cell multicolumn="%s" alignment="%s" valignment="0" topline="%s" bottomline="%s" leftline="%d" rightline="%d" rotate="%s" usebox="%s" width=%s special=%s>' % (cell_info[m][0],cell_info[m][1],cell_info[m][2],cell_info[m][3],leftline,rightline,cell_info[m][5],cell_info[m][6],cell_info[m][7],cell_info[m][8]))
                 tmp.append('\\begin_inset Text')
                 tmp.append('')
-                tmp.append('\\layout %s' % file.default_layout)
+                tmp.append('\\layout %s' % document.default_layout)
                 tmp.append('')
 
                 if cell_info[m][0] != '2':
@@ -179,8 +180,8 @@ def update_tabular(file):
 
 
 prop_exp = re.compile(r"\\(\S*)\s*(\S*)")
-
 def set_paragraph_properties(lines, prop_dict):
+    " Set paragraph properties."
     # we need to preserve the order of options
     properties = ["family","series","shape","size",
                   "emph","bar","noun","latex","color"]
@@ -263,19 +264,22 @@ def set_paragraph_properties(lines, prop_dict):
     return result[:]
 
 
-def update_language(file):
-    header = file.header
+def update_language(document):
+    """ Update document language, if language is default convert it to
+    english."""
+    header = document.header
     i = find_token(header, "\\language", 0)
     if i == -1:
         # no language, should emit a warning
         header.append('\\language english')
         return
     # This is the lyx behaviour: defaults to english
-    if string.split(header[i])[1] == 'default':
+    if header[i].split()[1] == 'default':
         header[i] = '\\language english'
     return
 
 
+supported_versions = ["1.1.6","1.1.6fix1","1.1.6fix2","1.1"]
 convert = [[217, [update_tabular, update_language]]]
 revert  = []
 
diff --git a/lib/lyx2lyx/lyx_1_1_6fix3.py b/lib/lyx2lyx/lyx_1_1_6_3.py
similarity index 80%
rename from lib/lyx2lyx/lyx_1_1_6fix3.py
rename to lib/lyx2lyx/lyx_1_1_6_3.py
index f7656d796a..f0be612103 100644
--- a/lib/lyx2lyx/lyx_1_1_6fix3.py
+++ b/lib/lyx2lyx/lyx_1_1_6_3.py
@@ -1,6 +1,6 @@
 # This file is part of lyx2lyx
-# -*- coding: iso-8859-1 -*-
-# Copyright (C) 2002-2004 José Matos <jamatos@lyx.org>
+# -*- coding: utf-8 -*-
+# Copyright (C) 2002-2004 José Matos <jamatos@lyx.org>
 #
 # This program is free software; you can redistribute it and/or
 # modify it under the terms of the GNU General Public License
@@ -16,11 +16,13 @@
 # along with this program; if not, write to the Free Software
 # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
 
+""" Convert files to the file format generated by lyx 1.1.6, fix3 and fix4"""
+
 import re
-import string
 from parser_tools import find_token, find_re
 
 def bool_table(item):
+    " Convert 0, 1 to false, true."
     if item == "0":
         return "false"
     # should emit a warning if item != "1"
@@ -32,9 +34,10 @@ align_table = {"0": "top", "2": "left", "4": "right", "8": "center"}
 use_table = {"0": "none", "1": "parbox"}
 table_meta_re = re.compile(r'<LyXTabular version="?1"? rows="?(\d*)"? columns="?(\d*)"?>')
 
-def update_tabular(file):
+def update_tabular(document):
+    " Update tabular format to version 2 (xml like syntax)."
     regexp = re.compile(r'^\\begin_inset\s+Tabular')
-    lines = file.body
+    lines = document.body
     i=0
     while 1:
         i = find_re(lines, regexp, i)
@@ -51,7 +54,7 @@ def update_tabular(file):
 
         j = find_token(lines, '</LyXTabular>', i) + 1
         if j == 0:
-            file.warning( "Error: Bad lyx format i=%d j=%d" % (i,j))
+            document.warning( "Error: Bad lyx format i=%d j=%d" % (i,j))
             break
 
         new_table = table_update(lines[i:j])
@@ -65,7 +68,8 @@ features_re = re.compile(r'<features rotate="?(\d)"? islongtable="?(\d)"? endhea
 row_re = re.compile(r'<row topline="?(\d)"? bottomline="?(\d)"? newpage="?(\d)"?>')
 
 def table_update(lines):
-    lines[1] = string.replace(lines[1], '<Features', '<features')
+    " Update table's internal content to format 2."
+    lines[1] = lines[1].replace('<Features', '<features')
     res = features_re.match( lines[1] )
     if res:
         val = res.groups()
@@ -76,14 +80,14 @@ def table_update(lines):
     i = 2
     col_info = []
     while i < len(lines):
-        lines[i] = string.replace(lines[i], '<Cell', '<cell')
-        lines[i] = string.replace(lines[i], '</Cell', '</cell')
-        lines[i] = string.replace(lines[i], '<Row', '<row')
-        lines[i] = string.replace(lines[i], '</Row', '</row')
-        lines[i] = string.replace(lines[i], '<Column', '<column')
-        lines[i] = string.replace(lines[i], '</Column', '</column')
-        lines[i] = string.replace(lines[i], '</LyXTabular', '</lyxtabular')
-        k = string.find (lines[i], '<column ')
+        lines[i] = lines[i].replace('<Cell', '<cell')
+        lines[i] = lines[i].replace('</Cell', '</cell')
+        lines[i] = lines[i].replace('<Row', '<row')
+        lines[i] = lines[i].replace('</Row', '</row')
+        lines[i] = lines[i].replace('<Column', '<column')
+        lines[i] = lines[i].replace('</Column', '</column')
+        lines[i] = lines[i].replace('</LyXTabular', '</lyxtabular')
+        k = lines[i].find ('<column ')
         if k != -1:
             col_info.append(lines[i])
             del lines[i]
@@ -116,6 +120,7 @@ def table_update(lines):
     return lines[:2] + col_info + lines[2:]
 
 
+supported_versions = ["1.1.6fix3","1.1.6fix4","1.1"]
 convert = [[218, [update_tabular]]]
 revert  = []
 
diff --git a/lib/lyx2lyx/lyx_1_2.py b/lib/lyx2lyx/lyx_1_2.py
index 3ac5d9cfb9..029c852e9e 100644
--- a/lib/lyx2lyx/lyx_1_2.py
+++ b/lib/lyx2lyx/lyx_1_2.py
@@ -1,7 +1,7 @@
 # This file is part of lyx2lyx
-# -*- coding: iso-8859-1 -*-
+# -*- coding: utf-8 -*-
 # Copyright (C) 2002 Dekel Tsur <dekel@lyx.org>
-# Copyright (C) 2004 José Matos <jamatos@lyx.org>
+# Copyright (C) 2004 José Matos <jamatos@lyx.org>
 #
 # This program is free software; you can redistribute it and/or
 # modify it under the terms of the GNU General Public License
@@ -17,13 +17,86 @@
 # along with this program; if not, write to the Free Software
 # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
 
-import string
+""" Convert files to the file format generated by lyx 1.2"""
+
 import re
 
-from parser_tools import find_token, find_token_backwards, get_next_paragraph,\
-                         find_tokens, find_end_of_inset, find_re, \
-                         is_nonempty_line, get_paragraph, find_nonempty_line, \
-                         get_value, get_tabular_lines, check_token, get_layout
+from parser_tools import find_token, find_token_backwards, \
+                         find_tokens, find_tokens_backwards, \
+                         find_beginning_of, find_end_of, find_re, \
+                         is_nonempty_line, find_nonempty_line, \
+                         get_value, check_token
+
+####################################################################
+# Private helper functions
+
+def get_layout(line, default_layout):
+    " Get layout, if empty return the default layout."
+    tokens = line.split()
+    if len(tokens) > 1:
+        return tokens[1]
+    return default_layout
+
+
+def get_paragraph(lines, i, format):
+    " Finds the paragraph that contains line i."
+    begin_layout = "\\layout"
+
+    while i != -1:
+        i = find_tokens_backwards(lines, ["\\end_inset", begin_layout], i)
+        if i == -1: return -1
+        if check_token(lines[i], begin_layout):
+            return i
+        i = find_beginning_of_inset(lines, i)
+    return -1
+
+
+def get_next_paragraph(lines, i, format):
+    " Finds the paragraph after the paragraph that contains line i."
+    tokens = ["\\begin_inset", "\\layout", "\\end_float", "\\the_end"]
+
+    while i != -1:
+        i = find_tokens(lines, tokens, i)
+        if not check_token(lines[i], "\\begin_inset"):
+            return i
+        i = find_end_of_inset(lines, i)
+    return -1
+
+
+def find_beginning_of_inset(lines, i):
+    " Find beginning of inset, where lines[i] is included."
+    return find_beginning_of(lines, i, "\\begin_inset", "\\end_inset")
+
+
+def find_end_of_inset(lines, i):
+    " Finds the matching \end_inset"
+    return find_end_of(lines, i, "\\begin_inset", "\\end_inset")
+
+
+def find_end_of_tabular(lines, i):
+    " Finds the matching end of tabular."
+    return find_end_of(lines, i, "<lyxtabular", "</lyxtabular")
+
+
+def get_tabular_lines(lines, i):
+    " Returns a list of tabular line indices."
+    result = []
+    i = i+1
+    j = find_end_of_tabular(lines, i)
+    if j == -1:
+        return []
+
+    while i <= j:
+        if check_token(lines[i], "\\begin_inset"):
+            i = find_end_of_inset(lines, i)+1
+        else:
+            result.append(i)
+            i = i+1
+    return result
+
+# End of helper functions
+####################################################################
+
 
 floats = {
     "footnote": ["\\begin_inset Foot",
@@ -59,6 +132,7 @@ pextra_rexp = re.compile(r"\\pextra_type\s+(\S+)"+\
 
 
 def get_width(mo):
+    " Get width from a regular expression. "
     if mo.group(10):
         if mo.group(9) == "\\pextra_widthp":
             return mo.group(10)+"col%"
@@ -68,11 +142,9 @@ def get_width(mo):
         return "100col%"
 
 
-#
-# Change \begin_float .. \end_float into \begin_inset Float .. \end_inset
-#
-def remove_oldfloat(file):
-    lines = file.body
+def remove_oldfloat(document):
+    " Change \\begin_float .. \\end_float into \\begin_inset Float .. \\end_inset"
+    lines = document.body
     i = 0
     while 1:
         i = find_token(lines, "\\begin_float", i)
@@ -81,9 +153,9 @@ def remove_oldfloat(file):
         # There are no nested floats, so finding the end of the float is simple
         j = find_token(lines, "\\end_float", i+1)
 
-        floattype = string.split(lines[i])[1]
+        floattype = lines[i].split()[1]
         if not floats.has_key(floattype):
-            file.warning("Error! Unknown float type " + floattype)
+            document.warning("Error! Unknown float type " + floattype)
             floattype = "fig"
 
         # skip \end_deeper tokens
@@ -91,7 +163,7 @@ def remove_oldfloat(file):
         while check_token(lines[i2], "\\end_deeper"):
             i2 = i2+1
         if i2 > i+1:
-            j2 = get_next_paragraph(lines, j + 1, file.format + 1)
+            j2 = get_next_paragraph(lines, j + 1, document.format + 1)
             lines[j2:j2] = ["\\end_deeper "]*(i2-(i+1))
 
         new = floats[floattype]+[""]
@@ -116,7 +188,7 @@ def remove_oldfloat(file):
         # as extra '\foo default' commands are ignored.
         # In fact, it might be safer to output '\foo default' for all
         # font attributes.
-        k = get_paragraph(lines, i, file.format + 1)
+        k = get_paragraph(lines, i, document.format + 1)
         flag = 0
         for token in font_tokens:
             if find_token(lines, token, k, i) != -1:
@@ -126,7 +198,7 @@ def remove_oldfloat(file):
                     flag = 1
                     new.append("")
                 if token == "\\lang":
-                    new.append(token+" "+ file.language)
+                    new.append(token+" "+ document.language)
                 else:
                     new.append(token+" default ")
 
@@ -138,8 +210,9 @@ pextra_type2_rexp = re.compile(r".*\\pextra_type\s+[12]")
 pextra_type2_rexp2 = re.compile(r".*(\\layout|\\pextra_type\s+2)")
 pextra_widthp = re.compile(r"\\pextra_widthp")
 
-def remove_pextra(file):
-    lines = file.body
+def remove_pextra(document):
+    " Remove pextra token."
+    lines = document.body
     i = 0
     flag = 0
     while 1:
@@ -179,10 +252,10 @@ def remove_pextra(file):
             if hfill:
                 start = ["","\hfill",""]+start
         else:
-            start = ['\\layout %s' % file.default_layout,''] + start
+            start = ['\\layout %s' % document.default_layout,''] + start
 
         j0 = find_token_backwards(lines,"\\layout", i-1)
-        j = get_next_paragraph(lines, i, file.format + 1)
+        j = get_next_paragraph(lines, i, document.format + 1)
 
         count = 0
         while 1:
@@ -210,6 +283,7 @@ def remove_pextra(file):
 
 
 def is_empty(lines):
+    " Are all the lines empty?"
     return filter(is_nonempty_line, lines) == []
 
 
@@ -218,13 +292,14 @@ ert_rexp = re.compile(r"\\begin_inset|\\hfill|.*\\SpecialChar")
 spchar_rexp = re.compile(r"(.*)(\\SpecialChar.*)")
 
 
-def remove_oldert(file):
+def remove_oldert(document):
+    " Remove old ERT inset."
     ert_begin = ["\\begin_inset ERT",
                  "status Collapsed",
                  "",
-                 '\\layout %s' % file.default_layout,
+                 '\\layout %s' % document.default_layout,
                  ""]
-    lines = file.body
+    lines = document.body
     i = 0
     while 1:
         i = find_tokens(lines, ["\\latex latex", "\\layout LaTeX"], i)
@@ -249,7 +324,7 @@ def remove_oldert(file):
         new = []
         new2 = []
         if check_token(lines[i], "\\layout LaTeX"):
-            new = ['\layout %s' % file.default_layout, "", ""]
+            new = ['\layout %s' % document.default_layout, "", ""]
 
         k = i+1
         while 1:
@@ -331,9 +406,9 @@ def remove_oldert(file):
         del lines[i]
 
 
-# ERT insert are hidden feature of lyx 1.1.6. This might be removed in the future.
-def remove_oldertinset(file):
-    lines = file.body
+def remove_oldertinset(document):
+    " ERT insets are a hidden feature of lyx 1.1.6. This might be removed in the future."
+    lines = document.body
     i = 0
     while 1:
         i = find_token(lines, "\\begin_inset ERT", i)
@@ -341,7 +416,7 @@ def remove_oldertinset(file):
             break
         j = find_end_of_inset(lines, i)
         k = find_token(lines, "\\layout", i+1)
-        l = get_paragraph(lines, i, file.format + 1)
+        l = get_paragraph(lines, i, document.format + 1)
         if lines[k] == lines[l]: # same layout
             k = k+1
         new = lines[k:j]
@@ -349,11 +424,12 @@ def remove_oldertinset(file):
         i = i+1
 
 
-def is_ert_paragraph(file, i):
-    lines = file.body
+def is_ert_paragraph(document, i):
+    " Is this an ERT paragraph? "
+    lines = document.body
     if not check_token(lines[i], "\\layout"):
         return 0
-    if not file.is_default_layout(get_layout(lines[i], file.default_layout)):
+    if not document.is_default_layout(get_layout(lines[i], document.default_layout)):
         return 0
 
     i = find_nonempty_line(lines, i+1)
@@ -365,17 +441,18 @@ def is_ert_paragraph(file, i):
     return check_token(lines[k], "\\layout")
 
 
-def combine_ert(file):
-    lines = file.body
+def combine_ert(document):
+    " Combine ERT paragraphs."
+    lines = document.body
     i = 0
     while 1:
         i = find_token(lines, "\\begin_inset ERT", i)
         if i == -1:
             break
-        j = get_paragraph(lines, i, file.format + 1)
+        j = get_paragraph(lines, i, document.format + 1)
         count = 0
         text = []
-        while is_ert_paragraph(file, j):
+        while is_ert_paragraph(document, j):
 
             count = count+1
             i2 = find_token(lines, "\\layout", j+1)
@@ -395,20 +472,23 @@ def combine_ert(file):
 oldunits = ["pt", "cm", "in", "text%", "col%"]
 
 def get_length(lines, name, start, end):
+    " Get length."
     i = find_token(lines, name, start, end)
     if i == -1:
         return ""
-    x = string.split(lines[i])
+    x = lines[i].split()
     return x[2]+oldunits[int(x[1])]
 
 
 def write_attribute(x, token, value):
+    " Write attribute."
     if value != "":
         x.append("\t"+token+" "+value)
 
 
-def remove_figinset(file):
-    lines = file.body
+def remove_figinset(document):
+    " Remove figinset."
+    lines = document.body
     i = 0
     while 1:
         i = find_token(lines, "\\begin_inset Figure", i)
@@ -416,9 +496,9 @@ def remove_figinset(file):
             break
         j = find_end_of_inset(lines, i)
 
-        if ( len(string.split(lines[i])) > 2 ):
-            lyxwidth = string.split(lines[i])[3]+"pt"
-            lyxheight = string.split(lines[i])[4]+"pt"
+        if ( len(lines[i].split()) > 2 ):
+            lyxwidth = lines[i].split()[3]+"pt"
+            lyxheight = lines[i].split()[4]+"pt"
         else:
             lyxwidth = ""
             lyxheight = ""
@@ -476,15 +556,13 @@ def remove_figinset(file):
         lines[i:j+1] = new
 
 
-##
-# Convert tabular format 2 to 3
-#
 attr_re = re.compile(r' \w*="(false|0|)"')
 line_re = re.compile(r'<(features|column|row|cell)')
 
-def update_tabular(file):
+def update_tabular(document):
+    " Convert tabular format 2 to 3."
     regexp = re.compile(r'^\\begin_inset\s+Tabular')
-    lines = file.body
+    lines = document.body
     i = 0
     while 1:
         i = find_re(lines, regexp, i)
@@ -493,9 +571,9 @@ def update_tabular(file):
 
         for k in get_tabular_lines(lines, i):
             if check_token(lines[k], "<lyxtabular"):
-                lines[k] = string.replace(lines[k], 'version="2"', 'version="3"')
+                lines[k] = lines[k].replace('version="2"', 'version="3"')
             elif check_token(lines[k], "<column"):
-                lines[k] = string.replace(lines[k], 'width=""', 'width="0pt"')
+                lines[k] = lines[k].replace('width=""', 'width="0pt"')
 
             if line_re.match(lines[k]):
                 lines[k] = re.sub(attr_re, "", lines[k])
@@ -520,8 +598,8 @@ def update_tabular(file):
 false = 0
 true = 1
 
-# simple data structure to deal with long table info
 class row:
+    " Simple data structure to deal with long table info."
     def __init__(self):
         self.endhead = false                # header row
         self.endfirsthead = false        # first header row
@@ -530,6 +608,7 @@ class row:
 
 
 def haveLTFoot(row_info):
+    " Does any row have LTFoot?"
     for row_ in row_info:
         if row_.endfoot:
             return true
@@ -537,6 +616,7 @@ def haveLTFoot(row_info):
 
 
 def setHeaderFooterRows(hr, fhr, fr, lfr, rows_, row_info):
+    " Set Header/Footer rows."
     endfirsthead_empty = false
     endlastfoot_empty = false
     # set header info
@@ -603,7 +683,8 @@ def setHeaderFooterRows(hr, fhr, fr, lfr, rows_, row_info):
 
 
 def insert_attribute(lines, i, attribute):
-    last = string.find(lines[i],'>')
+    " Insert attribute in lines[i]."
+    last = lines[i].find('>')
     lines[i] = lines[i][:last] + ' ' + attribute + lines[i][last:]
 
 
@@ -611,9 +692,10 @@ rows_re = re.compile(r'rows="(\d*)"')
 longtable_re = re.compile(r'islongtable="(\w)"')
 ltvalues_re = re.compile(r'endhead="(-?\d*)" endfirsthead="(-?\d*)" endfoot="(-?\d*)" endlastfoot="(-?\d*)"')
 lt_features_re = re.compile(r'(endhead="-?\d*" endfirsthead="-?\d*" endfoot="-?\d*" endlastfoot="-?\d*")')
-def update_longtables(file):
+def update_longtables(document):
+    " Update longtables to new format."
     regexp = re.compile(r'^\\begin_inset\s+Tabular')
-    body = file.body
+    body = document.body
     i = 0
     while 1:
         i = find_re(body, regexp, i)
@@ -643,7 +725,7 @@ def update_longtables(file):
             # remove longtable elements from features
             features = lt_features_re.search(body[i])
             if features:
-                body[i] = string.replace(body[i], features.group(1), "")
+                body[i] = body[i].replace(features.group(1), "")
             continue
 
         row_info = row() * rows
@@ -680,9 +762,9 @@ def update_longtables(file):
             i = i + 1
 
 
-# Figure insert are hidden feature of lyx 1.1.6. This might be removed in the future.
-def fix_oldfloatinset(file):
-    lines = file.body
+def fix_oldfloatinset(document):
+    " Figure insets are a hidden feature of lyx 1.1.6. This might be removed in the future."
+    lines = document.body
     i = 0
     while 1:
         i = find_token(lines, "\\begin_inset Float ", i)
@@ -694,8 +776,9 @@ def fix_oldfloatinset(file):
         i = i+1
 
 
-def change_listof(file):
-    lines = file.body
+def change_listof(document):
+    " Change listof insets."
+    lines = document.body
     i = 0
     while 1:
         i = find_token(lines, "\\begin_inset LatexCommand \\listof", i)
@@ -706,14 +789,15 @@ def change_listof(file):
         i = i+1
 
 
-def change_infoinset(file):
-    lines = file.body
+def change_infoinset(document):
+    " Change info inset."
+    lines = document.body
     i = 0
     while 1:
         i = find_token(lines, "\\begin_inset Info", i)
         if i == -1:
             break
-        txt = string.lstrip(lines[i][18:])
+        txt = lines[i][18:].lstrip()
         new = ["\\begin_inset Note", "collapsed true", ""]
         j = find_token(lines, "\\end_inset", i)
         if j == -1:
@@ -724,8 +808,8 @@ def change_infoinset(file):
             note_lines = [txt]+note_lines
 
         for line in note_lines:
-            new = new + ['\layout %s' % file.default_layout, ""]
-            tmp = string.split(line, '\\')
+            new = new + ['\layout %s' % document.default_layout, ""]
+            tmp = line.split('\\')
             new = new + [tmp[0]]
             for x in tmp[1:]:
                 new = new + ["\\backslash ", x]
@@ -733,8 +817,9 @@ def change_infoinset(file):
         i = i+5
 
 
-def change_header(file):
-    lines = file.header
+def change_header(document):
+    " Update header."
+    lines = document.header
     i = find_token(lines, "\\use_amsmath", 0)
     if i == -1:
         return
@@ -742,6 +827,7 @@ def change_header(file):
                       "\use_numerical_citations 0"]
 
 
+supported_versions = ["1.2.%d" % i for i in range(5)] + ["1.2"]
 convert = [[220, [change_header, change_listof, fix_oldfloatinset,
                   update_tabular, update_longtables, remove_pextra,
                   remove_oldfloat, remove_figinset, remove_oldertinset,
diff --git a/lib/lyx2lyx/lyx_1_3.py b/lib/lyx2lyx/lyx_1_3.py
index acb8d9f62f..91dae09ec0 100644
--- a/lib/lyx2lyx/lyx_1_3.py
+++ b/lib/lyx2lyx/lyx_1_3.py
@@ -1,7 +1,7 @@
 # This file is part of lyx2lyx
-# -*- coding: iso-8859-1 -*-
+# -*- coding: utf-8 -*-
 # Copyright (C) 2002 Dekel Tsur <dekel@lyx.org>
-# Copyright (C) 2004 José Matos <jamatos@lyx.org>
+# Copyright (C) 2004 José Matos <jamatos@lyx.org>
 #
 # This program is free software; you can redistribute it and/or
 # modify it under the terms of the GNU General Public License
@@ -17,13 +17,26 @@
 # along with this program; if not, write to the Free Software
 # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
 
-import string
+""" Convert files to the file format generated by lyx 1.3"""
+
 import re
-from parser_tools import find_token, find_end_of_inset, get_value,\
+from parser_tools import find_token, find_end_of, get_value,\
                          find_token_exact, del_token
 
-def change_insetgraphics(file):
-    lines = file.body
+####################################################################
+# Private helper functions
+
+def find_end_of_inset(lines, i):
+    "Finds the matching \end_inset"
+    return find_end_of(lines, i, "\\begin_inset", "\\end_inset")
+
+# End of helper functions
+####################################################################
+
+
+def change_insetgraphics(document):
+    " Change inset Graphics."
+    lines = document.body
     i = 0
     while 1:
         i = find_token(lines, "\\begin_inset Graphics", i)
@@ -49,7 +62,7 @@ def change_insetgraphics(file):
         if k == -1:
             k = find_token_exact(lines, "size_kind", i, j)
         if k != -1:
-            size_type = string.split(lines[k])[1]
+            size_type = lines[k].split()[1]
             del lines[k]
             j = j-1
             if size_type in ["0", "original"]:
@@ -68,7 +81,7 @@ def change_insetgraphics(file):
         if k == -1:
             k = find_token_exact(lines, "lyxsize_kind", i, j)
         if k != -1:
-            lyxsize_type = string.split(lines[k])[1]
+            lyxsize_type = lines[k].split()[1]
             del lines[k]
             j = j-1
             j = del_token(lines, "lyxwidth", i, j)
@@ -80,8 +93,9 @@ def change_insetgraphics(file):
         i = i+1
 
 
-def change_tabular(file):
-    lines = file.body
+def change_tabular(document):
+    " Change tabular."
+    lines = document.body
     i = 0
     while 1:
         i = find_token(lines, "<column", i)
@@ -92,6 +106,7 @@ def change_tabular(file):
         i = i+1
 
 
+supported_versions = ["1.3.%d" % i for i in range(8)] + ["1.3"]
 convert = [[221, [change_insetgraphics, change_tabular]]]
 revert  = []
 
diff --git a/lib/lyx2lyx/lyx_1_4.py b/lib/lyx2lyx/lyx_1_4.py
index 28a7743d32..06c6a23e1f 100644
--- a/lib/lyx2lyx/lyx_1_4.py
+++ b/lib/lyx2lyx/lyx_1_4.py
@@ -1,7 +1,7 @@
 # This file is part of lyx2lyx
-# -*- coding: iso-8859-1 -*-
+# -*- coding: utf-8 -*-
 # Copyright (C) 2002 Dekel Tsur <dekel@lyx.org>
-# Copyright (C) 2002-2004 José Matos <jamatos@lyx.org>
+# Copyright (C) 2002-2004 José Matos <jamatos@lyx.org>
 # Copyright (C) 2004-2005 Georg Baum <Georg.Baum@post.rwth-aachen.de>
 #
 # This program is free software; you can redistribute it and/or
@@ -18,53 +18,108 @@
 # along with this program; if not, write to the Free Software
 # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
 
+""" Convert files to the file format generated by lyx 1.4"""
+
 import re
 from os import access, F_OK
 import os.path
-from parser_tools import find_token, find_end_of_inset, get_next_paragraph, \
-                         get_paragraph, get_value, del_token, is_nonempty_line,\
-                         find_tokens, find_end_of, find_token_exact, find_tokens_exact,\
-                         find_re, get_layout
+from parser_tools import check_token, find_token, \
+                         get_value, del_token, is_nonempty_line, \
+                         find_tokens, find_end_of, find_beginning_of, find_token_exact, find_tokens_exact, \
+                         find_re, find_tokens_backwards
 from sys import stdin
-from string import replace, split, find, strip, join
 
 from lyx_0_12 import update_latexaccents
 
-##
-# Remove \color default
-#
-def remove_color_default(file):
+####################################################################
+# Private helper functions
+
+def get_layout(line, default_layout):
+    " Get layout, if empty return the default layout."
+    tokens = line.split()
+    if len(tokens) > 1:
+        return tokens[1]
+    return default_layout
+
+
+def get_paragraph(lines, i, format):
+    "Finds the paragraph that contains line i."
+
+    if format < 225:
+        begin_layout = "\\layout"
+    else:
+        begin_layout = "\\begin_layout"
+    while i != -1:
+        i = find_tokens_backwards(lines, ["\\end_inset", begin_layout], i)
+        if i == -1: return -1
+        if check_token(lines[i], begin_layout):
+            return i
+        i = find_beginning_of_inset(lines, i)
+    return -1
+
+
+def find_beginning_of_inset(lines, i):
+    " Find beginning of inset, where lines[i] is included."
+    return find_beginning_of(lines, i, "\\begin_inset", "\\end_inset")
+
+
+def get_next_paragraph(lines, i, format):
+    "Finds the paragraph after the paragraph that contains line i."
+
+    if format < 225:
+        tokens = ["\\begin_inset", "\\layout", "\\end_float", "\\the_end"]
+    elif format < 236:
+        tokens = ["\\begin_inset", "\\begin_layout", "\\end_float", "\\end_document"]
+    else:
+        tokens = ["\\begin_inset", "\\begin_layout", "\\end_float", "\\end_body", "\\end_document"]
+    while i != -1:
+        i = find_tokens(lines, tokens, i)
+        if not check_token(lines[i], "\\begin_inset"):
+            return i
+        i = find_end_of_inset(lines, i)
+    return -1
+
+
+def find_end_of_inset(lines, i):
+    "Finds the matching \end_inset"
+    return find_end_of(lines, i, "\\begin_inset", "\\end_inset")
+
+# End of helper functions
+####################################################################
+
+def remove_color_default(document):
+    " Remove \color default"
     i = 0
     while 1:
-        i = find_token(file.body, "\\color default", i)
+        i = find_token(document.body, "\\color default", i)
         if i == -1:
             return
-        file.body[i] = replace(file.body[i], "\\color default",
-                           "\\color inherit")
+        document.body[i] = document.body[i].replace("\\color default",
+                                                    "\\color inherit")
 
 
-##
-# Add \end_header
-#
-def add_end_header(file):
-    file.header.append("\\end_header");
+def add_end_header(document):
+    " Add \end_header"
+    document.header.append("\\end_header");
 
 
-def rm_end_header(file):
-    i = find_token(file.header, "\\end_header", 0)
+def rm_end_header(document):
+    " Remove \end_header"
+    i = find_token(document.header, "\\end_header", 0)
     if i == -1:
         return
-    del file.header[i]
+    del document.header[i]
 
 
-def convert_amsmath(file):
-    i = find_token(file.header, "\\use_amsmath", 0)
+def convert_amsmath(document):
+    " Convert \\use_amsmath"
+    i = find_token(document.header, "\\use_amsmath", 0)
     if i == -1:
-        file.warning("Malformed LyX file: Missing '\\use_amsmath'.")
+        document.warning("Malformed LyX document: Missing '\\use_amsmath'.")
         return
-    tokens = split(file.header[i])
+    tokens = document.header[i].split()
     if len(tokens) != 2:
-        file.warning("Malformed LyX file: Could not parse line '%s'." % file.header[i])
+        document.warning("Malformed LyX document: Could not parse line '%s'." % document.header[i])
         use_amsmath = '0'
     else:
         use_amsmath = tokens[1]
@@ -72,19 +127,20 @@ def convert_amsmath(file):
     # new: 0 == off, 1 == auto, 2 == on
     # translate off -> auto, since old format 'off' means auto in reality
     if use_amsmath == '0':
-        file.header[i] = "\\use_amsmath 1"
+        document.header[i] = "\\use_amsmath 1"
     else:
-        file.header[i] = "\\use_amsmath 2"
+        document.header[i] = "\\use_amsmath 2"
 
 
-def revert_amsmath(file):
-    i = find_token(file.header, "\\use_amsmath", 0)
+def revert_amsmath(document):
+    " Revert \\use_amsmath"
+    i = find_token(document.header, "\\use_amsmath", 0)
     if i == -1:
-        file.warning("Malformed LyX file: Missing '\\use_amsmath'.")
+        document.warning("Malformed LyX document: Missing '\\use_amsmath'.")
         return
-    tokens = split(file.header[i])
+    tokens = document.header[i].split()
     if len(tokens) != 2:
-        file.warning("Malformed LyX file: Could not parse line '%s'." % file.header[i])
+        document.warning("Malformed LyX document: Could not parse line '%s'." % document.header[i])
         use_amsmath = '0'
     else:
         use_amsmath = tokens[1]
@@ -92,58 +148,61 @@ def revert_amsmath(file):
     # new: 0 == off, 1 == auto, 2 == on
     # translate auto -> off, since old format 'off' means auto in reality
     if use_amsmath == '2':
-        file.header[i] = "\\use_amsmath 1"
+        document.header[i] = "\\use_amsmath 1"
     else:
-        file.header[i] = "\\use_amsmath 0"
+        document.header[i] = "\\use_amsmath 0"
 
 
-##
-# \SpecialChar ~ -> \InsetSpace ~
-#
-def convert_spaces(file):
-    for i in range(len(file.body)):
-        file.body[i] = replace(file.body[i],"\\SpecialChar ~","\\InsetSpace ~")
+def convert_spaces(document):
+    " \SpecialChar ~ -> \InsetSpace ~"
+    for i in range(len(document.body)):
+        document.body[i] = document.body[i].replace("\\SpecialChar ~",
+                                                    "\\InsetSpace ~")
 
 
-def revert_spaces(file):
+def revert_spaces(document):
+    " \InsetSpace ~ -> \SpecialChar ~"
     regexp = re.compile(r'(.*)(\\InsetSpace\s+)(\S+)')
     i = 0
     while 1:
-        i = find_re(file.body, regexp, i)
+        i = find_re(document.body, regexp, i)
         if i == -1:
             break
-        space = regexp.match(file.body[i]).group(3)
-        prepend = regexp.match(file.body[i]).group(1)
+        space = regexp.match(document.body[i]).group(3)
+        prepend = regexp.match(document.body[i]).group(1)
         if space == '~':
-            file.body[i] = regexp.sub(prepend + '\\SpecialChar ~', file.body[i])
+            document.body[i] = regexp.sub(prepend + '\\SpecialChar ~', document.body[i])
             i = i + 1
         else:
-            file.body[i] = regexp.sub(prepend, file.body[i])
-            file.body[i+1:i+1] = ''
+            document.body[i] = regexp.sub(prepend, document.body[i])
+            document.body[i+1:i+1] = ''
             if space == "\\space":
                 space = "\\ "
-            i = insert_ert(file.body, i+1, 'Collapsed', space, file.format - 1, file.default_layout)
-
-##
-# \InsetSpace \, -> \InsetSpace \thinspace{}
-# \InsetSpace \space -> \InsetSpace \space{}
-#
-def rename_spaces(file):
-    for i in range(len(file.body)):
-        file.body[i] = replace(file.body[i],"\\InsetSpace \\space","\\InsetSpace \\space{}")
-        file.body[i] = replace(file.body[i],"\\InsetSpace \,","\\InsetSpace \\thinspace{}")
+            i = insert_ert(document.body, i+1, 'Collapsed', space, document.format - 1, document.default_layout)
 
 
-def revert_space_names(file):
-    for i in range(len(file.body)):
-        file.body[i] = replace(file.body[i],"\\InsetSpace \\space{}","\\InsetSpace \\space")
-        file.body[i] = replace(file.body[i],"\\InsetSpace \\thinspace{}","\\InsetSpace \\,")
+def rename_spaces(document):
+    """ \\InsetSpace \\, -> \\InsetSpace \\thinspace{}
+        \\InsetSpace \\space -> \\InsetSpace \\space{}"""
+    for i in range(len(document.body)):
+        document.body[i] = document.body[i].replace("\\InsetSpace \\space",
+                                                    "\\InsetSpace \\space{}")
+        document.body[i] = document.body[i].replace("\\InsetSpace \,",
+                                                    "\\InsetSpace \\thinspace{}")
+
+
+def revert_space_names(document):
+    """ \\InsetSpace \\thinspace{} -> \\InsetSpace \\,
+         \\InsetSpace \\space{} -> \\InsetSpace \\space"""
+    for i in range(len(document.body)):
+        document.body[i] = document.body[i].replace("\\InsetSpace \\space{}",
+                                                    "\\InsetSpace \\space")
+        document.body[i] = document.body[i].replace("\\InsetSpace \\thinspace{}",
+                                                    "\\InsetSpace \\,")
 
 
-##
-# equivalent to lyx::support::escape()
-#
 def lyx_support_escape(lab):
+    " Equivalent to pre-unicode lyx::support::escape()"
     hexdigit = ['0', '1', '2', '3', '4', '5', '6', '7',
                 '8', '9', 'A', 'B', 'C', 'D', 'E', 'F']
     enc = ""
@@ -158,62 +217,55 @@ def lyx_support_escape(lab):
     return enc;
 
 
-##
-# \begin_inset LatexCommand \eqref -> ERT
-#
-def revert_eqref(file):
+def revert_eqref(document):
+    "\\begin_inset LatexCommand \\eqref -> ERT"
     regexp = re.compile(r'^\\begin_inset\s+LatexCommand\s+\\eqref')
     i = 0
     while 1:
-        i = find_re(file.body, regexp, i)
+        i = find_re(document.body, regexp, i)
         if i == -1:
             break
-        eqref = lyx_support_escape(regexp.sub("", file.body[i]))
-        file.body[i:i+1] = ["\\begin_inset ERT", "status Collapsed", "",
-                            '\\layout %s' % file.default_layout, "", "\\backslash ",
+        eqref = lyx_support_escape(regexp.sub("", document.body[i]))
+        document.body[i:i+1] = ["\\begin_inset ERT", "status Collapsed", "",
+                            '\\layout %s' % document.default_layout, "", "\\backslash ",
                             "eqref" + eqref]
         i = i + 7
 
 
-##
-# BibTeX changes
-#
-def convert_bibtex(file):
-    for i in range(len(file.body)):
-        file.body[i] = replace(file.body[i],"\\begin_inset LatexCommand \\BibTeX",
-                                  "\\begin_inset LatexCommand \\bibtex")
+def convert_bibtex(document):
+    " Convert BibTeX changes."
+    for i in range(len(document.body)):
+        document.body[i] = document.body[i].replace("\\begin_inset LatexCommand \\BibTeX",
+                                                    "\\begin_inset LatexCommand \\bibtex")
 
 
-def revert_bibtex(file):
-    for i in range(len(file.body)):
-        file.body[i] = replace(file.body[i], "\\begin_inset LatexCommand \\bibtex",
-                                  "\\begin_inset LatexCommand \\BibTeX")
+def revert_bibtex(document):
+    " Revert BibTeX changes."
+    for i in range(len(document.body)):
+        document.body[i] = document.body[i].replace("\\begin_inset LatexCommand \\bibtex",
+                                                    "\\begin_inset LatexCommand \\BibTeX")
 
 
-##
-# Remove \lyxparent
-#
-def remove_insetparent(file):
+def remove_insetparent(document):
+    " Remove \lyxparent"
     i = 0
     while 1:
-        i = find_token(file.body, "\\begin_inset LatexCommand \\lyxparent", i)
+        i = find_token(document.body, "\\begin_inset LatexCommand \\lyxparent", i)
         if i == -1:
             break
-        del file.body[i:i+3]
+        del document.body[i:i+3]
 
 
-##
-#  Inset External
-#
-def convert_external(file):
+def convert_external(document):
+    " Convert inset External."
     external_rexp = re.compile(r'\\begin_inset External ([^,]*),"([^"]*)",')
     external_header = "\\begin_inset External"
     i = 0
     while 1:
-        i = find_token(file.body, external_header, i)
+        i = find_token(document.body, external_header, i)
         if i == -1:
             break
-        look = external_rexp.search(file.body[i])
+        look = external_rexp.search(document.body[i])
         args = ['','']
         if look:
             args[0] = look.group(1)
@@ -225,7 +277,7 @@ def convert_external(file):
             top = "\\begin_inset Graphics"
             if args[1]:
                 filename = "\tfilename " + args[1]
-            file.body[i:i+1] = [top, filename]
+            document.body[i:i+1] = [top, filename]
             i = i + 1
         else:
             # Convert the old External Inset format to the new.
@@ -233,137 +285,136 @@ def convert_external(file):
             template = "\ttemplate " + args[0]
             if args[1]:
                 filename = "\tfilename " + args[1]
-                file.body[i:i+1] = [top, template, filename]
+                document.body[i:i+1] = [top, template, filename]
                 i = i + 2
             else:
-                file.body[i:i+1] = [top, template]
+                document.body[i:i+1] = [top, template]
                 i = i + 1
 
 
-def revert_external_1(file):
+def revert_external_1(document):
+    " Revert inset External."
     external_header = "\\begin_inset External"
     i = 0
     while 1:
-        i = find_token(file.body, external_header, i)
+        i = find_token(document.body, external_header, i)
         if i == -1:
             break
 
-        template = split(file.body[i+1])
+        template = document.body[i+1].split()
         template.reverse()
-        del file.body[i+1]
+        del document.body[i+1]
 
-        filename = split(file.body[i+1])
+        filename = document.body[i+1].split()
         filename.reverse()
-        del file.body[i+1]
+        del document.body[i+1]
 
-        params = split(file.body[i+1])
+        params = document.body[i+1].split()
         params.reverse()
-        if file.body[i+1]: del file.body[i+1]
+        if document.body[i+1]: del document.body[i+1]
 
-        file.body[i] = file.body[i] + " " + template[0]+ ', "' + filename[0] + '", " '+ join(params[1:]) + '"'
+        document.body[i] = document.body[i] + " " + template[0]+ ', "' + filename[0] + '", " '+ " ".join(params[1:]) + '"'
         i = i + 1
 
 
-def revert_external_2(file):
+def revert_external_2(document):
+    " Revert inset External. (part II)"
     draft_token = '\tdraft'
     i = 0
     while 1:
-        i = find_token(file.body, '\\begin_inset External', i)
+        i = find_token(document.body, '\\begin_inset External', i)
         if i == -1:
             break
-        j = find_end_of_inset(file.body, i + 1)
+        j = find_end_of_inset(document.body, i + 1)
         if j == -1:
             #this should not happen
             break
-        k = find_token(file.body, draft_token, i+1, j-1)
-        if (k != -1 and len(draft_token) == len(file.body[k])):
-            del file.body[k]
+        k = find_token(document.body, draft_token, i+1, j-1)
+        if (k != -1 and len(draft_token) == len(document.body[k])):
+            del document.body[k]
         i = j + 1
 
 
-##
-# Comment
-#
-def convert_comment(file):
+def convert_comment(document):
+    " Convert \\layout comment"
     i = 0
     comment = "\\layout Comment"
     while 1:
-        i = find_token(file.body, comment, i)
+        i = find_token(document.body, comment, i)
         if i == -1:
             return
 
-        file.body[i:i+1] = ['\\layout %s' % file.default_layout,"","",
+        document.body[i:i+1] = ['\\layout %s' % document.default_layout,"","",
                         "\\begin_inset Comment",
                         "collapsed true","",
-                        '\\layout %s' % file.default_layout]
+                        '\\layout %s' % document.default_layout]
         i = i + 7
 
         while 1:
                 old_i = i
-                i = find_token(file.body, "\\layout", i)
+                i = find_token(document.body, "\\layout", i)
                 if i == -1:
-                    i = len(file.body) - 1
-                    file.body[i:i] = ["\\end_inset","",""]
+                    i = len(document.body) - 1
+                    document.body[i:i] = ["\\end_inset","",""]
                     return
 
-                j = find_token(file.body, '\\begin_deeper', old_i, i)
+                j = find_token(document.body, '\\begin_deeper', old_i, i)
                 if j == -1: j = i + 1
-                k = find_token(file.body, '\\begin_inset', old_i, i)
+                k = find_token(document.body, '\\begin_inset', old_i, i)
                 if k == -1: k = i + 1
 
                 if j < i and j < k:
                     i = j
-                    del file.body[i]
-                    i = find_end_of( file.body, i, "\\begin_deeper","\\end_deeper")
+                    del document.body[i]
+                    i = find_end_of( document.body, i, "\\begin_deeper","\\end_deeper")
                     if i == -1:
                         #This case should not happen
                         #but if this happens deal with it greacefully adding
                         #the missing \end_deeper.
-                        i = len(file.body) - 1
-                        file.body[i:i] = ["\end_deeper",""]
+                        i = len(document.body) - 1
+                        document.body[i:i] = ["\\end_deeper",""]
                         return
                     else:
-                        del file.body[i]
+                        del document.body[i]
                         continue
 
                 if k < i:
                     i = k
-                    i = find_end_of( file.body, i, "\\begin_inset","\\end_inset")
+                    i = find_end_of( document.body, i, "\\begin_inset","\\end_inset")
                     if i == -1:
                         #This case should not happen
                         #but if this happens deal with it greacefully adding
                         #the missing \end_inset.
-                        i = len(file.body) - 1
-                        file.body[i:i] = ["\\end_inset","","","\\end_inset","",""]
+                        i = len(document.body) - 1
+                        document.body[i:i] = ["\\end_inset","","","\\end_inset","",""]
                         return
                     else:
                         i = i + 1
                         continue
 
-                if find(file.body[i], comment) == -1:
-                    file.body[i:i] = ["\\end_inset"]
+                if document.body[i].find(comment) == -1:
+                    document.body[i:i] = ["\\end_inset"]
                     i = i + 1
                     break
-                file.body[i:i+1] = ['\\layout %s' % file.default_layout]
+                document.body[i:i+1] = ['\\layout %s' % document.default_layout]
                 i = i + 1
 
 
-def revert_comment(file):
+def revert_comment(document):
+    " Revert comments"
     i = 0
     while 1:
-        i = find_tokens(file.body, ["\\begin_inset Comment", "\\begin_inset Greyedout"], i)
+        i = find_tokens(document.body, ["\\begin_inset Comment", "\\begin_inset Greyedout"], i)
 
         if i == -1:
             return
-        file.body[i] = "\\begin_inset Note"
+        document.body[i] = "\\begin_inset Note"
         i = i + 1
 
 
-##
-# Add \end_layout
-#
-def add_end_layout(file):
-    i = find_token(file.body, '\\layout', 0)
+def add_end_layout(document):
+    " Add \\end_layout"
+    i = find_token(document.body, '\\layout', 0)
 
     if i == -1:
         return
@@ -372,15 +423,15 @@ def add_end_layout(file):
     struct_stack = ["\\layout"]
 
     while 1:
-        i = find_tokens(file.body, ["\\begin_inset", "\\end_inset", "\\layout",
+        i = find_tokens(document.body, ["\\begin_inset", "\\end_inset", "\\layout",
                                 "\\begin_deeper", "\\end_deeper", "\\the_end"], i)
 
         if i != -1:
-            token = split(file.body[i])[0]
+            token = document.body[i].split()[0]
         else:
-            file.warning("Truncated file.")
-            i = len(file.body)
-            file.body.insert(i, '\\the_end')
+            document.warning("Truncated document.")
+            i = len(document.body)
+            document.body.insert(i, '\\the_end')
             token = ""
 
         if token == "\\begin_inset":
@@ -391,8 +442,8 @@ def add_end_layout(file):
         if token == "\\end_inset":
             tail = struct_stack.pop()
             if tail == "\\layout":
-                file.body.insert(i,"")
-                file.body.insert(i,"\\end_layout")
+                document.body.insert(i,"")
+                document.body.insert(i,"\\end_layout")
                 i = i + 2
                 #Check if it is the correct tag
                 struct_stack.pop()
@@ -402,8 +453,8 @@ def add_end_layout(file):
         if token == "\\layout":
             tail = struct_stack.pop()
             if tail == token:
-                file.body.insert(i,"")
-                file.body.insert(i,"\\end_layout")
+                document.body.insert(i,"")
+                document.body.insert(i,"\\end_layout")
                 i = i + 3
             else:
                 struct_stack.append(tail)
@@ -412,192 +463,196 @@ def add_end_layout(file):
             continue
 
         if token == "\\begin_deeper":
-            file.body.insert(i,"")
-            file.body.insert(i,"\\end_layout")
+            document.body.insert(i,"")
+            document.body.insert(i,"\\end_layout")
             i = i + 3
+            # consecutive begin_deeper only insert one end_layout
+            while document.body[i].startswith('\\begin_deeper'):
+                i += 1
             struct_stack.append(token)
             continue
 
         if token == "\\end_deeper":
             if struct_stack[-1] == '\\layout':
-                file.body.insert(i, '\\end_layout')
+                document.body.insert(i, '\\end_layout')
                 i = i + 1
                 struct_stack.pop()
             i = i + 1
             continue
 
         #case \end_document
-        file.body.insert(i, "")
-        file.body.insert(i, "\\end_layout")
+        document.body.insert(i, "")
+        document.body.insert(i, "\\end_layout")
         return
 
 
-def rm_end_layout(file):
+def rm_end_layout(document):
+    " Remove \\end_layout"
     i = 0
     while 1:
-        i = find_token(file.body, '\\end_layout', i)
+        i = find_token(document.body, '\\end_layout', i)
 
         if i == -1:
             return
 
-        del file.body[i]
+        del document.body[i]
 
 
-##
-# Handle change tracking keywords
-#
-def insert_tracking_changes(file):
-    i = find_token(file.header, "\\tracking_changes", 0)
+def insert_tracking_changes(document):
+    " Handle change tracking keywords."
+    i = find_token(document.header, "\\tracking_changes", 0)
     if i == -1:
-        file.header.append("\\tracking_changes 0")
+        document.header.append("\\tracking_changes 0")
 
 
-def rm_tracking_changes(file):
-    i = find_token(file.header, "\\author", 0)
+def rm_tracking_changes(document):
+    " Remove change tracking keywords."
+    i = find_token(document.header, "\\author", 0)
     if i != -1:
-        del file.header[i]
+        del document.header[i]
 
-    i = find_token(file.header, "\\tracking_changes", 0)
+    i = find_token(document.header, "\\tracking_changes", 0)
     if i == -1:
         return
-    del file.header[i]
+    del document.header[i]
 
 
-def rm_body_changes(file):
+def rm_body_changes(document):
+    " Remove body changes."
     i = 0
     while 1:
-        i = find_token(file.body, "\\change_", i)
+        i = find_token(document.body, "\\change_", i)
         if i == -1:
             return
 
-        del file.body[i]
+        del document.body[i]
 
 
-##
-# \layout -> \begin_layout
-#
-def layout2begin_layout(file):
+def layout2begin_layout(document):
+    " \\layout -> \\begin_layout "
     i = 0
     while 1:
-        i = find_token(file.body, '\\layout', i)
+        i = find_token(document.body, '\\layout', i)
         if i == -1:
             return
 
-        file.body[i] = replace(file.body[i], '\\layout', '\\begin_layout')
+        document.body[i] = document.body[i].replace('\\layout', '\\begin_layout')
         i = i + 1
 
 
-def begin_layout2layout(file):
+def begin_layout2layout(document):
+    " \\begin_layout -> \\layout "
     i = 0
     while 1:
-        i = find_token(file.body, '\\begin_layout', i)
+        i = find_token(document.body, '\\begin_layout', i)
         if i == -1:
             return
 
-        file.body[i] = replace(file.body[i], '\\begin_layout', '\\layout')
+        document.body[i] = document.body[i].replace('\\begin_layout', '\\layout')
         i = i + 1
 
 
-##
-# valignment="center" -> valignment="middle"
-#
 def convert_valignment_middle(body, start, end):
+    'valignment="center" -> valignment="middle"'
     for i in range(start, end):
         if re.search('^<(column|cell) .*valignment="center".*>$', body[i]):
-            body[i] = replace(body[i], 'valignment="center"', 'valignment="middle"')
+            body[i] = body[i].replace('valignment="center"', 'valignment="middle"')
 
 
-def convert_table_valignment_middle(file):
+def convert_table_valignment_middle(document):
+    " Convert table  valignment, center -> middle"
     regexp = re.compile(r'^\\begin_inset\s+Tabular')
     i = 0
     while 1:
-        i = find_re(file.body, regexp, i)
+        i = find_re(document.body, regexp, i)
         if i == -1:
             return
-        j = find_end_of_inset(file.body, i + 1)
+        j = find_end_of_inset(document.body, i + 1)
         if j == -1:
             #this should not happen
-            convert_valignment_middle(file.body, i + 1, len(file.body))
+            convert_valignment_middle(document.body, i + 1, len(document.body))
             return
-        convert_valignment_middle(file.body, i + 1, j)
+        convert_valignment_middle(document.body, i + 1, j)
         i = j + 1
 
 
 def revert_table_valignment_middle(body, start, end):
+    " valignment, middle -> center"
     for i in range(start, end):
         if re.search('^<(column|cell) .*valignment="middle".*>$', body[i]):
-            body[i] = replace(body[i], 'valignment="middle"', 'valignment="center"')
+            body[i] = body[i].replace('valignment="middle"', 'valignment="center"')
 
 
-def revert_valignment_middle(file):
+def revert_valignment_middle(document):
+    " Convert table  valignment, middle -> center"
     regexp = re.compile(r'^\\begin_inset\s+Tabular')
     i = 0
     while 1:
-        i = find_re(file.body, regexp, i)
+        i = find_re(document.body, regexp, i)
         if i == -1:
             return
-        j = find_end_of_inset(file.body, i + 1)
+        j = find_end_of_inset(document.body, i + 1)
         if j == -1:
             #this should not happen
-            revert_table_valignment_middle(file.body, i + 1, len(file.body))
+            revert_table_valignment_middle(document.body, i + 1, len(document.body))
             return
-        revert_table_valignment_middle(file.body, i + 1, j)
+        revert_table_valignment_middle(document.body, i + 1, j)
         i = j + 1
 
 
-##
-#  \the_end -> \end_document
-#
-def convert_end_document(file):
-    i = find_token(file.body, "\\the_end", 0)
+def convert_end_document(document):
+    "\\the_end -> \\end_document"
+    i = find_token(document.body, "\\the_end", 0)
     if i == -1:
-        file.body.append("\\end_document")
+        document.body.append("\\end_document")
         return
-    file.body[i] = "\\end_document"
+    document.body[i] = "\\end_document"
 
 
-def revert_end_document(file):
-    i = find_token(file.body, "\\end_document", 0)
+def revert_end_document(document):
+    "\\end_document -> \\the_end"
+    i = find_token(document.body, "\\end_document", 0)
     if i == -1:
-        file.body.append("\\the_end")
+        document.body.append("\\the_end")
         return
-    file.body[i] = "\\the_end"
+    document.body[i] = "\\the_end"
 
 
-##
-# Convert line and page breaks
-# Old:
-#\layout Standard
-#\line_top \line_bottom \pagebreak_top \pagebreak_bottom \added_space_top xxx \added_space_bottom yyy
-#0
-#
-# New:
-#\begin layout Standard
-#
-#\newpage
-#
-#\lyxline
-#\begin_inset ERT
-#\begin layout Standard
-#\backslash
-#vspace{-1\backslash
-#parskip}
-#\end_layout
-#\end_inset
-#
-#\begin_inset VSpace xxx
-#\end_inset
-#
-#0
-#
-#\begin_inset VSpace xxx
-#\end_inset
-#\lyxline
-#
-#\newpage
-#
-#\end_layout
-def convert_breaks(file):
+def convert_breaks(document):
+    r"""
+Convert line and page breaks
+ Old:
+\layout Standard
+\line_top \line_bottom \pagebreak_top \pagebreak_bottom \added_space_top xxx \added_space_bottom yyy
+0
+
+ New:
+\begin_layout Standard
+
+\newpage
+
+\lyxline
+\begin_inset ERT
+\begin_layout Standard
+\backslash
+vspace{-1\backslash
+parskip}
+\end_layout
+\end_inset
+
+\begin_inset VSpace xxx
+\end_inset
+
+0
+
+\begin_inset VSpace yyy
+\end_inset
+\lyxline
+
+\newpage
+
+\end_layout
+    """
     par_params = ('added_space_bottom', 'added_space_top', 'align',
                  'labelwidthstring', 'line_bottom', 'line_top', 'noindent',
                  'pagebreak_bottom', 'pagebreak_top', 'paragraph_spacing',
@@ -605,28 +660,28 @@ def convert_breaks(file):
     font_attributes = ['\\family', '\\series', '\\shape', '\\emph',
                        '\\numeric', '\\bar', '\\noun', '\\color', '\\lang']
     attribute_values = ['default', 'default', 'default', 'default',
-                        'default', 'default', 'default', 'none', file.language]
+                        'default', 'default', 'default', 'none', document.language]
     i = 0
     while 1:
-        i = find_token(file.body, "\\begin_layout", i)
+        i = find_token(document.body, "\\begin_layout", i)
         if i == -1:
             return
-        layout = get_layout(file.body[i], file.default_layout)
+        layout = get_layout(document.body[i], document.default_layout)
         i = i + 1
 
         # Merge all paragraph parameters into a single line
         # We cannot check for '\\' only because paragraphs may start e.g.
         # with '\\backslash'
-        while file.body[i + 1][:1] == '\\' and split(file.body[i + 1][1:])[0] in par_params:
-            file.body[i] = file.body[i + 1] + ' ' + file.body[i]
-            del file.body[i+1]
+        while document.body[i + 1][:1] == '\\' and document.body[i + 1][1:].split()[0] in par_params:
+            document.body[i] = document.body[i + 1] + ' ' + document.body[i]
+            del document.body[i+1]
 
-        line_top   = find(file.body[i],"\\line_top")
-        line_bot   = find(file.body[i],"\\line_bottom")
-        pb_top     = find(file.body[i],"\\pagebreak_top")
-        pb_bot     = find(file.body[i],"\\pagebreak_bottom")
-        vspace_top = find(file.body[i],"\\added_space_top")
-        vspace_bot = find(file.body[i],"\\added_space_bottom")
+        line_top   = document.body[i].find("\\line_top")
+        line_bot   = document.body[i].find("\\line_bottom")
+        pb_top     = document.body[i].find("\\pagebreak_top")
+        pb_bot     = document.body[i].find("\\pagebreak_bottom")
+        vspace_top = document.body[i].find("\\added_space_top")
+        vspace_bot = document.body[i].find("\\added_space_bottom")
 
         if line_top == -1 and line_bot == -1 and pb_bot == -1 and pb_top == -1 and vspace_top == -1 and vspace_bot == -1:
             continue
@@ -638,41 +693,41 @@ def convert_breaks(file):
         # We want to avoid new paragraphs if possible becauase we want to
         # inherit font sizes.
         nonstandard = 0
-        if (not file.is_default_layout(layout) or
-            find(file.body[i],"\\align") != -1 or
-            find(file.body[i],"\\labelwidthstring") != -1 or
-            find(file.body[i],"\\noindent") != -1):
+        if (not document.is_default_layout(layout) or
+            document.body[i].find("\\align") != -1 or
+            document.body[i].find("\\labelwidthstring") != -1 or
+            document.body[i].find("\\noindent") != -1):
             nonstandard = 1
 
         # get the font size of the beginning of this paragraph, since we need
         # it for the lyxline inset
         j = i + 1
-        while not is_nonempty_line(file.body[j]):
+        while not is_nonempty_line(document.body[j]):
             j = j + 1
         size_top = ""
-        if find(file.body[j], "\\size") != -1:
-            size_top = split(file.body[j])[1]
+        if document.body[j].find("\\size") != -1:
+            size_top = document.body[j].split()[1]
 
         for tag in "\\line_top", "\\line_bottom", "\\pagebreak_top", "\\pagebreak_bottom":
-            file.body[i] = replace(file.body[i], tag, "")
+            document.body[i] = document.body[i].replace(tag, "")
 
         if vspace_top != -1:
             # the position could be change because of the removal of other
             # paragraph properties above
-            vspace_top = find(file.body[i],"\\added_space_top")
-            tmp_list = split(file.body[i][vspace_top:])
+            vspace_top = document.body[i].find("\\added_space_top")
+            tmp_list = document.body[i][vspace_top:].split()
             vspace_top_value = tmp_list[1]
-            file.body[i] = file.body[i][:vspace_top] + join(tmp_list[2:])
+            document.body[i] = document.body[i][:vspace_top] + " ".join(tmp_list[2:])
 
         if vspace_bot != -1:
             # the position could be change because of the removal of other
             # paragraph properties above
-            vspace_bot = find(file.body[i],"\\added_space_bottom")
-            tmp_list = split(file.body[i][vspace_bot:])
+            vspace_bot = document.body[i].find("\\added_space_bottom")
+            tmp_list = document.body[i][vspace_bot:].split()
             vspace_bot_value = tmp_list[1]
-            file.body[i] = file.body[i][:vspace_bot] + join(tmp_list[2:])
+            document.body[i] = document.body[i][:vspace_bot] + " ".join(tmp_list[2:])
 
-        file.body[i] = strip(file.body[i])
+        document.body[i] = document.body[i].strip()
         i = i + 1
 
         # Create an empty paragraph or paragraph fragment for line and
@@ -682,7 +737,7 @@ def convert_breaks(file):
             paragraph_above = list()
             if nonstandard:
                 # We need to create an extra paragraph for nonstandard environments
-                paragraph_above = ['\\begin_layout %s' % file.default_layout, '']
+                paragraph_above = ['\\begin_layout %s' % document.default_layout, '']
 
             if pb_top != -1:
                 paragraph_above.extend(['\\newpage ',''])
@@ -697,21 +752,21 @@ def convert_breaks(file):
                 # We can't use the vspace inset because it does not know \parskip.
                 paragraph_above.extend(['\\lyxline ', '', ''])
                 insert_ert(paragraph_above, len(paragraph_above) - 1, 'Collapsed',
-                           '\\vspace{-1\\parskip}\n', file.format + 1, file.default_layout)
+                           '\\vspace{-1\\parskip}\n', document.format + 1, document.default_layout)
                 paragraph_above.extend([''])
 
             if nonstandard:
                 paragraph_above.extend(['\\end_layout ',''])
                 # insert new paragraph above the current paragraph
-                file.body[i-2:i-2] = paragraph_above
+                document.body[i-2:i-2] = paragraph_above
             else:
                 # insert new lines at the beginning of the current paragraph
-                file.body[i:i] = paragraph_above
+                document.body[i:i] = paragraph_above
 
             i = i + len(paragraph_above)
 
         # Ensure that nested style are converted later.
-        k = find_end_of(file.body, i, "\\begin_layout", "\\end_layout")
+        k = find_end_of(document.body, i, "\\begin_layout", "\\end_layout")
 
         if k == -1:
             return
@@ -722,22 +777,22 @@ def convert_breaks(file):
             size_bot = size_top
             j = i + 1
             while j < k:
-                if find(file.body[j], "\\size") != -1:
-                    size_bot = split(file.body[j])[1]
+                if document.body[j].find("\\size") != -1:
+                    size_bot = document.body[j].split()[1]
                     j = j + 1
-                elif find(file.body[j], "\\begin_inset") != -1:
+                elif document.body[j].find("\\begin_inset") != -1:
                     # skip insets
-                    j = find_end_of_inset(file.body, j)
+                    j = find_end_of_inset(document.body, j)
                 else:
                     j = j + 1
 
             paragraph_below = list()
             if nonstandard:
                 # We need to create an extra paragraph for nonstandard environments
-                paragraph_below = ['', '\\begin_layout %s' % file.default_layout, '']
+                paragraph_below = ['', '\\begin_layout %s' % document.default_layout, '']
             else:
                 for a in range(len(font_attributes)):
-                    if find_token(file.body, font_attributes[a], i, k) != -1:
+                    if find_token(document.body, font_attributes[a], i, k) != -1:
                         paragraph_below.extend([font_attributes[a] + ' ' + attribute_values[a]])
 
             if line_bot != -1:
@@ -756,47 +811,44 @@ def convert_breaks(file):
             if nonstandard:
                 paragraph_below.extend(['\\end_layout '])
                 # insert new paragraph below the current paragraph
-                file.body[k+1:k+1] = paragraph_below
+                document.body[k+1:k+1] = paragraph_below
             else:
                 # insert new lines at the end of the current paragraph
-                file.body[k:k] = paragraph_below
+                document.body[k:k] = paragraph_below
 
 
-##
-#  Notes
-#
-def convert_note(file):
+def convert_note(document):
+    " Convert Notes. "
     i = 0
     while 1:
-        i = find_tokens(file.body, ["\\begin_inset Note",
+        i = find_tokens(document.body, ["\\begin_inset Note",
                                 "\\begin_inset Comment",
                                 "\\begin_inset Greyedout"], i)
         if i == -1:
             break
 
-        file.body[i] = file.body[i][0:13] + 'Note ' + file.body[i][13:]
+        document.body[i] = document.body[i][0:13] + 'Note ' + document.body[i][13:]
         i = i + 1
 
 
-def revert_note(file):
+def revert_note(document):
+    " Revert Notes. "
     note_header = "\\begin_inset Note "
     i = 0
     while 1:
-        i = find_token(file.body, note_header, i)
+        i = find_token(document.body, note_header, i)
         if i == -1:
             break
 
-        file.body[i] = "\\begin_inset " + file.body[i][len(note_header):]
+        document.body[i] = "\\begin_inset " + document.body[i][len(note_header):]
         i = i + 1
 
 
-##
-# Box
-#
-def convert_box(file):
+def convert_box(document):
+    " Convert Boxes. "
     i = 0
     while 1:
-        i = find_tokens(file.body, ["\\begin_inset Boxed",
+        i = find_tokens(document.body, ["\\begin_inset Boxed",
                                 "\\begin_inset Doublebox",
                                 "\\begin_inset Frameless",
                                 "\\begin_inset ovalbox",
@@ -805,29 +857,28 @@ def convert_box(file):
         if i == -1:
             break
 
-        file.body[i] = file.body[i][0:13] + 'Box ' + file.body[i][13:]
+        document.body[i] = document.body[i][0:13] + 'Box ' + document.body[i][13:]
         i = i + 1
 
 
-def revert_box(file):
+def revert_box(document):
+    " Revert Boxes."
     box_header = "\\begin_inset Box "
     i = 0
     while 1:
-        i = find_token(file.body, box_header, i)
+        i = find_token(document.body, box_header, i)
         if i == -1:
             break
 
-        file.body[i] = "\\begin_inset " + file.body[i][len(box_header):]
+        document.body[i] = "\\begin_inset " + document.body[i][len(box_header):]
         i = i + 1
 
 
-##
-# Collapse
-#
-def convert_collapsable(file):
+def convert_collapsable(document):
+    " Convert collapsed insets. "
     i = 0
     while 1:
-        i = find_tokens_exact(file.body, ["\\begin_inset Box",
+        i = find_tokens_exact(document.body, ["\\begin_inset Box",
                                 "\\begin_inset Branch",
                                 "\\begin_inset CharStyle",
                                 "\\begin_inset Float",
@@ -844,24 +895,25 @@ def convert_collapsable(file):
         # (_always_ present) then break with a warning message
         i = i + 1
         while 1:
-            if (file.body[i] == "collapsed false"):
-                file.body[i] = "status open"
+            if (document.body[i] == "collapsed false"):
+                document.body[i] = "status open"
                 break
-            elif (file.body[i] == "collapsed true"):
-                file.body[i] = "status collapsed"
+            elif (document.body[i] == "collapsed true"):
+                document.body[i] = "status collapsed"
                 break
-            elif (file.body[i][:13] == "\\begin_layout"):
-                file.warning("Malformed LyX file: Missing 'collapsed'.")
+            elif (document.body[i][:13] == "\\begin_layout"):
+                document.warning("Malformed LyX document: Missing 'collapsed'.")
                 break
             i = i + 1
 
         i = i + 1
 
 
-def revert_collapsable(file):
+def revert_collapsable(document):
+    " Revert collapsed insets. "
     i = 0
     while 1:
-        i = find_tokens_exact(file.body, ["\\begin_inset Box",
+        i = find_tokens_exact(document.body, ["\\begin_inset Box",
                                 "\\begin_inset Branch",
                                 "\\begin_inset CharStyle",
                                 "\\begin_inset Float",
@@ -878,28 +930,26 @@ def revert_collapsable(file):
         # (_always_ present) then break with a warning message
         i = i + 1
         while 1:
-            if (file.body[i] == "status open"):
-                file.body[i] = "collapsed false"
+            if (document.body[i] == "status open"):
+                document.body[i] = "collapsed false"
                 break
-            elif (file.body[i] == "status collapsed" or
-                  file.body[i] == "status inlined"):
-                file.body[i] = "collapsed true"
+            elif (document.body[i] == "status collapsed" or
+                  document.body[i] == "status inlined"):
+                document.body[i] = "collapsed true"
                 break
-            elif (file.body[i][:13] == "\\begin_layout"):
-                file.warning("Malformed LyX file: Missing 'status'.")
+            elif (document.body[i][:13] == "\\begin_layout"):
+                document.warning("Malformed LyX document: Missing 'status'.")
                 break
             i = i + 1
 
         i = i + 1
 
 
-##
-#  ERT
-#
-def convert_ert(file):
+def convert_ert(document):
+    " Convert ERT. "
     i = 0
     while 1:
-        i = find_token(file.body, "\\begin_inset ERT", i)
+        i = find_token(document.body, "\\begin_inset ERT", i)
         if i == -1:
             break
 
@@ -908,27 +958,28 @@ def convert_ert(file):
         # (_always_ present) then break with a warning message
         i = i + 1
         while 1:
-            if (file.body[i] == "status Open"):
-                file.body[i] = "status open"
+            if (document.body[i] == "status Open"):
+                document.body[i] = "status open"
                 break
-            elif (file.body[i] == "status Collapsed"):
-                file.body[i] = "status collapsed"
+            elif (document.body[i] == "status Collapsed"):
+                document.body[i] = "status collapsed"
                 break
-            elif (file.body[i] == "status Inlined"):
-                file.body[i] = "status inlined"
+            elif (document.body[i] == "status Inlined"):
+                document.body[i] = "status inlined"
                 break
-            elif (file.body[i][:13] == "\\begin_layout"):
-                file.warning("Malformed LyX file: Missing 'status'.")
+            elif (document.body[i][:13] == "\\begin_layout"):
+                document.warning("Malformed LyX document: Missing 'status'.")
                 break
             i = i + 1
 
         i = i + 1
 
 
-def revert_ert(file):
+def revert_ert(document):
+    " Revert ERT. "
     i = 0
     while 1:
-        i = find_token(file.body, "\\begin_inset ERT", i)
+        i = find_token(document.body, "\\begin_inset ERT", i)
         if i == -1:
             break
 
@@ -937,27 +988,24 @@ def revert_ert(file):
         # (_always_ present) then break with a warning message
         i = i + 1
         while 1:
-            if (file.body[i] == "status open"):
-                file.body[i] = "status Open"
+            if (document.body[i] == "status open"):
+                document.body[i] = "status Open"
                 break
-            elif (file.body[i] == "status collapsed"):
-                file.body[i] = "status Collapsed"
+            elif (document.body[i] == "status collapsed"):
+                document.body[i] = "status Collapsed"
                 break
-            elif (file.body[i] == "status inlined"):
-                file.body[i] = "status Inlined"
+            elif (document.body[i] == "status inlined"):
+                document.body[i] = "status Inlined"
                 break
-            elif (file.body[i][:13] == "\\begin_layout"):
-                file.warning("Malformed LyX file : Missing 'status'.")
+            elif (document.body[i][:13] == "\\begin_layout"):
+                document.warning("Malformed LyX document : Missing 'status'.")
                 break
             i = i + 1
 
         i = i + 1
 
 
-##
-# Minipages
-#
-def convert_minipage(file):
+def convert_minipage(document):
     """ Convert minipages to the box inset.
     We try to use the same order of arguments as lyx does.
     """
@@ -966,55 +1014,55 @@ def convert_minipage(file):
 
     i = 0
     while 1:
-        i = find_token(file.body, "\\begin_inset Minipage", i)
+        i = find_token(document.body, "\\begin_inset Minipage", i)
         if i == -1:
             return
 
-        file.body[i] = "\\begin_inset Box Frameless"
+        document.body[i] = "\\begin_inset Box Frameless"
         i = i + 1
 
         # convert old to new position using the pos list
-        if file.body[i][:8] == "position":
-            file.body[i] = 'position "%s"' % pos[int(file.body[i][9])]
+        if document.body[i][:8] == "position":
+            document.body[i] = 'position "%s"' % pos[int(document.body[i][9])]
         else:
-            file.body.insert(i, 'position "%s"' % pos[0])
+            document.body.insert(i, 'position "%s"' % pos[0])
         i = i + 1
 
-        file.body.insert(i, 'hor_pos "c"')
+        document.body.insert(i, 'hor_pos "c"')
         i = i + 1
-        file.body.insert(i, 'has_inner_box 1')
+        document.body.insert(i, 'has_inner_box 1')
         i = i + 1
 
         # convert the inner_position
-        if file.body[i][:14] == "inner_position":
-            innerpos = inner_pos[int(file.body[i][15])]
-            del file.body[i]    
+        if document.body[i][:14] == "inner_position":
+            innerpos = inner_pos[int(document.body[i][15])]
+            del document.body[i]    
         else:
             innerpos = inner_pos[0]
 
         # We need this since the new file format has a height and width
         # in a different order.
-        if file.body[i][:6] == "height":
-            height = file.body[i][6:]
+        if document.body[i][:6] == "height":
+            height = document.body[i][6:]
             # test for default value of 221 and convert it accordingly
             if height == ' "0pt"' or height == ' "0"':
                 height = ' "1pt"'
-            del file.body[i]
+            del document.body[i]
         else:
             height = ' "1pt"'
 
-        if file.body[i][:5] == "width":
-            width = file.body[i][5:]
-            del file.body[i]
+        if document.body[i][:5] == "width":
+            width = document.body[i][5:]
+            del document.body[i]
         else:
             width = ' "0"'
 
-        if file.body[i][:9] == "collapsed":
-            if file.body[i][9:] == "true":
+        if document.body[i][:9] == "collapsed":
+            if document.body[i][9:] == "true":
                 status = "collapsed"
             else:
                 status = "open"
-            del file.body[i]
+            del document.body[i]
         else:
             status = "collapsed"
 
@@ -1022,26 +1070,27 @@ def convert_minipage(file):
         if height == ' "1pt"' and innerpos == 'c':
             innerpos = 't'
 
-        file.body.insert(i, 'inner_pos "' + innerpos + '"')
+        document.body.insert(i, 'inner_pos "' + innerpos + '"')
         i = i + 1
-        file.body.insert(i, 'use_parbox 0')
+        document.body.insert(i, 'use_parbox 0')
         i = i + 1
-        file.body.insert(i, 'width' + width)
+        document.body.insert(i, 'width' + width)
         i = i + 1
-        file.body.insert(i, 'special "none"')
+        document.body.insert(i, 'special "none"')
         i = i + 1
-        file.body.insert(i, 'height' + height)
+        document.body.insert(i, 'height' + height)
         i = i + 1
-        file.body.insert(i, 'height_special "totalheight"')
+        document.body.insert(i, 'height_special "totalheight"')
         i = i + 1
-        file.body.insert(i, 'status ' + status)
+        document.body.insert(i, 'status ' + status)
         i = i + 1
 
 
-# -------------------------------------------------------------------------------------------
-# Convert backslashes and '\n' into valid ERT code, append the converted
-# text to body[i] and return the (maybe incremented) line index i
 def convert_ertbackslash(body, i, ert, format, default_layout):
+    r""" Convert backslashes and '\n' in ert into valid ERT code.
+    The converted text is appended to body[i]; the (maybe incremented)
+    line index i is returned. """
+
     for c in ert:
         if c == '\\':
             body[i] = body[i] + '\\backslash '
@@ -1059,9 +1108,10 @@ def convert_ertbackslash(body, i, ert, format, default_layout):
     return i
 
 
-# Converts lines in ERT code to LaTeX
-# The surrounding \begin_layout ... \end_layout pair must not be included
 def ert2latex(lines, format):
+    r""" Convert lines in ERT code to LaTeX.
+    The surrounding \begin_layout ... \end_layout pair must not be included. """
+
     backslash = re.compile(r'\\backslash\s*$')
     newline = re.compile(r'\\newline\s*$')
     if format <= 224:
@@ -1086,9 +1136,9 @@ def ert2latex(lines, format):
     return ert
 
 
-# get all paragraph parameters. They can be all on one line or on several lines.
-# lines[i] must be the first parameter line
 def get_par_params(lines, i):
+    """ Get all paragraph parameters. They can be all on one line or on several lines.
+    lines[i] must be the first parameter line. """
     par_params = ('added_space_bottom', 'added_space_top', 'align',
                  'labelwidthstring', 'line_bottom', 'line_top', 'noindent',
                  'pagebreak_bottom', 'pagebreak_top', 'paragraph_spacing',
@@ -1096,14 +1146,14 @@ def get_par_params(lines, i):
     # We cannot check for '\\' only because paragraphs may start e.g.
     # with '\\backslash'
     params = ''
-    while lines[i][:1] == '\\' and split(lines[i][1:])[0] in par_params:
-        params = params + ' ' + strip(lines[i])
+    while lines[i][:1] == '\\' and lines[i][1:].split()[0] in par_params:
+        params = params + ' ' + lines[i].strip()
         i = i + 1
-    return strip(params)
+    return params.strip()
 
 
-# convert LyX font size to LaTeX fontsize
 def lyxsize2latexsize(lyxsize):
+    " Convert LyX font size to LaTeX fontsize. "
     sizes = {"tiny" : "tiny", "scriptsize" : "scriptsize",
              "footnotesize" : "footnotesize", "small" : "small",
              "normal" : "normalsize", "large" : "large", "larger" : "Large",
@@ -1113,16 +1163,16 @@ def lyxsize2latexsize(lyxsize):
     return ''
 
 
-# Change vspace insets, page breaks and lyxlines to paragraph options
-# (if possible) or ERT
-def revert_breaks(file):
+def revert_breaks(document):
+    """ Change vspace insets, page breaks and lyxlines to paragraph options
+    (if possible) or ERT"""
 
     # Get default spaceamount
-    i = find_token(file.header, '\\defskip', 0)
+    i = find_token(document.header, '\\defskip', 0)
     if i == -1:
         defskipamount = 'medskip'
     else:
-        defskipamount = split(file.header[i])[1]
+        defskipamount = document.header[i].split()[1]
 
     keys = {"\\begin_inset" : "vspace", "\\lyxline" : "lyxline",
             "\\newpage" : "newpage"}
@@ -1135,31 +1185,31 @@ def revert_breaks(file):
     # Convert the insets
     i = 0
     while 1:
-        i = find_tokens(file.body, tokens, i)
+        i = find_tokens(document.body, tokens, i)
         if i == -1:
             return
 
         # Are we at the beginning of a paragraph?
         paragraph_start = 1
-        this_par = get_paragraph(file.body, i, file.format - 1)
+        this_par = get_paragraph(document.body, i, document.format - 1)
         start = this_par + 1
-        params = get_par_params(file.body, start)
+        params = get_par_params(document.body, start)
         size = "normal"
         # Paragraph parameters may be on one or more lines.
         # Find the start of the real paragraph text.
-        while file.body[start][:1] == '\\' and split(file.body[start])[0] in params:
+        while document.body[start][:1] == '\\' and document.body[start].split()[0] in params:
             start = start + 1
         for k in range(start, i):
-            if find(file.body[k], "\\size") != -1:
+            if document.body[k].find("\\size") != -1:
                 # store font size
-                size = split(file.body[k])[1]
-            elif is_nonempty_line(file.body[k]):
+                size = document.body[k].split()[1]
+            elif is_nonempty_line(document.body[k]):
                 paragraph_start = 0
                 break
         # Find the end of the real paragraph text.
-        next_par = get_next_paragraph(file.body, i, file.format - 1)
+        next_par = get_next_paragraph(document.body, i, document.format - 1)
         if next_par == -1:
-            file.warning("Malformed LyX file: Missing next paragraph.")
+            document.warning("Malformed LyX document: Missing next paragraph.")
             i = i + 1
             continue
 
@@ -1184,28 +1234,28 @@ def revert_breaks(file):
         n = 0
         k = inset_start
         while k < next_par:
-            if find_tokens(file.body, tokens, k) == k:
+            if find_tokens(document.body, tokens, k) == k:
                 # inset to convert
-                lines.append(split(file.body[k]))
+                lines.append(document.body[k].split())
                 insets.append(keys[lines[n][0]])
                 del_lines.append([k, k])
                 top.append(0)
                 sizes.append(size)
                 n = n + 1
                 inset_end = k
-            elif find(file.body[k], "\\size") != -1:
+            elif document.body[k].find("\\size") != -1:
                 # store font size
-                size = split(file.body[k])[1]
-            elif find_token(file.body, "\\begin_inset ERT", k) == k:
-                ert_begin = find_token(file.body, "\\layout", k) + 1
+                size = document.body[k].split()[1]
+            elif find_token(document.body, "\\begin_inset ERT", k) == k:
+                ert_begin = find_token(document.body, "\\layout", k) + 1
                 if ert_begin == 0:
-                    file.warning("Malformed LyX file: Missing '\\layout'.")
+                    document.warning("Malformed LyX document: Missing '\\layout'.")
                     continue
-                ert_end = find_end_of_inset(file.body, k)
+                ert_end = find_end_of_inset(document.body, k)
                 if ert_end == -1:
-                    file.warning("Malformed LyX file: Missing '\\end_inset'.")
+                    document.warning("Malformed LyX document: Missing '\\end_inset'.")
                     continue
-                ert = ert2latex(file.body[ert_begin:ert_end], file.format - 1)
+                ert = ert2latex(document.body[ert_begin:ert_end], document.format - 1)
                 if (n > 0 and insets[n - 1] == "lyxline" and
                     ert == '\\vspace{-1\\parskip}\n'):
                     # vspace ERT created by convert_breaks() for top lyxline
@@ -1217,11 +1267,11 @@ def revert_breaks(file):
                     paragraph_end = 0
                     break
             elif (n > 0 and insets[n - 1] == "vspace" and
-                  find_token(file.body, "\\end_inset", k) == k):
+                  find_token(document.body, "\\end_inset", k) == k):
                 # ignore end of vspace inset
                 del_lines[n - 1][1] = k
                 inset_end = k
-            elif is_nonempty_line(file.body[k]):
+            elif is_nonempty_line(document.body[k]):
                 paragraph_end = 0
                 break
             k = k + 1
@@ -1270,23 +1320,23 @@ def revert_breaks(file):
                 # First try to merge with the previous paragraph.
                 # We try the previous paragraph first because we would
                 # otherwise need ERT for two subsequent vspaces.
-                prev_par = get_paragraph(file.body, this_par - 1, file.format - 1) + 1
+                prev_par = get_paragraph(document.body, this_par - 1, document.format - 1) + 1
                 if prev_par > 0 and not before:
-                    prev_params = get_par_params(file.body, prev_par + 1)
+                    prev_params = get_par_params(document.body, prev_par + 1)
                     ert = 0
                     # determine font size
                     prev_size = "normal"
                     k = prev_par + 1
-                    while file.body[k][:1] == '\\' and split(file.body[k])[0] in prev_params:
+                    while document.body[k][:1] == '\\' and document.body[k].split()[0] in prev_params:
                         k = k + 1
                     while k < this_par:
-                        if find(file.body[k], "\\size") != -1:
-                            prev_size = split(file.body[k])[1]
+                        if document.body[k].find("\\size") != -1:
+                            prev_size = document.body[k].split()[1]
                             break
-                        elif find(file.body[k], "\\begin_inset") != -1:
+                        elif document.body[k].find("\\begin_inset") != -1:
                             # skip insets
-                            k = find_end_of_inset(file.body, k)
-                        elif is_nonempty_line(file.body[k]):
+                            k = find_end_of_inset(document.body, k)
+                        elif is_nonempty_line(document.body[k]):
                             break
                         k = k + 1
                     for k in range(n):
@@ -1296,25 +1346,25 @@ def revert_breaks(file):
                             break
                     if not ert:
                         for k in range(n):
-                            file.body.insert(prev_par + 1,
+                            document.body.insert(prev_par + 1,
                                              keywords_bot[insets[k]] + arguments[k])
-                        del file.body[this_par+n:next_par-1+n]
+                        del document.body[this_par+n:next_par-1+n]
                         i = this_par + n
                         continue
                 # Then try next paragraph
                 if next_par > 0 and not after:
-                    next_params = get_par_params(file.body, next_par + 1)
+                    next_params = get_par_params(document.body, next_par + 1)
                     ert = 0
-                    while file.body[k][:1] == '\\' and split(file.body[k])[0] in next_params:
+                    while document.body[k][:1] == '\\' and document.body[k].split()[0] in next_params:
                         k = k + 1
                     # determine font size
                     next_size = "normal"
                     k = next_par + 1
                     while k < this_par:
-                        if find(file.body[k], "\\size") != -1:
-                            next_size = split(file.body[k])[1]
+                        if document.body[k].find("\\size") != -1:
+                            next_size = document.body[k].split()[1]
                             break
-                        elif is_nonempty_line(file.body[k]):
+                        elif is_nonempty_line(document.body[k]):
                             break
                         k = k + 1
                     for k in range(n):
@@ -1324,9 +1374,9 @@ def revert_breaks(file):
                             break
                     if not ert:
                         for k in range(n):
-                            file.body.insert(next_par + 1,
+                            document.body.insert(next_par + 1,
                                              keywords_top[insets[k]] + arguments[k])
-                        del file.body[this_par:next_par-1]
+                        del document.body[this_par:next_par-1]
                         i = this_par
                         continue
         elif paragraph_start or paragraph_end:
@@ -1344,12 +1394,12 @@ def revert_breaks(file):
                     break
             if not ert:
                 for k in range(n):
-                    file.body.insert(this_par + 1,
+                    document.body.insert(this_par + 1,
                                      keywords[insets[k]] + arguments[k])
                     for j in range(k, n):
                         del_lines[j][0] = del_lines[j][0] + 1
                         del_lines[j][1] = del_lines[j][1] + 1
-                    del file.body[del_lines[k][0]:del_lines[k][1]+1]
+                    del document.body[del_lines[k][0]:del_lines[k][1]+1]
                     deleted = del_lines[k][1] - del_lines[k][0] + 1
                     for j in range(k + 1, n):
                         del_lines[j][0] = del_lines[j][0] - deleted
@@ -1360,8 +1410,8 @@ def revert_breaks(file):
         # Convert the first inset to ERT.
         # The others are converted in the next loop runs (if they exist)
         if insets[0] == "vspace":
-            file.body[i:i+1] = ['\\begin_inset ERT', 'status Collapsed', '',
-                                '\\layout %s' % file.default_layout, '', '\\backslash ']
+            document.body[i:i+1] = ['\\begin_inset ERT', 'status Collapsed', '',
+                                '\\layout %s' % document.default_layout, '', '\\backslash ']
             i = i + 6
             if spaceamount[0][-1] == '*':
                 spaceamount[0] = spaceamount[0][:-1]
@@ -1387,36 +1437,36 @@ def revert_breaks(file):
             # Finally output the LaTeX code
             if (spaceamount[0] == 'smallskip' or spaceamount[0] == 'medskip' or
                 spaceamount[0] == 'bigskip'   or spaceamount[0] == 'vfill'):
-                file.body.insert(i, spaceamount[0] + '{}')
+                document.body.insert(i, spaceamount[0] + '{}')
             else :
                 if keep:
-                    file.body.insert(i, 'vspace*{')
+                    document.body.insert(i, 'vspace*{')
                 else:
-                    file.body.insert(i, 'vspace{')
-                i = convert_ertbackslash(file.body, i, spaceamount[0], file.format - 1, file.default_layout)
-                file.body[i] = file.body[i] + '}'
+                    document.body.insert(i, 'vspace{')
+                i = convert_ertbackslash(document.body, i, spaceamount[0], document.format - 1, document.default_layout)
+                document.body[i] = document.body[i] + '}'
             i = i + 1
         elif insets[0] == "lyxline":
-            file.body[i] = ''
+            document.body[i] = ''
             latexsize = lyxsize2latexsize(size)
             if latexsize == '':
-                file.warning("Could not convert LyX fontsize '%s' to LaTeX font size." % size)
+                document.warning("Could not convert LyX fontsize '%s' to LaTeX font size." % size)
                 latexsize = '\\normalsize'
-            i = insert_ert(file.body, i, 'Collapsed',
+            i = insert_ert(document.body, i, 'Collapsed',
                            '\\lyxline{%s}' % latexsize,
-                           file.format - 1, file.default_layout)
+                           document.format - 1, document.default_layout)
             # We use \providecommand so that we don't get an error if native
             # lyxlines are used (LyX writes first its own preamble and then
             # the user specified one)
-            add_to_preamble(file,
+            add_to_preamble(document,
                             ['% Commands inserted by lyx2lyx for lyxlines',
                              '\\providecommand{\\lyxline}[1]{',
                              '  {#1 \\vspace{1ex} \\hrule width \\columnwidth \\vspace{1ex}}'
                              '}'])
         elif insets[0] == "newpage":
-            file.body[i] = ''
-            i = insert_ert(file.body, i, 'Collapsed', '\\newpage{}',
-                           file.format - 1, file.default_layout)
+            document.body[i] = ''
+            i = insert_ert(document.body, i, 'Collapsed', '\\newpage{}',
+                           document.format - 1, document.default_layout)
 
 
 # Convert a LyX length into a LaTeX length
@@ -1431,22 +1481,22 @@ def convert_len(len, special):
 
     # Convert LyX units to LaTeX units
     for unit in units.keys():
-        if find(len, unit) != -1:
+        if len.find(unit) != -1:
             len = '%f' % (len2value(len) / 100) + units[unit]
             break
 
     return len
 
 
-# Convert a LyX length into valid ERT code and append it to body[i]
-# Return the (maybe incremented) line index i
 def convert_ertlen(body, i, len, special, format, default_layout):
-    # Convert backslashes and insert the converted length into body
+    """ Convert a LyX length into valid ERT code and append it to body[i].
+    Backslashes are converted and the converted length is inserted into body.
+    Return the (maybe incremented) line index i. """
     return convert_ertbackslash(body, i, convert_len(len, special), format, default_layout)
 
 
-# Return the value of len without the unit in numerical form
 def len2value(len):
+    " Return the value of len without the unit in numerical form. "
     result = re.search('([+-]?[0-9.]+)', len)
     if result:
         return float(result.group(1))
@@ -1454,9 +1504,10 @@ def len2value(len):
     return 1.0
 
 
-# Convert text to ERT and insert it at body[i]
-# Return the index of the line after the inserted ERT
 def insert_ert(body, i, status, text, format, default_layout):
+    """ Convert text to ERT and insert it at body[i]
+    Return the index of the line after the inserted ERT"""
+
     body[i:i] = ['\\begin_inset ERT', 'status ' + status, '']
     i = i + 3
     if format <= 224:
@@ -1473,29 +1524,31 @@ def insert_ert(body, i, status, text, format, default_layout):
     return i
 
 
-# Add text to the preamble if it is not already there.
-# Only the first line is checked!
-def add_to_preamble(file, text):
-    if find_token(file.preamble, text[0], 0) != -1:
+def add_to_preamble(document, text):
+    """ Add text (a list of lines) to the preamble if it is not already there.
+    Only the first line of text is looked up in the preamble! """
+
+    if find_token(document.preamble, text[0], 0) != -1:
         return
 
-    file.preamble.extend(text)
+    document.preamble.extend(text)
 
 
-def convert_frameless_box(file):
+def convert_frameless_box(document):
+    " Convert frameless boxes to minipages or ERT. "
     pos = ['t', 'c', 'b']
     inner_pos = ['c', 't', 'b', 's']
     i = 0
     while 1:
-        i = find_token(file.body, '\\begin_inset Frameless', i)
+        i = find_token(document.body, '\\begin_inset Frameless', i)
         if i == -1:
             return
-        j = find_end_of_inset(file.body, i)
+        j = find_end_of_inset(document.body, i)
         if j == -1:
-            file.warning("Malformed LyX file: Missing '\\end_inset'.")
+            document.warning("Malformed LyX document: Missing '\\end_inset'.")
             i = i + 1
             continue
-        del file.body[i]
+        del document.body[i]
         j = j - 1
 
         # Gather parameters
@@ -1504,7 +1557,7 @@ def convert_frameless_box(file):
                   'special':'none', 'height':'1in',
                   'height_special':'totalheight', 'collapsed':'false'}
         for key in params.keys():
-            value = replace(get_value(file.body, key, i, j), '"', '')
+            value = get_value(document.body, key, i, j).replace('"', '')
             if value != "":
                 if key == 'position':
                     # convert new to old position: 'position "t"' -> 0
@@ -1518,7 +1571,7 @@ def convert_frameless_box(file):
                         params[key] = value
                 else:
                     params[key] = value
-                j = del_token(file.body, key, i, j)
+                j = del_token(document.body, key, i, j)
         i = i + 1
 
         # Convert to minipage or ERT?
@@ -1559,7 +1612,7 @@ def convert_frameless_box(file):
             # Otherwise we will get LaTeX errors if this document is
             # converted to format 225 or above again (LyX 1.4 uses all
             # optional arguments).
-            add_to_preamble(file,
+            add_to_preamble(document,
                 ['% Commands inserted by lyx2lyx for frameless boxes',
                  '% Save the original minipage environment',
                  '\\let\\lyxtolyxrealminipage\\minipage',
@@ -1605,10 +1658,10 @@ def convert_frameless_box(file):
             ert = ert + '\\let\\endminipage\\endlyxtolyxminipage%\n'
 
             old_i = i
-            i = insert_ert(file.body, i, 'Collapsed', ert, file.format - 1, file.default_layout)
+            i = insert_ert(document.body, i, 'Collapsed', ert, document.format - 1, document.default_layout)
             j = j + i - old_i - 1
 
-            file.body[i:i] = ['\\begin_inset Minipage',
+            document.body[i:i] = ['\\begin_inset Minipage',
                               'position %d' % params['position'],
                               'inner_position 1',
                               'height "1in"',
@@ -1620,23 +1673,23 @@ def convert_frameless_box(file):
             # Restore the original minipage environment since we may have
             # minipages inside this box.
             # Start a new paragraph because the following may be nonstandard
-            file.body[i:i] = ['\\layout %s' % file.default_layout, '', '']
+            document.body[i:i] = ['\\layout %s' % document.default_layout, '', '']
             i = i + 2
             j = j + 3
             ert = '\\let\\minipage\\lyxtolyxrealminipage%\n'
             ert = ert + '\\let\\endminipage\\lyxtolyxrealendminipage%'
             old_i = i
-            i = insert_ert(file.body, i, 'Collapsed', ert, file.format - 1, file.default_layout)
+            i = insert_ert(document.body, i, 'Collapsed', ert, document.format - 1, document.default_layout)
             j = j + i - old_i - 1
 
             # Redefine the minipage end before the inset end.
             # Start a new paragraph because the previous may be nonstandard
-            file.body[j:j] = ['\\layout %s' % file.default_layout, '', '']
+            document.body[j:j] = ['\\layout %s' % document.default_layout, '', '']
             j = j + 2
             ert = '\\let\\endminipage\\endlyxtolyxminipage'
-            j = insert_ert(file.body, j, 'Collapsed', ert, file.format - 1, file.default_layout)
+            j = insert_ert(document.body, j, 'Collapsed', ert, document.format - 1, document.default_layout)
             j = j + 1
-            file.body.insert(j, '')
+            document.body.insert(j, '')
             j = j + 1
 
             # LyX writes '%\n' after each box. Therefore we need to end our
@@ -1645,7 +1698,7 @@ def convert_frameless_box(file):
                 ert = '}%\n'
             else:
                 ert = '\\end{lyxtolyxrealminipage}%\n'
-            j = insert_ert(file.body, j, 'Collapsed', ert, file.format - 1, file.default_layout)
+            j = insert_ert(document.body, j, 'Collapsed', ert, document.format - 1, document.default_layout)
 
             # We don't need to restore the original minipage after the inset
             # end because the scope of the redefinition is the original box.
@@ -1653,7 +1706,7 @@ def convert_frameless_box(file):
         else:
 
             # Convert to minipage
-            file.body[i:i] = ['\\begin_inset Minipage',
+            document.body[i:i] = ['\\begin_inset Minipage',
                               'position %d' % params['position'],
                               'inner_position %d' % params['inner_pos'],
                               'height "' + params['height'] + '"',
@@ -1662,103 +1715,99 @@ def convert_frameless_box(file):
             i = i + 6
 
 
-def remove_branches(file):
+def remove_branches(document):
+    " Remove branches. "
     i = 0
     while 1:
-        i = find_token(file.header, "\\branch", i)
+        i = find_token(document.header, "\\branch", i)
         if i == -1:
             break
-        file.warning("Removing branch %s." % split(file.header[i])[1])
-        j = find_token(file.header, "\\end_branch", i)
+        document.warning("Removing branch %s." % document.header[i].split()[1])
+        j = find_token(document.header, "\\end_branch", i)
         if j == -1:
-            file.warning("Malformed LyX file: Missing '\\end_branch'.")
+            document.warning("Malformed LyX document: Missing '\\end_branch'.")
             break
-        del file.header[i:j+1]
+        del document.header[i:j+1]
 
     i = 0
     while 1:
-        i = find_token(file.body, "\\begin_inset Branch", i)
+        i = find_token(document.body, "\\begin_inset Branch", i)
         if i == -1:
             return
-        j = find_end_of_inset(file.body, i)
+        j = find_end_of_inset(document.body, i)
         if j == -1:
-            file.warning("Malformed LyX file: Missing '\\end_inset'.")
+            document.warning("Malformed LyX document: Missing '\\end_inset'.")
             i = i + 1
             continue
-        del file.body[i]
-        del file.body[j - 1]
+        del document.body[i]
+        del document.body[j - 1]
         # Seach for a line starting 'collapsed'
         # If, however, we find a line starting '\layout'
         # (_always_ present) then break with a warning message
         collapsed_found = 0
         while 1:
-            if (file.body[i][:9] == "collapsed"):
-                del file.body[i]
+            if (document.body[i][:9] == "collapsed"):
+                del document.body[i]
                 collapsed_found = 1
                 continue
-            elif (file.body[i][:7] == "\\layout"):
+            elif (document.body[i][:7] == "\\layout"):
                 if collapsed_found == 0:
-                    file.warning("Malformed LyX file: Missing 'collapsed'.")
+                    document.warning("Malformed LyX document: Missing 'collapsed'.")
                 # Delete this new paragraph, since it would not appear in
                 # .tex output. This avoids also empty paragraphs.
-                del file.body[i]
+                del document.body[i]
                 break
             i = i + 1
 
 
-##
-# Convert jurabib
-#
-
-def convert_jurabib(file):
-    i = find_token(file.header, '\\use_numerical_citations', 0)
+def convert_jurabib(document):
+    " Convert jurabib. "
+    i = find_token(document.header, '\\use_numerical_citations', 0)
     if i == -1:
-        file.warning("Malformed lyx file: Missing '\\use_numerical_citations'.")
+        document.warning("Malformed lyx document: Missing '\\use_numerical_citations'.")
         return
-    file.header.insert(i + 1, '\\use_jurabib 0')
+    document.header.insert(i + 1, '\\use_jurabib 0')
 
 
-def revert_jurabib(file):
-    i = find_token(file.header, '\\use_jurabib', 0)
+def revert_jurabib(document):
+    " Revert jurabib. "
+    i = find_token(document.header, '\\use_jurabib', 0)
     if i == -1:
-        file.warning("Malformed lyx file: Missing '\\use_jurabib'.")
+        document.warning("Malformed lyx document: Missing '\\use_jurabib'.")
         return
-    if get_value(file.header, '\\use_jurabib', 0) != "0":
-        file.warning("Conversion of '\\use_jurabib = 1' not yet implemented.")
+    if get_value(document.header, '\\use_jurabib', 0) != "0":
+        document.warning("Conversion of '\\use_jurabib = 1' not yet implemented.")
         # Don't remove '\\use_jurabib' so that people will get warnings by lyx
         return
-    del file.header[i]
+    del document.header[i]
 
-##
-# Convert bibtopic
-#
 
-def convert_bibtopic(file):
-    i = find_token(file.header, '\\use_jurabib', 0)
+def convert_bibtopic(document):
+    " Convert bibtopic. "
+    i = find_token(document.header, '\\use_jurabib', 0)
     if i == -1:
-        file.warning("Malformed lyx file: Missing '\\use_jurabib'.")
+        document.warning("Malformed lyx document: Missing '\\use_jurabib'.")
         return
-    file.header.insert(i + 1, '\\use_bibtopic 0')
+    document.header.insert(i + 1, '\\use_bibtopic 0')
 
 
-def revert_bibtopic(file):
-    i = find_token(file.header, '\\use_bibtopic', 0)
+def revert_bibtopic(document):
+    " Revert bibtopic. "
+    i = find_token(document.header, '\\use_bibtopic', 0)
     if i == -1:
-        file.warning("Malformed lyx file: Missing '\\use_bibtopic'.")
+        document.warning("Malformed lyx document: Missing '\\use_bibtopic'.")
         return
-    if get_value(file.header, '\\use_bibtopic', 0) != "0":
-        file.warning("Conversion of '\\use_bibtopic = 1' not yet implemented.")
+    if get_value(document.header, '\\use_bibtopic', 0) != "0":
+        document.warning("Conversion of '\\use_bibtopic = 1' not yet implemented.")
         # Don't remove '\\use_jurabib' so that people will get warnings by lyx
-    del file.header[i]
+    del document.header[i]
 
-##
-# Sideway Floats
-#
 
-def convert_float(file):
+def convert_float(document):
+    " Convert sideway floats. "
     i = 0
     while 1:
-        i = find_token_exact(file.body, '\\begin_inset Float', i)
+        i = find_token_exact(document.body, '\\begin_inset Float', i)
         if i == -1:
             return
         # Seach for a line starting 'wide'
@@ -1766,107 +1815,105 @@ def convert_float(file):
         # (_always_ present) then break with a warning message
         i = i + 1
         while 1:
-            if (file.body[i][:4] == "wide"):
-                file.body.insert(i + 1, 'sideways false')
+            if (document.body[i][:4] == "wide"):
+                document.body.insert(i + 1, 'sideways false')
                 break
-            elif (file.body[i][:13] == "\\begin_layout"):
-                file.warning("Malformed lyx file: Missing 'wide'.")
+            elif (document.body[i][:13] == "\\begin_layout"):
+                document.warning("Malformed lyx document: Missing 'wide'.")
                 break
             i = i + 1
         i = i + 1
 
 
-def revert_float(file):
+def revert_float(document):
+    " Revert sideway floats. "
     i = 0
     while 1:
-        i = find_token_exact(file.body, '\\begin_inset Float', i)
+        i = find_token_exact(document.body, '\\begin_inset Float', i)
         if i == -1:
             return
-        j = find_end_of_inset(file.body, i)
+        j = find_end_of_inset(document.body, i)
         if j == -1:
-            file.warning("Malformed lyx file: Missing '\\end_inset'.")
+            document.warning("Malformed lyx document: Missing '\\end_inset'.")
             i = i + 1
             continue
-        if get_value(file.body, 'sideways', i, j) != "false":
-            file.warning("Conversion of 'sideways true' not yet implemented.")
+        if get_value(document.body, 'sideways', i, j) != "false":
+            document.warning("Conversion of 'sideways true' not yet implemented.")
             # Don't remove 'sideways' so that people will get warnings by lyx
             i = i + 1
             continue
-        del_token(file.body, 'sideways', i, j)
+        del_token(document.body, 'sideways', i, j)
         i = i + 1
 
 
-def convert_graphics(file):
-    """ Add extension to filenames of insetgraphics if necessary.
+def convert_graphics(document):
+    """ Add extension to filenames of insetgraphics if necessary.
     """
     i = 0
     while 1:
-        i = find_token(file.body, "\\begin_inset Graphics", i)
+        i = find_token(document.body, "\\begin_inset Graphics", i)
         if i == -1:
             return
 
-        j = find_token_exact(file.body, "filename", i)
+        j = find_token_exact(document.body, "filename", i)
         if j == -1:
             return
         i = i + 1
-        filename = split(file.body[j])[1]
-        absname = os.path.normpath(os.path.join(file.dir, filename))
-        if file.input == stdin and not os.path.isabs(filename):
-            # We don't know the directory and cannot check the file.
+        filename = document.body[j].split()[1]
+        absname = os.path.normpath(os.path.join(document.dir, filename))
+        if document.input == stdin and not os.path.isabs(filename):
+            # We don't know the directory and cannot check the file.
             # We could use a heuristic and take the current directory,
-            # and we could try to find out if filename has an extension,
+            # and we could try to find out if filename has an extension,
             # but that would be just guesses and could be wrong.
-            file.warning("""Warning: Can not determine whether file
+            document.warning("""Warning: Cannot determine whether file
          %s
          needs an extension when reading from standard input.
-         You may need to correct the file manually or run
-         lyx2lyx again with the .lyx file as commandline argument.""" % filename)
+         You may need to correct the document manually or run
+         lyx2lyx again with the .lyx document as commandline argument.""" % filename)
             continue
         # This needs to be the same algorithm as in pre 233 insetgraphics
         if access(absname, F_OK):
             continue
         if access(absname + ".ps", F_OK):
-            file.body[j] = replace(file.body[j], filename, filename + ".ps")
+            document.body[j] = document.body[j].replace(filename, filename + ".ps")
             continue
         if access(absname + ".eps", F_OK):
-            file.body[j] = replace(file.body[j], filename, filename + ".eps")
+            document.body[j] = document.body[j].replace(filename, filename + ".eps")
 
 
-##
-# Convert firstname and surname from styles -> char styles
-#
-def convert_names(file):
+def convert_names(document):
     """ Convert in the docbook backend from firstname and surname style
     to charstyles.
     """
-    if file.backend != "docbook":
+    if document.backend != "docbook":
         return
 
     i = 0
 
     while 1:
-        i = find_token(file.body, "\\begin_layout Author", i)
+        i = find_token(document.body, "\\begin_layout Author", i)
         if i == -1:
             return
 
         i = i + 1
-        while file.body[i] == "":
+        while document.body[i] == "":
             i = i + 1
 
-        if file.body[i][:11] != "\\end_layout" or file.body[i+2][:13] != "\\begin_deeper":
+        if document.body[i][:11] != "\\end_layout" or document.body[i+2][:13] != "\\begin_deeper":
             i = i + 1
             continue
 
         k = i
-        i = find_end_of( file.body, i+3, "\\begin_deeper","\\end_deeper")
+        i = find_end_of( document.body, i+3, "\\begin_deeper","\\end_deeper")
         if i == -1:
             # something is really wrong, abort
-            file.warning("Missing \\end_deeper, after style Author.")
-            file.warning("Aborted attempt to parse FirstName and Surname.")
+            document.warning("Missing \\end_deeper, after style Author.")
+            document.warning("Aborted attempt to parse FirstName and Surname.")
             return
         firstname, surname = "", ""
 
-        name = file.body[k:i]
+        name = document.body[k:i]
 
         j = find_token(name, "\\begin_layout FirstName", 0)
         if j != -1:
@@ -1883,13 +1930,13 @@ def convert_names(file):
                 j = j + 1
 
         # delete name
-        del file.body[k+2:i+1]
+        del document.body[k+2:i+1]
 
-        file.body[k-1:k-1] = ["", "",
+        document.body[k-1:k-1] = ["", "",
                           "\\begin_inset CharStyle Firstname",
                           "status inlined",
                           "",
-                          '\\begin_layout %s' % file.default_layout,
+                          '\\begin_layout %s' % document.default_layout,
                           "",
                           "%s" % firstname,
                           "\end_layout",
@@ -1900,7 +1947,7 @@ def convert_names(file):
                           "\\begin_inset CharStyle Surname",
                           "status inlined",
                           "",
-                          '\\begin_layout %s' % file.default_layout,
+                          '\\begin_layout %s' % document.default_layout,
                           "",
                           "%s" % surname,
                           "\\end_layout",
@@ -1909,38 +1956,37 @@ def convert_names(file):
                           ""]
 
 
-def revert_names(file):
+def revert_names(document):
     """ Revert in the docbook backend from firstname and surname char style
     to styles.
     """
-    if file.backend != "docbook":
+    if document.backend != "docbook":
         return
 
 
-##
-#    \use_natbib 1                       \cite_engine <style>
-#    \use_numerical_citations 0     ->   where <style> is one of
-#    \use_jurabib 0                      "basic", "natbib_authoryear",
-#                                        "natbib_numerical" or "jurabib"
-def convert_cite_engine(file):
-    a = find_token(file.header, "\\use_natbib", 0)
+def convert_cite_engine(document):
+    r""" \use_natbib 1                       \cite_engine <style>
+         \use_numerical_citations 0     ->   where <style> is one of
+         \use_jurabib 0                      "basic", "natbib_authoryear", "natbib_numerical" or "jurabib" """
+
+    a = find_token(document.header, "\\use_natbib", 0)
     if a == -1:
-        file.warning("Malformed lyx file: Missing '\\use_natbib'.")
+        document.warning("Malformed lyx document: Missing '\\use_natbib'.")
         return
 
-    b = find_token(file.header, "\\use_numerical_citations", 0)
+    b = find_token(document.header, "\\use_numerical_citations", 0)
     if b == -1 or b != a+1:
-        file.warning("Malformed lyx file: Missing '\\use_numerical_citations'.")
+        document.warning("Malformed lyx document: Missing '\\use_numerical_citations'.")
         return
 
-    c = find_token(file.header, "\\use_jurabib", 0)
+    c = find_token(document.header, "\\use_jurabib", 0)
     if c == -1 or c != b+1:
-        file.warning("Malformed lyx file: Missing '\\use_jurabib'.")
+        document.warning("Malformed lyx document: Missing '\\use_jurabib'.")
         return
 
-    use_natbib = int(split(file.header[a])[1])
-    use_numerical_citations = int(split(file.header[b])[1])
-    use_jurabib = int(split(file.header[c])[1])
+    use_natbib = int(document.header[a].split()[1])
+    use_numerical_citations = int(document.header[b].split()[1])
+    use_jurabib = int(document.header[c].split()[1])
 
     cite_engine = "basic"
     if use_natbib:
@@ -1951,17 +1997,18 @@ def convert_cite_engine(file):
     elif use_jurabib:
         cite_engine = "jurabib"
 
-    del file.header[a:c+1]
-    file.header.insert(a, "\\cite_engine " + cite_engine)
+    del document.header[a:c+1]
+    document.header.insert(a, "\\cite_engine " + cite_engine)
 
 
-def revert_cite_engine(file):
-    i = find_token(file.header, "\\cite_engine", 0)
+def revert_cite_engine(document):
+    " Revert the cite engine. "
+    i = find_token(document.header, "\\cite_engine", 0)
     if i == -1:
-        file.warning("Malformed lyx file: Missing '\\cite_engine'.")
+        document.warning("Malformed lyx document: Missing '\\cite_engine'.")
         return
 
-    cite_engine = split(file.header[i])[1]
+    cite_engine = document.header[i].split()[1]
 
     use_natbib = '0'
     use_numerical = '0'
@@ -1974,83 +2021,81 @@ def revert_cite_engine(file):
     elif cite_engine == "jurabib":
         use_jurabib = '1'
 
-    del file.header[i]
-    file.header.insert(i, "\\use_jurabib " + use_jurabib)
-    file.header.insert(i, "\\use_numerical_citations " + use_numerical)
-    file.header.insert(i, "\\use_natbib " + use_natbib)
+    del document.header[i]
+    document.header.insert(i, "\\use_jurabib " + use_jurabib)
+    document.header.insert(i, "\\use_numerical_citations " + use_numerical)
+    document.header.insert(i, "\\use_natbib " + use_natbib)
 
 
-##
-# Paper package
-#
-def convert_paperpackage(file):
-    i = find_token(file.header, "\\paperpackage", 0)
+def convert_paperpackage(document):
+    " Convert paper package. "
+    i = find_token(document.header, "\\paperpackage", 0)
     if i == -1:
         return
 
     packages = {'default':'none','a4':'none', 'a4wide':'a4', 'widemarginsa4':'a4wide'}
-    if len(split(file.header[i])) > 1:
-        paperpackage = split(file.header[i])[1]
-        file.header[i] = replace(file.header[i], paperpackage, packages[paperpackage])
+    if len(document.header[i].split()) > 1:
+        paperpackage = document.header[i].split()[1]
+        document.header[i] = document.header[i].replace(paperpackage, packages[paperpackage])
     else:
-        file.header[i] = file.header[i] + ' widemarginsa4'
+        document.header[i] = document.header[i] + ' widemarginsa4'
 
 
-def revert_paperpackage(file):
-    i = find_token(file.header, "\\paperpackage", 0)
+def revert_paperpackage(document):
+    " Revert paper package. "
+    i = find_token(document.header, "\\paperpackage", 0)
     if i == -1:
         return
 
     packages = {'none':'a4', 'a4':'a4wide', 'a4wide':'widemarginsa4',
                 'widemarginsa4':'', 'default': 'default'}
-    if len(split(file.header[i])) > 1:
-        paperpackage = split(file.header[i])[1]
+    if len(document.header[i].split()) > 1:
+        paperpackage = document.header[i].split()[1]
     else:
         paperpackage = 'default'
-    file.header[i] = replace(file.header[i], paperpackage, packages[paperpackage])
+    document.header[i] = document.header[i].replace(paperpackage, packages[paperpackage])
 
 
-##
-# Bullets
-#
-def convert_bullets(file):
+def convert_bullets(document):
+    " Convert bullets. "
     i = 0
     while 1:
-        i = find_token(file.header, "\\bullet", i)
+        i = find_token(document.header, "\\bullet", i)
         if i == -1:
             return
-        if file.header[i][:12] == '\\bulletLaTeX':
-            file.header[i] = file.header[i] + ' ' + strip(file.header[i+1])
+        if document.header[i][:12] == '\\bulletLaTeX':
+            document.header[i] = document.header[i] + ' ' + document.header[i+1].strip()
             n = 3
         else:
-            file.header[i] = file.header[i] + ' ' + strip(file.header[i+1]) +\
-                        ' ' + strip(file.header[i+2]) + ' ' + strip(file.header[i+3])
+            document.header[i] = document.header[i] + ' ' + document.header[i+1].strip() +\
+                        ' ' + document.header[i+2].strip() + ' ' + document.header[i+3].strip()
             n = 5
-        del file.header[i+1:i + n]
+        del document.header[i+1:i + n]
         i = i + 1
 
 
-def revert_bullets(file):
+def revert_bullets(document):
+    " Revert bullets. "
     i = 0
     while 1:
-        i = find_token(file.header, "\\bullet", i)
+        i = find_token(document.header, "\\bullet", i)
         if i == -1:
             return
-        if file.header[i][:12] == '\\bulletLaTeX':
-            n = find(file.header[i], '"')
+        if document.header[i][:12] == '\\bulletLaTeX':
+            n = document.header[i].find('"')
             if n == -1:
-                file.warning("Malformed header.")
+                document.warning("Malformed header.")
                 return
             else:
-                file.header[i:i+1] = [file.header[i][:n-1],'\t' + file.header[i][n:], '\\end_bullet']
+                document.header[i:i+1] = [document.header[i][:n-1],'\t' + document.header[i][n:], '\\end_bullet']
             i = i + 3
         else:
-            frag = split(file.header[i])
+            frag = document.header[i].split()
             if len(frag) != 5:
-                file.warning("Malformed header.")
+                document.warning("Malformed header.")
                 return
             else:
-                file.header[i:i+1] = [frag[0] + ' ' + frag[1],
+                document.header[i:i+1] = [frag[0] + ' ' + frag[1],
                                  '\t' + frag[2],
                                  '\t' + frag[3],
                                  '\t' + frag[4],
@@ -2058,149 +2103,142 @@ def revert_bullets(file):
                 i = i + 5
 
 
-##
-# \begin_header and \begin_document
-#
-def add_begin_header(file):
-    i = find_token(file.header, '\\lyxformat', 0)
-    file.header.insert(i+1, '\\begin_header')
-    file.header.insert(i+1, '\\begin_document')
+def add_begin_header(document):
+    r" Add \begin_header and \begin_document. "
+    i = find_token(document.header, '\\lyxformat', 0)
+    document.header.insert(i+1, '\\begin_header')
+    document.header.insert(i+1, '\\begin_document')
 
 
-def remove_begin_header(file):
-    i = find_token(file.header, "\\begin_document", 0)
+def remove_begin_header(document):
+    r" Remove \begin_header and \begin_document. "
+    i = find_token(document.header, "\\begin_document", 0)
     if i != -1:
-        del file.header[i]
-    i = find_token(file.header, "\\begin_header", 0)
+        del document.header[i]
+    i = find_token(document.header, "\\begin_header", 0)
     if i != -1:
-        del file.header[i]
+        del document.header[i]
 
 
-##
-# \begin_file.body and \end_file.body
-#
-def add_begin_body(file):
-    file.body.insert(0, '\\begin_body')
-    file.body.insert(1, '')
-    i = find_token(file.body, "\\end_document", 0)
-    file.body.insert(i, '\\end_body')
+def add_begin_body(document):
+    r" Add \begin_body and \end_body"
+    document.body.insert(0, '\\begin_body')
+    document.body.insert(1, '')
+    i = find_token(document.body, "\\end_document", 0)
+    document.body.insert(i, '\\end_body')
 
-def remove_begin_body(file):
-    i = find_token(file.body, "\\begin_body", 0)
+def remove_begin_body(document):
+    r" Remove \begin_body and \end_body"
+    i = find_token(document.body, "\\begin_body", 0)
     if i != -1:
-        del file.body[i]
-        if not file.body[i]:
-            del file.body[i]
-    i = find_token(file.body, "\\end_body", 0)
+        del document.body[i]
+        if not document.body[i]:
+            del document.body[i]
+    i = find_token(document.body, "\\end_body", 0)
     if i != -1:
-        del file.body[i]
+        del document.body[i]
 
 
-##
-# \papersize
-#
-def normalize_papersize(file):
-    i = find_token(file.header, '\\papersize', 0)
+def normalize_papersize(document):
+    r" Normalize \papersize"
+    i = find_token(document.header, '\\papersize', 0)
     if i == -1:
         return
 
-    tmp = split(file.header[i])
+    tmp = document.header[i].split()
     if tmp[1] == "Default":
-        file.header[i] = '\\papersize default'
+        document.header[i] = '\\papersize default'
         return
     if tmp[1] == "Custom":
-        file.header[i] = '\\papersize custom'
+        document.header[i] = '\\papersize custom'
 
 
-def denormalize_papersize(file):
-    i = find_token(file.header, '\\papersize', 0)
+def denormalize_papersize(document):
+    r" Revert \papersize"
+    i = find_token(document.header, '\\papersize', 0)
     if i == -1:
         return
 
-    tmp = split(file.header[i])
+    tmp = document.header[i].split()
     if tmp[1] == "custom":
-        file.header[i] = '\\papersize Custom'
+        document.header[i] = '\\papersize Custom'
 
 
-##
-# Strip spaces at end of command line
-#
-def strip_end_space(file):
-    for i in range(len(file.body)):
-        if file.body[i][:1] == '\\':
-            file.body[i] = strip(file.body[i])
+def strip_end_space(document):
+    " Strip spaces at end of command line. "
+    for i in range(len(document.body)):
+        if document.body[i][:1] == '\\':
+            document.body[i] = document.body[i].strip()
 
 
-##
-# Use boolean values for \use_geometry, \use_bibtopic and \tracking_changes
-#
-def use_x_boolean(file):
+def use_x_boolean(document):
+    r" Use boolean values for \use_geometry, \use_bibtopic and \tracking_changes"
     bin2bool = {'0': 'false', '1': 'true'}
     for use in '\\use_geometry', '\\use_bibtopic', '\\tracking_changes':
-        i = find_token(file.header, use, 0)
+        i = find_token(document.header, use, 0)
         if i == -1:
             continue
-        decompose = split(file.header[i])
-        file.header[i] = decompose[0] + ' ' + bin2bool[decompose[1]]
+        decompose = document.header[i].split()
+        document.header[i] = decompose[0] + ' ' + bin2bool[decompose[1]]
 
 
-def use_x_binary(file):
+def use_x_binary(document):
+    r" Use digit values for \use_geometry, \use_bibtopic and \tracking_changes"
     bool2bin = {'false': '0', 'true': '1'}
     for use in '\\use_geometry', '\\use_bibtopic', '\\tracking_changes':
-        i = find_token(file.header, use, 0)
+        i = find_token(document.header, use, 0)
         if i == -1:
             continue
-        decompose = split(file.header[i])
-        file.header[i] = decompose[0] + ' ' + bool2bin[decompose[1]]
+        decompose = document.header[i].split()
+        document.header[i] = decompose[0] + ' ' + bool2bin[decompose[1]]
 
-##
-# Place all the paragraph parameters in their own line
-#
-def normalize_paragraph_params(file):
-    body = file.body
-    allowed_parameters = '\\paragraph_spacing', '\\noindent', '\\align', '\\labelwidthstring', "\\start_of_appendix", "\\leftindent"
+
+def normalize_paragraph_params(document):
+    " Place all the paragraph parameters in their own line. "
+    body = document.body
+    
+    allowed_parameters = '\\paragraph_spacing', '\\noindent', \
+                         '\\align', '\\labelwidthstring', "\\start_of_appendix", \
+                         "\\leftindent"
 
     i = 0
     while 1:
-        i = find_token(file.body, '\\begin_layout', i)
+        i = find_token(document.body, '\\begin_layout', i)
         if i == -1:
             return
 
         i = i + 1
         while 1:
-            if strip(body[i]) and split(body[i])[0] not in allowed_parameters:
+            if body[i].strip() and body[i].split()[0] not in allowed_parameters:
                 break
 
-            j = find(body[i],'\\', 1)
+            j = body[i].find('\\', 1)
 
             if j != -1:
-                body[i:i+1] = [strip(body[i][:j]), body[i][j:]]
+                body[i:i+1] = [body[i][:j].strip(), body[i][j:]]
 
             i = i + 1
 
 
-##
-# Add/remove output_changes parameter
-#
-def convert_output_changes (file):
-    i = find_token(file.header, '\\tracking_changes', 0)
+def convert_output_changes (document):
+    " Add output_changes parameter. "
+    i = find_token(document.header, '\\tracking_changes', 0)
     if i == -1:
-        file.warning("Malformed lyx file: Missing '\\tracking_changes'.")
+        document.warning("Malformed lyx document: Missing '\\tracking_changes'.")
         return
-    file.header.insert(i+1, '\\output_changes true')
+    document.header.insert(i+1, '\\output_changes true')
 
 
-def revert_output_changes (file):
-    i = find_token(file.header, '\\output_changes', 0)
+def revert_output_changes (document):
+    " Remove output_changes parameter. "
+    i = find_token(document.header, '\\output_changes', 0)
     if i == -1:
         return
-    del file.header[i]
+    del document.header[i]
 
 
-##
-# Convert paragraph breaks and sanitize paragraphs
-#
-def convert_ert_paragraphs(file):
+def convert_ert_paragraphs(document):
+    " Convert paragraph breaks and sanitize paragraphs. "
     forbidden_settings = [
                           # paragraph parameters
                           '\\paragraph_spacing', '\\labelwidthstring',
@@ -2212,30 +2250,30 @@ def convert_ert_paragraphs(file):
                           '\\color', '\\lang']
     i = 0
     while 1:
-        i = find_token(file.body, '\\begin_inset ERT', i)
+        i = find_token(document.body, '\\begin_inset ERT', i)
         if i == -1:
             return
-        j = find_end_of_inset(file.body, i)
+        j = find_end_of_inset(document.body, i)
         if j == -1:
-            file.warning("Malformed lyx file: Missing '\\end_inset'.")
+            document.warning("Malformed lyx document: Missing '\\end_inset'.")
             i = i + 1
             continue
 
         # convert non-standard paragraphs to standard
         k = i
         while 1:
-            k = find_token(file.body, "\\begin_layout", k, j)
+            k = find_token(document.body, "\\begin_layout", k, j)
             if k == -1:
                 break
-            file.body[k] = '\\begin_layout %s' % file.default_layout
+            document.body[k] = '\\begin_layout %s' % document.default_layout
             k = k + 1
 
         # remove all paragraph parameters and font settings
         k = i
         while k < j:
-            if (strip(file.body[k]) and
-                split(file.body[k])[0] in forbidden_settings):
-                del file.body[k]
+            if (document.body[k].strip() and
+                document.body[k].split()[0] in forbidden_settings):
+                del document.body[k]
                 j = j - 1
             else:
                 k = k + 1
@@ -2244,14 +2282,14 @@ def convert_ert_paragraphs(file):
         k = i
         first_pagraph = 1
         while 1:
-            k = find_token(file.body, "\\begin_layout", k, j)
+            k = find_token(document.body, "\\begin_layout", k, j)
             if k == -1:
                 break
             if first_pagraph:
                 first_pagraph = 0
                 k = k + 1
                 continue
-            file.body[k:k] = ['\\begin_layout %s' % file.default_layout, "",
+            document.body[k:k] = ['\\begin_layout %s' % document.default_layout, "",
                               "\\end_layout", ""]
             k = k + 5
             j = j + 4
@@ -2259,63 +2297,61 @@ def convert_ert_paragraphs(file):
         # convert \\newline to new paragraph
         k = i
         while 1:
-            k = find_token(file.body, "\\newline", k, j)
+            k = find_token(document.body, "\\newline", k, j)
             if k == -1:
                 break
-            file.body[k:k+1] = ["\\end_layout", "", '\\begin_layout %s' % file.default_layout]
-            k = k + 4
-            j = j + 3
-            # We need an empty line if file.default_layout == ''
-            if file.body[k-1] != '':
-                file.body.insert(k-1, '')
+            document.body[k:k+1] = ["\\end_layout", "", '\\begin_layout %s' % document.default_layout]
+            k = k + 3
+            j = j + 2
+            # We need an empty line if document.default_layout == ''
+            if document.body[k] != '':
+                document.body.insert(k, '')
                 k = k + 1
                 j = j + 1
         i = i + 1
 
 
-##
-# Remove double paragraph breaks
-#
-def revert_ert_paragraphs(file):
+def revert_ert_paragraphs(document):
+    " Remove double paragraph breaks. "
     i = 0
     while 1:
-        i = find_token(file.body, '\\begin_inset ERT', i)
+        i = find_token(document.body, '\\begin_inset ERT', i)
         if i == -1:
             return
-        j = find_end_of_inset(file.body, i)
+        j = find_end_of_inset(document.body, i)
         if j == -1:
-            file.warning("Malformed lyx file: Missing '\\end_inset'.")
+            document.warning("Malformed lyx document: Missing '\\end_inset'.")
             i = i + 1
             continue
 
         # replace paragraph breaks with \newline
         k = i
         while 1:
-            k = find_token(file.body, "\\end_layout", k, j)
-            l = find_token(file.body, "\\begin_layout", k, j)
+            k = find_token(document.body, "\\end_layout", k, j)
+            l = find_token(document.body, "\\begin_layout", k, j)
             if k == -1 or l == -1:
                 break
-            file.body[k:l+1] = ["\\newline"]
+            document.body[k:l+1] = ["\\newline"]
             j = j - l + k
             k = k + 1
 
         # replace double \newlines with paragraph breaks
         k = i
         while 1:
-            k = find_token(file.body, "\\newline", k, j)
+            k = find_token(document.body, "\\newline", k, j)
             if k == -1:
                 break
             l = k + 1
-            while file.body[l] == "":
+            while document.body[l] == "":
                 l = l + 1
-            if strip(file.body[l]) and split(file.body[l])[0] == "\\newline":
-                file.body[k:l+1] = ["\\end_layout", "",
-                                    '\\begin_layout %s' % file.default_layout]
+            if document.body[l].strip() and document.body[l].split()[0] == "\\newline":
+                document.body[k:l+1] = ["\\end_layout", "",
+                                    '\\begin_layout %s' % document.default_layout]
                 j = j - l + k + 2
                 k = k + 3
-                # We need an empty line if file.default_layout == ''
-                if file.body[l+1] != '':
-                    file.body.insert(l+1, '')
+                # We need an empty line if document.default_layout == ''
+                if document.body[l+1] != '':
+                    document.body.insert(l+1, '')
                     k = k + 1
                     j = j + 1
             else:
@@ -2323,32 +2359,34 @@ def revert_ert_paragraphs(file):
         i = i + 1
 
 
-def convert_french(file):
+def convert_french(document):
+    " Convert frenchb. "
     regexp = re.compile(r'^\\language\s+frenchb')
-    i = find_re(file.header, regexp, 0)
+    i = find_re(document.header, regexp, 0)
     if i != -1:
-        file.header[i] = "\\language french"
+        document.header[i] = "\\language french"
 
     # Change language in the document body
     regexp = re.compile(r'^\\lang\s+frenchb')
     i = 0
     while 1:
-        i = find_re(file.body, regexp, i)
+        i = find_re(document.body, regexp, i)
         if i == -1:
             break
-        file.body[i] = "\\lang french"
+        document.body[i] = "\\lang french"
         i = i + 1
 
 
-def remove_paperpackage(file):
-    i = find_token(file.header, '\\paperpackage', 0)
+def remove_paperpackage(document):
+    " Remove paper package. "
+    i = find_token(document.header, '\\paperpackage', 0)
 
     if i == -1:
         return
 
-    paperpackage = split(file.header[i])[1]
+    paperpackage = document.header[i].split()[1]
 
-    del file.header[i]
+    del document.header[i]
 
     if paperpackage not in ("a4", "a4wide", "widemarginsa4"):
         return
@@ -2356,45 +2394,46 @@ def remove_paperpackage(file):
     conv = {"a4":"\\usepackage{a4}","a4wide": "\\usepackage{a4wide}",
             "widemarginsa4": "\\usepackage[widemargins]{a4}"}
     # for compatibility we ensure it is the first entry in preamble
-    file.preamble[0:0] = [conv[paperpackage]]
+    document.preamble[0:0] = [conv[paperpackage]]
 
-    i = find_token(file.header, '\\papersize', 0)
+    i = find_token(document.header, '\\papersize', 0)
     if i != -1:
-        file.header[i] = "\\papersize default"
+        document.header[i] = "\\papersize default"
 
 
-def remove_quotestimes(file):
-    i = find_token(file.header, '\\quotes_times', 0)
+def remove_quotestimes(document):
+    " Remove quotestimes. "
+    i = find_token(document.header, '\\quotes_times', 0)
     if i == -1:
         return
-    del file.header[i]
+    del document.header[i]
 
 
-##
-# Convert SGML paragraphs
-#
-def convert_sgml_paragraphs(file):
-    if file.backend != "docbook":
+def convert_sgml_paragraphs(document):
+    " Convert SGML paragraphs. "
+    if document.backend != "docbook":
         return
 
     i = 0
     while 1:
-        i = find_token(file.body, "\\begin_layout SGML", i)
+        i = find_token(document.body, "\\begin_layout SGML", i)
 
         if i == -1:
             return
 
-        file.body[i] = "\\begin_layout Standard"
-        j = find_token(file.body, "\\end_layout", i)
+        document.body[i] = "\\begin_layout Standard"
+        j = find_token(document.body, "\\end_layout", i)
 
-        file.body[j+1:j+1] = ['','\\end_inset','','','\\end_layout']
-        file.body[i+1:i+1] = ['\\begin_inset ERT','status inlined','','\\begin_layout Standard','']
+        document.body[j+1:j+1] = ['','\\end_inset','','','\\end_layout']
+        document.body[i+1:i+1] = ['\\begin_inset ERT','status inlined','','\\begin_layout Standard','']
 
         i = i + 10
+
 ##
 # Convertion hub
 #
 
+supported_versions = ["1.4.%d" % i for i in range(3)] + ["1.4"]
 convert = [[222, [insert_tracking_changes, add_end_header, convert_amsmath]],
            [223, [remove_color_default, convert_spaces, convert_bibtex, remove_insetparent]],
            [224, [convert_external, convert_comment]],
diff --git a/lib/lyx2lyx/lyx_1_5.py b/lib/lyx2lyx/lyx_1_5.py
new file mode 100644
index 0000000000..77c80b242e
--- /dev/null
+++ b/lib/lyx2lyx/lyx_1_5.py
@@ -0,0 +1,2080 @@
+# This file is part of lyx2lyx
+# -*- coding: utf-8 -*-
+# Copyright (C) 2006 José Matos <jamatos@lyx.org>
+# Copyright (C) 2004-2006 Georg Baum <Georg.Baum@post.rwth-aachen.de>
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
+
+""" Convert files to the file format generated by lyx 1.5"""
+
+import re
+import unicodedata
+import sys, os
+
+from parser_tools import find_re, find_token, find_token_backwards, find_token_exact, find_tokens, find_end_of, get_value, find_beginning_of, find_nonempty_line
+from LyX import get_encoding
+
+
+####################################################################
+# Private helper functions
+
+def find_end_of_inset(lines, i):
+    " Find end of inset, where lines[i] is included."
+    return find_end_of(lines, i, "\\begin_inset", "\\end_inset")
+
+def find_end_of_layout(lines, i):
+    " Find end of layout, where lines[i] is included."
+    return find_end_of(lines, i, "\\begin_layout", "\\end_layout")
+
+def find_beginning_of_layout(lines, i):
+    "Find beginning of layout, where lines[i] is included."
+    return find_beginning_of(lines, i, "\\begin_layout", "\\end_layout")
+
+# End of helper functions
+####################################################################
+
+
+##
+#  Notes: Framed/Shaded
+#
+
+def revert_framed(document):
+    " Turn framed and shaded notes back into plain notes. "
+    # Both variants are reverted to the same plain inset header.
+    tokens = ["\\begin_inset Note Framed", "\\begin_inset Note Shaded"]
+    pos = find_tokens(document.body, tokens, 0)
+
+    while pos != -1:
+        document.body[pos] = "\\begin_inset Note"
+        # Resume the search on the line after the one just rewritten.
+        pos = find_tokens(document.body, tokens, pos + 1)
+
+
+##
+#  Fonts
+#
+
+roman_fonts      = {'default' : 'default', 'ae'       : 'ae',
+                    'times'   : 'times',   'palatino' : 'palatino',
+                    'helvet'  : 'default', 'avant'    : 'default',
+                    'newcent' : 'newcent', 'bookman'  : 'bookman',
+                    'pslatex' : 'times'}
+sans_fonts       = {'default' : 'default', 'ae'       : 'default',
+                    'times'   : 'default', 'palatino' : 'default',
+                    'helvet'  : 'helvet',  'avant'    : 'avant',
+                    'newcent' : 'default', 'bookman'  : 'default',
+                    'pslatex' : 'helvet'}
+typewriter_fonts = {'default' : 'default', 'ae'       : 'default',
+                    'times'   : 'default', 'palatino' : 'default',
+                    'helvet'  : 'default', 'avant'    : 'default',
+                    'newcent' : 'default', 'bookman'  : 'default',
+                    'pslatex' : 'courier'}
+
+def convert_font_settings(document):
+    " Replace the \\fontscheme header line by the individual \\font_* settings. "
+    pos = find_token_exact(document.header, "\\fontscheme", 0)
+    if pos == -1:
+        document.warning("Malformed LyX document: Missing `\\fontscheme'.")
+        return
+    scheme = get_value(document.header, "\\fontscheme", pos, pos + 1)
+    if scheme == '':
+        document.warning("Malformed LyX document: Empty `\\fontscheme'.")
+        scheme = 'default'
+    if scheme not in roman_fonts:
+        document.warning("Malformed LyX document: Unknown `\\fontscheme' `%s'." % scheme)
+        scheme = 'default'
+    replacement = ['\\font_roman %s' % roman_fonts[scheme],
+                   '\\font_sans %s' % sans_fonts[scheme],
+                   '\\font_typewriter %s' % typewriter_fonts[scheme],
+                   '\\font_default_family default',
+                   '\\font_sc false',
+                   '\\font_osf false',
+                   '\\font_sf_scale 100',
+                   '\\font_tt_scale 100']
+    document.header[pos:pos+1] = replacement
+
+
+def revert_font_settings(document):
+    " Revert the \\font_* header settings to one \\fontscheme line plus preamble code. "
+    i = 0
+    insert_line = -1
+    fonts = {'roman' : 'default', 'sans' : 'default', 'typewriter' : 'default'}
+    for family in 'roman', 'sans', 'typewriter':
+        name = '\\font_%s' % family
+        i = find_token_exact(document.header, name, i)
+        if i == -1:
+            document.warning("Malformed LyX document: Missing `%s'." % name)
+            i = 0
+        else:
+            if (insert_line < 0):
+                insert_line = i # \fontscheme goes where the first \font_* line was
+            fonts[family] = get_value(document.header, name, i, i + 1)
+            del document.header[i]
+    i = find_token_exact(document.header, '\\font_default_family', i)
+    if i == -1:
+        document.warning("Malformed LyX document: Missing `\\font_default_family'.")
+        font_default_family = 'default'
+    else:
+        font_default_family = get_value(document.header, "\\font_default_family", i, i + 1)
+        del document.header[i]
+    i = find_token_exact(document.header, '\\font_sc', i)
+    if i == -1:
+        document.warning("Malformed LyX document: Missing `\\font_sc'.")
+        font_sc = 'false'
+    else:
+        font_sc = get_value(document.header, '\\font_sc', i, i + 1)
+        del document.header[i]
+    if font_sc != 'false':
+        document.warning("Conversion of '\\font_sc' not yet implemented.")
+    i = find_token_exact(document.header, '\\font_osf', i)
+    if i == -1:
+        document.warning("Malformed LyX document: Missing `\\font_osf'.")
+        font_osf = 'false'
+    else:
+        font_osf = get_value(document.header, '\\font_osf', i, i + 1)
+        del document.header[i]
+    i = find_token_exact(document.header, '\\font_sf_scale', i)
+    if i == -1:
+        document.warning("Malformed LyX document: Missing `\\font_sf_scale'.")
+        font_sf_scale = '100'
+    else:
+        font_sf_scale = get_value(document.header, '\\font_sf_scale', i, i + 1)
+        del document.header[i]
+    if font_sf_scale != '100':
+        document.warning("Conversion of '\\font_sf_scale' not yet implemented.")
+    i = find_token_exact(document.header, '\\font_tt_scale', i)
+    if i == -1:
+        document.warning("Malformed LyX document: Missing `\\font_tt_scale'.")
+        font_tt_scale = '100'
+    else:
+        font_tt_scale = get_value(document.header, '\\font_tt_scale', i, i + 1)
+        del document.header[i]
+    if font_tt_scale != '100':
+        document.warning("Conversion of '\\font_tt_scale' not yet implemented.")
+    # First try to express the three families as one of the old font schemes.
+    for font_scheme in roman_fonts.keys():
+        if (roman_fonts[font_scheme] == fonts['roman'] and
+            sans_fonts[font_scheme] == fonts['sans'] and
+            typewriter_fonts[font_scheme] == fonts['typewriter']):
+            document.header.insert(insert_line, '\\fontscheme %s' % font_scheme)
+            if font_default_family != 'default':
+                document.preamble.append('\\renewcommand{\\familydefault}{\\%s}' % font_default_family)
+            if font_osf == 'true':
+                document.warning("Ignoring `\\font_osf = true'")
+            return
+    font_scheme = 'default' # no scheme matches: emulate the fonts in the preamble
+    document.header.insert(insert_line, '\\fontscheme %s' % font_scheme)
+    if fonts['roman'] == 'cmr':
+        document.preamble.append('\\renewcommand{\\rmdefault}{cmr}')
+        if font_osf == 'true':
+            document.preamble.append('\\usepackage{eco}')
+            font_osf = 'false'
+    for font in 'lmodern', 'charter', 'utopia', 'beraserif', 'ccfonts', 'chancery':
+        if fonts['roman'] == font:
+            document.preamble.append('\\usepackage{%s}' % font)
+    for font in 'cmss', 'lmss', 'cmbr':
+        if fonts['sans'] == font:
+            document.preamble.append('\\renewcommand{\\sfdefault}{%s}' % font)
+    for font in ('berasans',): # a tuple: a bare string is iterated character by character
+        if fonts['sans'] == font:
+            document.preamble.append('\\usepackage{%s}' % font)
+    for font in 'cmtt', 'lmtt', 'cmtl':
+        if fonts['typewriter'] == font:
+            document.preamble.append('\\renewcommand{\\ttdefault}{%s}' % font)
+    for font in 'courier', 'beramono', 'luximono':
+        if fonts['typewriter'] == font:
+            document.preamble.append('\\usepackage{%s}' % font)
+    if font_default_family != 'default':
+        document.preamble.append('\\renewcommand{\\familydefault}{\\%s}' % font_default_family)
+    if font_osf == 'true':
+        document.warning("Ignoring `\\font_osf = true'")
+
+
+def revert_booktabs(document):
+    " Remove the booktabs flag and extra row spacing, or everything else will become a mess. "
+    re_row = re.compile(r'^<row.*space="[^"]+".*>$')
+    re_tspace = re.compile(r'\s+topspace="[^"]+"')
+    re_bspace = re.compile(r'\s+bottomspace="[^"]+"')
+    re_ispace = re.compile(r'\s+interlinespace="[^"]+"')
+    i = 0
+    while 1:
+        i = find_token(document.body, "\\begin_inset Tabular", i)
+        if i == -1:
+            return
+        j = find_end_of_inset(document.body, i + 1)
+        if j == -1:
+            document.warning("Malformed LyX document: Could not find end of tabular.")
+            i = i + 1 # skip this inset, otherwise it is found again forever
+            continue
+        for k in range(i, j):
+            if re.search('^<features.* booktabs="true".*>$', document.body[k]):
+                document.warning("Converting 'booktabs' table to normal table.")
+                document.body[k] = document.body[k].replace(' booktabs="true"', '')
+            if re_row.search(document.body[k]):
+                document.warning("Removing extra row space.")
+                for re_space in re_tspace, re_bspace, re_ispace:
+                    document.body[k] = re_space.sub('', document.body[k])
+        i = i + 1
+
+
+def convert_multiencoding(document, forward):
+    """ Fix files with multiple encodings.
+Files with an inputencoding of "auto" or "default" and multiple languages
+where at least two languages have different default encodings are encoded
+in multiple encodings for file formats < 249. These files are incorrectly
+read and written (as if the whole file was in the encoding of the main
+language).
+This is not true for files written by CJK-LyX, they are always in the locale
+encoding.
+
+This function
+- converts from fake unicode values to true unicode if forward is true, and
+- converts from true unicode values to fake unicode if forward is false.
+document.encoding must be set to the old value (format 248) in both cases.
+
+We do this here and not in LyX.py because it is far easier to do the
+necessary parsing in modern formats than in ancient ones.
+"""
+    inset_types = ["Foot", "Note"]
+    if document.cjk_encoding != '':
+        return
+    encoding_stack = [document.encoding]
+    insets = []
+    lang_re = re.compile(r"^\\lang\s(\S+)")
+    inset_re = re.compile(r"^\\begin_inset\s(\S+)")
+    if not forward: # no need to read file unless we are reverting
+        spec_chars = read_unicodesymbols()
+
+    if document.inputencoding == "auto" or document.inputencoding == "default":
+        i = 0
+        while i < len(document.body):
+            result = lang_re.match(document.body[i])
+            if result:
+                language = result.group(1)
+                if language == "default":
+                    document.warning("Resetting encoding from %s to %s." % (encoding_stack[-1], document.encoding), 3)
+                    encoding_stack[-1] = document.encoding
+                else:
+                    from lyx2lyx_lang import lang
+                    document.warning("Setting encoding from %s to %s." % (encoding_stack[-1], lang[language][3]), 3)
+                    encoding_stack[-1] = lang[language][3]
+            elif find_token(document.body, "\\begin_layout", i, i + 1) == i:
+                document.warning("Adding nested encoding %s." % encoding_stack[-1], 3)
+                if len(insets) > 0 and insets[-1] in inset_types:
+                    from lyx2lyx_lang import lang
+                    encoding_stack.append(lang[document.language][3])
+                else:
+                    encoding_stack.append(encoding_stack[-1])
+            elif find_token(document.body, "\\end_layout", i, i + 1) == i:
+                document.warning("Removing nested encoding %s." % encoding_stack[-1], 3)
+                if len(encoding_stack) == 1:
+                    # Don't remove the document encoding from the stack
+                    document.warning("Malformed LyX document: Unexpected `\\end_layout'.")
+                else:
+                    del encoding_stack[-1]
+            elif find_token(document.body, "\\begin_inset", i, i + 1) == i:
+                inset_result = inset_re.match(document.body[i])
+                if inset_result:
+                    insets.append(inset_result.group(1))
+                else:
+                    insets.append("")
+            elif find_token(document.body, "\\end_inset", i, i + 1) == i:
+                del insets[-1:] # slice deletion: no error on a stray \end_inset
+            if encoding_stack[-1] != document.encoding:
+                if forward:
+                    # This line has been incorrectly interpreted as if it was
+                    # encoded in 'encoding'.
+                    # Convert back to the 8bit string that was in the file.
+                    orig = document.body[i].encode(document.encoding)
+                    # Convert the 8bit string that was in the file to unicode
+                    # with the correct encoding.
+                    document.body[i] = orig.decode(encoding_stack[-1])
+                else:
+                    try:
+                        # Convert unicode to the 8bit string that will be written
+                        # to the file with the correct encoding.
+                        orig = document.body[i].encode(encoding_stack[-1])
+                        # Convert the 8bit string that will be written to the
+                        # file to fake unicode with the encoding that will later
+                        # be used when writing to the file.
+                        document.body[i] = orig.decode(document.encoding)
+                    except (UnicodeError, LookupError):
+                        new_lines = revert_unicode_line(document, i, insets, spec_chars).split('\n')
+                        document.body[i:i+1] = new_lines
+                        i += len(new_lines) - 1
+            i += 1
+
+
+def convert_utf8(document):
+    " Fix the multiple encodings of the body, then set document encoding to UTF-8. "
+    convert_multiencoding(document, True)
+    document.encoding = "utf8"
+
+
+def revert_utf8(document):
+    " Set document encoding to the value corresponding to inputencoding. "
+    i = find_token(document.header, "\\inputencoding", 0)
+    if i == -1:
+        document.header.append("\\inputencoding auto")
+    elif get_value(document.header, "\\inputencoding", i) == "utf8":
+        document.header[i] = "\\inputencoding auto" # utf8 is replaced by auto in the header
+    document.inputencoding = get_value(document.header, "\\inputencoding", 0)
+    document.encoding = get_encoding(document.language, document.inputencoding, 248, document.cjk_encoding) # 248: convert_multiencoding needs the old encoding
+    convert_multiencoding(document, False)
+
+
+def read_unicodesymbols():
+    " Read the unicodesymbols list of unicode characters and corresponding commands."
+    pathname = os.path.abspath(os.path.dirname(sys.argv[0]))
+    # NOTE(review): str.strip() removes a set of characters, not the suffix 'lyx2lyx'
+    fp = open(os.path.join(pathname.strip('lyx2lyx'), 'unicodesymbols'))
+    spec_chars = {}
+    for line in fp.readlines():
+        if line[0] != '#':
+            line = line.replace(' "', ' ').replace('" ', ' ') # remove quotation marks next to spaces
+            line = line.replace(r'\"', '"') # replace \" by " (for characters with diaeresis)
+            try:
+                # flag1 and flag2 are preamble and other flags
+                [ucs4, command, flag1, flag2] = line.split(None, 3)
+                spec_chars[unichr(int(ucs4, 0))] = [command, flag1, flag2] # int(), not eval(): never execute file content
+            except ValueError:
+                pass # blank or malformed line
+    fp.close()
+    return spec_chars
+
+
+def revert_unicode_line(document, i, insets, spec_chars, replacement_character = '???'):
+    """ Return body line i with characters that can not be written in
+document.encoding replaced by their spec_chars command or by
+replacement_character. May remove the last character of body line i-1."""
+    # Define strings to start and end ERT and math insets
+    ert_intro='\n\n\\begin_inset ERT\nstatus collapsed\n\\begin_layout %s\n\\backslash\n' % document.default_layout
+    ert_outro='\n\\end_layout\n\n\\end_inset\n'
+    math_intro='\n\\begin_inset Formula $'
+    math_outro='$\n\\end_inset'
+
+    mod_line = u''
+    if i and not is_inset_line(document, i-1):
+        last_char = document.body[i - 1][-1:]
+    else:
+        last_char = ''
+
+    line = document.body[i]
+    for character in line:
+        try:
+            # Try to write the character
+            character.encode(document.encoding)
+            mod_line += character
+            last_char = character
+        except (UnicodeError, LookupError):
+            # Try to replace with ERT/math inset
+            if character in spec_chars:
+                command, flag1, flag2 = spec_chars[character] # the command to replace unicode, and its flags
+                if flag1.find('combining') > -1 or flag2.find('combining') > -1:
+                    # We have a character that should be combined with the previous
+                    command += '{' + last_char + '}'
+                    # Remove the last character. Ignore if it is whitespace
+                    if len(last_char.rstrip()):
+                        # last_char was found and is not whitespace
+                        if mod_line:
+                            mod_line = mod_line[:-1]
+                        else: # last_char belongs to the last line
+                            document.body[i-1] = document.body[i-1][:-1]
+                    else:
+                        # The last character was replaced by a command. For now it is ignored. This could be handled better.
+                        pass
+                if command[0:2] == '\\\\':
+                    if command[2:12]=='ensuremath':
+                        if insets and insets[-1] == "ERT":
+                            # math in ERT
+                            command = command.replace('\\\\ensuremath{\\\\', '$\n\\backslash\n')
+                            command = command.replace('}', '$\n')
+                        elif not insets or insets[-1] != "Formula":
+                            # add a math inset with the replacement character
+                            command = command.replace('\\\\ensuremath{\\', math_intro)
+                            command = command.replace('}', math_outro)
+                        else:
+                            # we are already in a math inset
+                            command = command.replace('\\\\ensuremath{\\', '')
+                            command = command.replace('}', '')
+                    else:
+                        if insets and insets[-1] == "Formula":
+                            # avoid putting an ERT in a math; instead put command as text
+                            command = command.replace('\\\\', '\\mathrm{')
+                            command = command + '}'
+                        elif not insets or insets[-1] != "ERT":
+                            # add an ERT inset with the replacement character
+                            command = command.replace('\\\\', ert_intro)
+                            command = command + ert_outro
+                        else:
+                            command = command.replace('\\\\', '\n\\backslash\n')
+                    last_char = '' # indicate that the character should not be removed
+                mod_line += command
+            else:
+                # Replace with replacement string
+                mod_line += replacement_character
+    return mod_line
+
+
+def revert_unicode(document):
+    '''Transform unicode characters that can not be written using the
+document encoding to commands according to the unicodesymbols
+file. Characters that can not be replaced by commands are replaced by
+a replacement string.  Flags other than 'combining' are currently not
+implemented.'''
+    spec_chars = read_unicodesymbols()
+    insets = [] # list of active insets
+
+    # Go through the document to capture all combining characters
+    i = 0
+    while i < len(document.body):
+        line = document.body[i]
+        # Check for insets
+        if line.find('\\begin_inset') > -1:
+            insets.append((line[13:].split() or [''])[0]) # '' when no inset type follows
+        if line.find('\\end_inset') > -1:
+            del insets[-1:] # slice deletion: no error on a stray \end_inset
+
+        # Try to write the line
+        try:
+            # If all goes well the line is written here
+            line.encode(document.encoding)
+            i += 1
+        except (UnicodeError, LookupError):
+            # Error, some character(s) in the line need to be replaced
+            new_lines = revert_unicode_line(document, i, insets, spec_chars).split('\n')
+            document.body[i:i+1] = new_lines
+            i += len(new_lines)
+
+
+def revert_cs_label(document):
+    " Remove status flag of charstyle label. "
+    i = 0
+    while 1:
+        i = find_token(document.body, "\\begin_inset CharStyle", i)
+        if i == -1:
+            return
+        # Search for a line starting 'show_label'
+        # If it is not there, break with a warning message
+        i = i + 1
+        while i < len(document.body): # do not index past the end of a truncated document
+            if (document.body[i][:10] == "show_label"):
+                del document.body[i]
+                break
+            elif (document.body[i][:13] == "\\begin_layout"):
+                document.warning("Malformed LyX document: Missing 'show_label'.")
+                break
+            i = i + 1
+
+        i = i + 1
+
+
+def convert_bibitem(document):
+    r""" Convert
+\bibitem [option]{argument}
+
+to
+
+\begin_inset LatexCommand bibitem
+label "option"
+key "argument"
+
+\end_inset
+
+This must be called after convert_commandparams.
+"""
+    i = 0
+    while 1:
+        i = find_token(document.body, "\\bibitem", i)
+        if i == -1:
+            break
+        j = document.body[i].find('[') + 1
+        k = document.body[i].rfind(']')
+        if j == 0: # No optional argument found
+            option = None
+        else:
+            option = document.body[i][j:k]
+        j = document.body[i].rfind('{') + 1
+        k = document.body[i].rfind('}')
+        argument = document.body[i][j:k]
+        lines = ['\\begin_inset LatexCommand bibitem']
+        if option is not None:
+            lines.append('label "%s"' % option.replace('"', '\\"'))
+        lines.append('key "%s"' % argument.replace('"', '\\"'))
+        lines.append('')
+        lines.append('\\end_inset')
+        document.body[i:i+1] = lines
+        i = i + 1
+
+
+commandparams_info = {
+    # command : [option1, option2, argument]
+    "bibitem" : ["label", "", "key"],
+    "bibtex" : ["options", "btprint", "bibfiles"],
+    "cite"        : ["after", "before", "key"],
+    "citet"       : ["after", "before", "key"],
+    "citep"       : ["after", "before", "key"],
+    "citealt"     : ["after", "before", "key"],
+    "citealp"     : ["after", "before", "key"],
+    "citeauthor"  : ["after", "before", "key"],
+    "citeyear"    : ["after", "before", "key"],
+    "citeyearpar" : ["after", "before", "key"],
+    "citet*"      : ["after", "before", "key"],
+    "citep*"      : ["after", "before", "key"],
+    "citealt*"    : ["after", "before", "key"],
+    "citealp*"    : ["after", "before", "key"],
+    "citeauthor*" : ["after", "before", "key"],
+    "Citet"       : ["after", "before", "key"],
+    "Citep"       : ["after", "before", "key"],
+    "Citealt"     : ["after", "before", "key"],
+    "Citealp"     : ["after", "before", "key"],
+    "Citeauthor"  : ["after", "before", "key"],
+    "Citet*"      : ["after", "before", "key"],
+    "Citep*"      : ["after", "before", "key"],
+    "Citealt*"    : ["after", "before", "key"],
+    "Citealp*"    : ["after", "before", "key"],
+    "Citeauthor*" : ["after", "before", "key"],
+    "citefield"   : ["after", "before", "key"],
+    "citetitle"   : ["after", "before", "key"],
+    "cite*"       : ["after", "before", "key"],
+    "hfill" : ["", "", ""],
+    "index"      : ["", "", "name"],
+    "printindex" : ["", "", "name"],
+    "label" : ["", "", "name"],
+    "eqref"     : ["name", "", "reference"],
+    "pageref"   : ["name", "", "reference"],
+    "prettyref" : ["name", "", "reference"],
+    "ref"       : ["name", "", "reference"],
+    "vpageref"  : ["name", "", "reference"],
+    "vref"      : ["name", "", "reference"],
+    "tableofcontents" : ["", "", "type"],
+    "htmlurl" : ["name", "", "target"],
+    "url"     : ["name", "", "target"]}
+
+
+def convert_commandparams(document):
+    r""" Convert
+
+ \begin_inset LatexCommand \cmdname[opt1][opt2]{arg}
+ \end_inset
+
+ to
+
+ \begin_inset LatexCommand cmdname
+ name1 "opt1"
+ name2 "opt2"
+ name3 "arg"
+ \end_inset
+
+ name1, name2 and name3 can be different for each command.
+"""
+    # \begin_inset LatexCommand bibitem was not the official version (see
+    # convert_bibitem()), but could be read in, so we convert it here, too.
+
+    i = 0
+    while 1:
+        i = find_token(document.body, "\\begin_inset LatexCommand", i)
+        if i == -1:
+            break
+        command = document.body[i][26:].strip()
+        if command == "":
+            document.warning("Malformed LyX document: Missing LatexCommand name.")
+            i = i + 1
+            continue
+
+        j = find_token(document.body, "\\end_inset", i + 1)
+        if j == -1:
+            document.warning("Malformed document")
+        else:
+            command += "".join(document.body[i+1:j])
+            document.body[i+1:j] = []
+
+        # The following parser is taken from the original InsetCommandParams::scanCommand
+        name = ""
+        option1 = ""
+        option2 = ""
+        argument = ""
+        state = "WS"
+        # Used to handle things like \command[foo[bar]]{foo{bar}}
+        nestdepth = 0
+        b = 0
+        for c in command:
+            if state == "CMDNAME" and c in (' ', '[', '{'):
+                state = "WS"
+            if ((state == "OPTION" and c == ']') or
+                (state == "SECOPTION" and c == ']') or
+                (state == "CONTENT" and c == '}')):
+                if nestdepth == 0:
+                    state = "WS"
+                else:
+                    nestdepth = nestdepth - 1
+            if ((state == "OPTION" and c == '[') or
+                (state == "SECOPTION" and c == '[') or
+                (state == "CONTENT" and c == '{')):
+                nestdepth = nestdepth + 1
+            if state == "CMDNAME":
+                    name += c
+            elif state == "OPTION":
+                    option1 += c
+            elif state == "SECOPTION":
+                    option2 += c
+            elif state == "CONTENT":
+                    argument += c
+            elif state == "WS":
+                if c == '\\':
+                    state = "CMDNAME"
+                elif c == '[' and b != ']':
+                    state = "OPTION"
+                    nestdepth = 0 # Just to be sure
+                elif c == '[' and b == ']':
+                    state = "SECOPTION"
+                    nestdepth = 0 # Just to be sure
+                elif c == '{':
+                    state = "CONTENT"
+                    nestdepth = 0 # Just to be sure
+            b = c
+
+        # Now we have parsed the command, output the parameters
+        # An unknown command has no valid parameters: warn below instead of raising KeyError
+        params = commandparams_info.get(name, ["", "", ""])
+        lines = ["\\begin_inset LatexCommand %s" % name]
+        if option1 != "":
+            if params[0] == "":
+                document.warning("Ignoring invalid option `%s' of command `%s'." % (option1, name))
+            else:
+                lines.append('%s "%s"' % (params[0], option1.replace('"', '\\"')))
+        if option2 != "":
+            if params[1] == "":
+                document.warning("Ignoring invalid second option `%s' of command `%s'." % (option2, name))
+            else:
+                lines.append('%s "%s"' % (params[1], option2.replace('"', '\\"')))
+        if argument != "":
+            if params[2] == "":
+                document.warning("Ignoring invalid argument `%s' of command `%s'." % (argument, name))
+            else:
+                lines.append('%s "%s"' % (params[2], argument.replace('"', '\\"')))
+        document.body[i:i+1] = lines
+        i = i + 1
+
+
+def revert_commandparams(document):
+    """ Revert command insets from the parameter-per-line format back to the
+    old one-line format.
+
+    Each inset starting with `\\begin_inset LatexCommand <name>' whose
+    parameters are stored as `<parameter> "<value>"' lines is rewritten as
+    `\\begin_inset LatexCommand \\<name>[option1][option2]{argument}'; a
+    bibitem inset is replaced by a bare `\\bibitem [option1]{argument}' line.
+    The parameter names of each command are taken from commandparams_info
+    (first option, second option, argument). """
+
+    def unquote(value):
+        # Remove exactly one pair of enclosing quotes, so that an escaped
+        # quote at the very end of the value is not eaten, then unescape.
+        if len(value) >= 2 and value[0] == '"' and value[-1] == '"':
+            value = value[1:-1]
+        else:
+            value = value.strip('"')
+        return value.replace('\\"', '"')
+
+    regex = re.compile(r'(\S+)\s+(.+)')
+    i = 0
+    while 1:
+        i = find_token(document.body, "\\begin_inset LatexCommand", i)
+        if i == -1:
+            break
+        name = document.body[i].split()[2]
+        j = find_end_of_inset(document.body, i + 1)
+        if j == -1:
+            # Without the end of the inset we cannot know what to replace.
+            document.warning("Malformed LyX document: Missing `\\end_inset'.")
+            i = i + 1
+            continue
+        preview_line = ""
+        option1 = ""
+        option2 = ""
+        argument = ""
+        for k in range(i + 1, j):
+            match = regex.match(document.body[k])
+            if match:
+                pname = match.group(1)
+                pvalue = match.group(2)
+                if pname == "preview":
+                    preview_line = document.body[k]
+                elif (commandparams_info[name][0] != "" and
+                      pname == commandparams_info[name][0]):
+                    option1 = unquote(pvalue)
+                elif (commandparams_info[name][1] != "" and
+                      pname == commandparams_info[name][1]):
+                    option2 = unquote(pvalue)
+                elif (commandparams_info[name][2] != "" and
+                      pname == commandparams_info[name][2]):
+                    argument = unquote(pvalue)
+            elif document.body[k].strip() != "":
+                document.warning("Ignoring unknown contents `%s' in command inset %s." % (document.body[k], name))
+        if name == "bibitem":
+            # bibitem was no real inset in the old format: a single line
+            # without preview setting and without \end_inset.
+            if option1 == "":
+                lines = ["\\bibitem {%s}" % argument]
+            else:
+                lines = ["\\bibitem [%s]{%s}" % (option1, argument)]
+        else:
+            if option1 == "":
+                if option2 == "":
+                    lines = ["\\begin_inset LatexCommand \\%s{%s}" % (name, argument)]
+                else:
+                    # An empty first option is needed as placeholder
+                    lines = ["\\begin_inset LatexCommand \\%s[][%s]{%s}" % (name, option2, argument)]
+            else:
+                if option2 == "":
+                    lines = ["\\begin_inset LatexCommand \\%s[%s]{%s}" % (name, option1, argument)]
+                else:
+                    lines = ["\\begin_inset LatexCommand \\%s[%s][%s]{%s}" % (name, option1, option2, argument)]
+            if preview_line != "":
+                lines.append(preview_line)
+            lines.append('')
+            lines.append('\\end_inset')
+        document.body[i:j+1] = lines
+        # Continue right behind the replacement. The old index j is stale
+        # because the number of lines of the inset has changed.
+        i = i + len(lines)
+
+
+def revert_nomenclature(document):
+    " Convert nomenclature entry to ERT. "
+    param_re = re.compile(r'(\S+)\s+(.+)')
+    package_line = '\\usepackage{nomencl}[2005/09/22]'
+    found_entry = 0
+    i = 0
+    while 1:
+        i = find_token(document.body, "\\begin_inset LatexCommand nomenclature", i)
+        if i == -1:
+            break
+        found_entry = 1
+        j = find_end_of_inset(document.body, i + 1)
+        # Collect the values of the known parameters of this inset.
+        # A preview setting is matched but not needed for ERT.
+        params = {"symbol": "", "description": "", "prefix": ""}
+        for k in range(i + 1, j):
+            line = document.body[k]
+            match = param_re.match(line)
+            if not match:
+                if line.strip() != "":
+                    document.warning("Ignoring unknown contents `%s' in nomenclature inset." % line)
+                continue
+            key = match.group(1)
+            if key in params:
+                params[key] = match.group(2).strip('"').replace('\\"', '"')
+        # The prefix is the optional argument of \nomenclature
+        command = 'nomenclature'
+        if params["prefix"] != "":
+            command += '[%s]' % params["prefix"]
+        command += '{%s}{%s}' % (params["symbol"], params["description"])
+        ert = ['\\begin_inset ERT',
+               'status collapsed',
+               '',
+               '\\begin_layout %s' % document.default_layout,
+               '',
+               '',
+               '\\backslash',
+               command,
+               '\\end_layout',
+               '',
+               '\\end_inset']
+        document.body[i:j+1] = ert
+        # Skip the 11 lines of the ERT inset
+        i = i + 11
+    # Load the nomencl package if needed and not yet done
+    if found_entry and find_token(document.preamble, package_line, 0) == -1:
+        document.preamble.append(package_line)
+        document.preamble.append('\\makenomenclature')
+
+
+def revert_printnomenclature(document):
+    """ Convert printnomenclature to ERT.
+
+    Every printnomenclature command inset is replaced by an ERT inset
+    containing `\\printnomenclature', with the labelwidth parameter (if set)
+    as optional argument. The nomencl package is added to the preamble if
+    at least one inset was converted and it is not loaded yet. """
+    regex = re.compile(r'(\S+)\s+(.+)')
+    i = 0
+    use_nomencl = 0
+    while 1:
+        i = find_token(document.body, "\\begin_inset LatexCommand printnomenclature", i)
+        if i == -1:
+            break
+        use_nomencl = 1
+        j = find_end_of_inset(document.body, i + 1)
+        labelwidth = ""
+        for k in range(i + 1, j):
+            match = regex.match(document.body[k])
+            if match:
+                # Only labelwidth is of interest, other parameters (e.g. the
+                # preview setting) cannot be expressed in ERT.
+                if match.group(1) == "labelwidth":
+                    labelwidth = match.group(2).strip('"').replace('\\"', '"')
+            elif document.body[k].strip() != "":
+                document.warning("Ignoring unknown contents `%s' in printnomenclature inset." % document.body[k])
+        # The command to write is \printnomenclature, not \nomenclature
+        # (the latter creates a single entry and needs two arguments).
+        if labelwidth == "":
+            command = 'printnomenclature{}'
+        else:
+            command = 'printnomenclature[%s]' % labelwidth
+        document.body[i:j+1] = ['\\begin_inset ERT',
+                                'status collapsed',
+                                '',
+                                '\\begin_layout %s' % document.default_layout,
+                                '',
+                                '',
+                                '\\backslash',
+                                command,
+                                '\\end_layout',
+                                '',
+                                '\\end_inset']
+        # Skip the 11 lines of the ERT inset
+        i = i + 11
+    if use_nomencl and find_token(document.preamble, '\\usepackage{nomencl}[2005/09/22]', 0) == -1:
+        document.preamble.append('\\usepackage{nomencl}[2005/09/22]')
+        document.preamble.append('\\makenomenclature')
+
+
+def convert_esint(document):
+    " Add \\use_esint setting to header. "
+    pos = find_token(document.header, "\\cite_engine", 0)
+    if pos != -1:
+        # The new setting goes directly in front of \cite_engine.
+        # 0 is off, 1 is auto, 2 is on.
+        document.header.insert(pos, '\\use_esint 0')
+        return
+    document.warning("Malformed LyX document: Missing `\\cite_engine'.")
+
+
+def revert_esint(document):
+    """ Remove \\use_esint setting from header.
+
+    If esint was switched on unconditionally, the package is loaded in the
+    preamble instead. """
+    i = find_token(document.header, "\\use_esint", 0)
+    if i == -1:
+        document.warning("Malformed LyX document: Missing `\\use_esint'.")
+        return
+    use_esint = document.header[i].split()[1]
+    del document.header[i]
+    # 0 is off, 1 is auto, 2 is on.
+    # The value is read from the header as a string, so it must be compared
+    # with a string: a comparison with the number 2 is never true.
+    if use_esint == "2":
+        document.preamble.append('\\usepackage{esint}')
+
+
+def revert_clearpage(document):
+    """ clearpage -> ERT
+
+    Every line starting with `\\clearpage' is replaced by an ERT inset
+    containing the clearpage command. """
+    i = 0
+    while 1:
+        i = find_token(document.body, "\\clearpage", i)
+        if i == -1:
+            break
+        ert = ['\\begin_inset ERT',
+               'status collapsed',
+               '',
+               '\\begin_layout %s' % document.default_layout,
+               '',
+               '',
+               '\\backslash',
+               'clearpage',
+               '\\end_layout',
+               '',
+               '\\end_inset']
+        document.body[i:i+1] = ert
+        # Continue behind the inserted inset instead of scanning it again
+        i = i + len(ert)
+
+
+def revert_cleardoublepage(document):
+    """ cleardoublepage -> ERT
+
+    Every line starting with `\\cleardoublepage' is replaced by an ERT inset
+    containing the cleardoublepage command. """
+    i = 0
+    while 1:
+        i = find_token(document.body, "\\cleardoublepage", i)
+        if i == -1:
+            break
+        ert = ['\\begin_inset ERT',
+               'status collapsed',
+               '',
+               '\\begin_layout %s' % document.default_layout,
+               '',
+               '',
+               '\\backslash',
+               'cleardoublepage',
+               '\\end_layout',
+               '',
+               '\\end_inset']
+        document.body[i:i+1] = ert
+        # Continue behind the inserted inset instead of scanning it again
+        i = i + len(ert)
+
+
+def convert_lyxline(document):
+    " remove fontsize commands for \\lyxline "
+    # The problem is: The old \lyxline definition doesn't handle the fontsize
+    # to change the line thickness. The new definition does this so that
+    # imported \lyxlines would have a different line thickness. The eventual
+    # fontsize command before \lyxline is therefore removed to get the same
+    # output.
+    fontsizes = ["tiny", "scriptsize", "footnotesize", "small", "normalsize",
+                 "large", "Large", "LARGE", "huge", "Huge"]
+    for fontsize in fontsizes:
+        i = 0
+        while 1:
+            i = find_token(document.body, "\\size " + fontsize, i)
+            if i == -1:
+                break
+            k = find_token(document.body, "\\lyxline", i)
+            # the corresponding fontsize command is always 2 lines before the \lyxline
+            if k == i + 2:
+                # After the deletion line i holds the former next line, so
+                # the search continues at the same index.
+                del document.body[i]
+            else:
+                # This fontsize command does not belong to a \lyxline: keep
+                # it and look at the remaining ones (the search must not
+                # stop here, or later \lyxlines would be missed).
+                i = i + 1
+
+
+def revert_encodings(document):
+    " Set new encodings to auto. "
+    # Encodings that are replaced by auto
+    new_encodings = ["8859-6", "8859-8", "cp437", "cp437de", "cp850", "cp852",
+                     "cp855", "cp858", "cp862", "cp865", "cp866", "cp1250",
+                     "cp1252", "cp1256", "cp1257", "latin10", "pt254", "tis620-0"]
+    pos = find_token(document.header, "\\inputencoding", 0)
+    if pos != -1:
+        if get_value(document.header, "\\inputencoding", pos) in new_encodings:
+            document.header[pos] = "\\inputencoding auto"
+    else:
+        # No encoding given at all
+        document.header.append("\\inputencoding auto")
+    # Keep the cached value of the document in sync with the header
+    document.inputencoding = get_value(document.header, "\\inputencoding", 0)
+
+
+def convert_caption(document):
+    " Convert caption layouts to caption insets. "
+    start = 0
+    while 1:
+        start = find_token(document.body, "\\begin_layout Caption", start)
+        if start == -1:
+            return
+        end = find_end_of_layout(document.body, start)
+        if end == -1:
+            document.warning("Malformed LyX document: Missing `\\end_layout'.")
+            return
+
+        default_begin = "\\begin_layout %s" % document.default_layout
+        # Close the layout inside of the inset and the inset itself in front
+        # of the old \end_layout. This is done first so that the index of
+        # the layout start is still valid afterwards.
+        document.body[end:end] = ["\\end_layout", "", "\\end_inset", "", ""]
+        # The caption layout becomes a default layout holding the inset
+        document.body[start:start+1] = [default_begin,
+                                        "\\begin_inset Caption",
+                                        "",
+                                        default_begin]
+        start = start + 1
+
+
+def revert_caption(document):
+    " Convert caption insets to caption layouts. "
+    " This assumes that the text class has a caption style. "
+    # i is the line of the caption inset that is currently converted.
+    i = 0
+    while 1:
+        i = find_token(document.body, "\\begin_inset Caption", i)
+        if i == -1:
+            return
+
+        # We either need to delete the previous \begin_layout line, or we
+        # need to end the previous layout if this inset is not in the first
+        # position of the paragraph.
+        layout_before = find_token_backwards(document.body, "\\begin_layout", i)
+        if layout_before == -1:
+            document.warning("Malformed LyX document: Missing `\\begin_layout'.")
+            return
+        # Remembered to be able to restart the layout behind the caption
+        layout_line = document.body[layout_before]
+        # The inset is at the paragraph start if only empty lines are between
+        # the \begin_layout line and the inset.
+        del_layout_before = True
+        l = layout_before + 1
+        while l < i:
+            if document.body[l] != "":
+                del_layout_before = False
+                break
+            l = l + 1
+        if del_layout_before:
+            # The inset moves up to the line of the deleted \begin_layout
+            del document.body[layout_before:i]
+            i = layout_before
+        else:
+            # The inset moves down by the two inserted lines
+            document.body[i:i] = ["\\end_layout", ""]
+            i = i + 2
+
+        # Find start of layout in the inset and end of inset
+        j = find_token(document.body, "\\begin_layout", i)
+        if j == -1:
+            document.warning("Malformed LyX document: Missing `\\begin_layout'.")
+            return
+        k = find_end_of_inset(document.body, i)
+        if k == -1:
+            document.warning("Malformed LyX document: Missing `\\end_inset'.")
+            return
+
+        # We either need to delete the following \end_layout line, or we need
+        # to restart the old layout if this inset is not at the paragraph end.
+        layout_after = find_token(document.body, "\\end_layout", k)
+        if layout_after == -1:
+            document.warning("Malformed LyX document: Missing `\\end_layout'.")
+            return
+        # The inset is at the paragraph end if only empty lines are between
+        # the \end_inset line and the \end_layout line.
+        del_layout_after = True
+        l = k + 1
+        while l < layout_after:
+            if document.body[l] != "":
+                del_layout_after = False
+                break
+            l = l + 1
+        if del_layout_after:
+            del document.body[k+1:layout_after+1]
+        else:
+            document.body[k+1:k+1] = [layout_line, ""]
+
+        # delete \begin_layout and \end_inset and replace \begin_inset with
+        # "\begin_layout Caption". This works because we can only have one
+        # paragraph in the caption inset: The old \end_layout will be recycled.
+        # The lines are deleted from back (k) to front (j), so the smaller
+        # indices are still valid when they are used.
+        del document.body[k]
+        if document.body[k] == "":
+            del document.body[k]
+        del document.body[j]
+        if document.body[j] == "":
+            del document.body[j]
+        document.body[i] = "\\begin_layout Caption"
+        if document.body[i+1] == "":
+            del document.body[i+1]
+        i = i + 1
+
+
+# Accents of InsetLaTeXAccent
+# Maps the accent name (the LaTeX command without the backslash) to the
+# combining unicode character that is put behind the accented character.
+accent_map = {
+    "`" : u'\u0300', # grave
+    "'" : u'\u0301', # acute
+    "^" : u'\u0302', # circumflex
+    "~" : u'\u0303', # tilde
+    "=" : u'\u0304', # macron
+    "u" : u'\u0306', # breve
+    "." : u'\u0307', # dot above
+    "\"": u'\u0308', # diaeresis
+    "r" : u'\u030a', # ring above
+    "H" : u'\u030b', # double acute
+    "v" : u'\u030c', # caron
+    "b" : u'\u0320', # minus sign below
+    "d" : u'\u0323', # dot below
+    "c" : u'\u0327', # cedilla
+    "k" : u'\u0328', # ogonek
+    "t" : u'\u0361'  # tie. This is special: It spans two characters, but
+                     # only one is given as argument, so we don't need to
+                     # treat it differently.
+}
+
+
+# special accents of InsetLaTeXAccent without argument
+# Maps the command name to the unicode character that replaces the whole
+# inset.
+special_accent_map = {
+    'i' : u'\u0131', # dotless i
+    'j' : u'\u0237', # dotless j
+    'l' : u'\u0142', # l with stroke
+    'L' : u'\u0141'  # L with stroke
+}
+
+
+# special accent arguments of InsetLaTeXAccent
+# Maps an argument that is a LaTeX command itself to the unicode character
+# that gets the accent.
+accented_map = {
+    '\\i' : u'\u0131', # dotless i
+    '\\j' : u'\u0237'  # dotless j
+}
+
+
+def _convert_accent(accent, accented_char):
+    """ Return the unicode representation of the accent `accent' applied to
+    `accented_char', or '' if the combination cannot be converted. """
+    kind = accent
+    base = accented_char
+    if base == '':
+        # Accents without argument may be special characters of their own
+        if kind in special_accent_map:
+            return special_accent_map[kind]
+        # a missing char is treated as space by LyX
+        base = ' '
+    elif kind == 'q' and base in ['t', 'd', 'l', 'L']:
+        # Special caron, only used with t, d, l and L.
+        # It is not in the map because we convert it to the same unicode
+        # character as the normal caron: \q{} is only defined if babel with
+        # the czech or slovak language is used, and the normal caron
+        # produces the correct output if the T1 font encoding is used.
+        # For the same reason we never convert to \q{} in the other direction.
+        kind = 'v'
+    elif base in accented_map:
+        base = accented_map[base]
+    elif (len(base) > 1):
+        # We can only convert accents on a single char
+        return ''
+    combining = accent_map.get(kind)
+    if not combining:
+        # Unknown accent
+        return ''
+    # Use the precomposed character if unicode has one
+    return unicodedata.normalize("NFC", "%s%s" % (base, combining))
+
+
+def convert_ertbackslash(body, i, ert, default_layout):
+    r""" Convert backslashes and '\n' into valid ERT code, append the
+    converted text to body[i] and return the (maybe incremented) line
+    index i. """
+
+    for char in ert:
+        if char == '\n':
+            # A line break starts a new paragraph of the default layout
+            paragraph_break = ['\\end_layout', '',
+                               '\\begin_layout %s' % default_layout, '']
+            body[i+1:i+1] = paragraph_break
+            i += 4
+            continue
+        if char == '\\':
+            # \backslash ends the current line, the text continues on a
+            # new one
+            body[i] += '\\backslash '
+            i += 1
+            body.insert(i, '')
+            continue
+        body[i] += char
+    return i
+
+
+def convert_accent(document):
+    """ Convert InsetLaTeXAccent to unicode characters.
+
+    Insets that cannot be expressed as unicode character are converted to
+    ERT insets. """
+    # The following forms are supported by LyX:
+    # '\i \"{a}' (standard form, as written by LyX)
+    # '\i \"{}' (standard form, as written by LyX if the accented char is a space)
+    # '\i \"{ }' (also accepted if the accented char is a space)
+    # '\i \" a'  (also accepted)
+    # '\i \"'    (also accepted)
+    re_wholeinset = re.compile(r'^(.*)(\\i\s+)(.*)$')
+    re_contents = re.compile(r'^([^\s{]+)(.*)$')
+    re_accentedcontents = re.compile(r'^\s*{?([^{}]*)}?\s*$')
+    i = 0
+    while 1:
+        i = find_re(document.body, re_wholeinset, i)
+        if i == -1:
+            return
+        match = re_wholeinset.match(document.body[i])
+        prefix = match.group(1)
+        contents = match.group(3).strip()
+        match = re_contents.match(contents)
+        if match:
+            # Strip first char (always \)
+            accent = match.group(1)[1:]
+            accented_contents = match.group(2).strip()
+            match = re_accentedcontents.match(accented_contents)
+            if match:
+                accented_char = match.group(1)
+                converted = _convert_accent(accent, accented_char)
+                if converted == '':
+                    # Normalize contents
+                    contents = '%s{%s}' % (accent, accented_char)
+                else:
+                    document.body[i] = '%s%s' % (prefix, converted)
+                    i += 1
+                    continue
+            else:
+                # The argument has a form we do not understand (e.g. nested
+                # braces or text behind the closing brace). Keep it as it
+                # is, the backslash of the accent is added again below.
+                contents = '%s%s' % (accent, accented_contents)
+        document.warning("Converting unknown InsetLaTeXAccent `\\i %s' to ERT." % contents)
+        document.body[i] = prefix
+        document.body[i+1:i+1] = ['\\begin_inset ERT',
+                                  'status collapsed',
+                                  '',
+                                  '\\begin_layout %s' % document.default_layout,
+                                  '',
+                                  '',
+                                  '']
+        # The ERT text is appended to the last of the 7 inserted lines
+        i = convert_ertbackslash(document.body, i + 7,
+                                 '\\%s' % contents,
+                                 document.default_layout)
+        document.body[i+1:i+1] = ['\\end_layout',
+                                  '',
+                                  '\\end_inset']
+        i += 3
+
+
+def is_inset_line(document, i):
+    """ Line i of body has an inset """
+    line = document.body[i]
+    # A line that starts with a backslash is a command
+    if line.startswith('\\'):
+        return True
+    # Otherwise look for a backslash in the last two words of the line
+    tail = "".join(line.split()[-2:])
+    return '\\' in tail
+
+
+def revert_accent(document):
+    """ Convert accented characters that cannot be represented in the
+    current encoding to InsetLaTeXAccent. """
+    # Build the reverse lookup tables: unicode character -> LaTeX name
+    inverse_accent_map = {}
+    for k in accent_map:
+        inverse_accent_map[accent_map[k]] = k
+    inverse_special_accent_map = {}
+    for k in special_accent_map:
+        inverse_special_accent_map[special_accent_map[k]] = k
+    inverse_accented_map = {}
+    for k in accented_map:
+        inverse_accented_map[accented_map[k]] = k
+
+    # Since LyX may insert a line break within a word we must combine all
+    # words before unicode normalization.
+    # We do this only if the next line starts with an accent, otherwise we
+    # would create things like '\begin_inset ERTstatus'.
+    for i in range(len(document.body) - 1):
+        if document.body[i] == '' or document.body[i+1] == '' or document.body[i][-1] == ' ':
+            continue
+        if (document.body[i+1][0] in inverse_accent_map and not is_inset_line(document, i)):
+            # the last character of this line and the first of the next line
+            # probably form a combining sequence, inline insets are excluded
+            # (second part of the test)
+            while (len(document.body[i+1]) > 0 and document.body[i+1][0] != ' '):
+                document.body[i] += document.body[i+1][0]
+                document.body[i+1] = document.body[i+1][1:]
+
+    # Normalize to "Normal form D" (NFD, also known as canonical decomposition).
+    # This is needed to catch all accented characters.
+    for i in range(len(document.body)):
+        # Unfortunately we have a mixture of unicode strings and plain strings,
+        # because we never use u'xxx' for string literals, but 'xxx'.
+        # Therefore we may have to try two times to normalize the data.
+        try:
+            document.body[i] = unicodedata.normalize("NFD", document.body[i])
+        except TypeError:
+            document.body[i] = unicodedata.normalize("NFD", unicode(document.body[i], 'utf-8'))
+
+    # Replace accented characters with InsetLaTeXAccent
+    # Do not convert characters that can be represented in the chosen
+    # encoding.
+    encoding_stack = [get_encoding(document.language, document.inputencoding, 248, document.cjk_encoding)]
+    lang_re = re.compile(r"^\\lang\s(\S+)")
+
+    i = 0
+    while i < len(document.body):
+        if (document.inputencoding == "auto" or document.inputencoding == "default") and document.cjk_encoding != '':
+            # Track the encoding of the current line.
+            # These lines contain no text, so we go on with the next line.
+            # The index must be advanced before each continue, otherwise
+            # the same line would be examined forever.
+            result = lang_re.match(document.body[i])
+            if result:
+                language = result.group(1)
+                if language == "default":
+                    encoding_stack[-1] = document.encoding
+                else:
+                    from lyx2lyx_lang import lang
+                    encoding_stack[-1] = lang[language][3]
+                i = i + 1
+                continue
+            elif find_token(document.body, "\\begin_layout", i, i + 1) == i:
+                encoding_stack.append(encoding_stack[-1])
+                i = i + 1
+                continue
+            elif find_token(document.body, "\\end_layout", i, i + 1) == i:
+                del encoding_stack[-1]
+                i = i + 1
+                continue
+
+        for j in range(len(document.body[i])):
+            # dotless i and dotless j are both in special_accent_map and can
+            # occur as an accented character, so we need to test that the
+            # following character is no accent
+            if (document.body[i][j] in inverse_special_accent_map and
+                (j == len(document.body[i]) - 1 or document.body[i][j+1] not in inverse_accent_map)):
+                accent = document.body[i][j]
+                try:
+                    dummy = accent.encode(encoding_stack[-1])
+                except UnicodeEncodeError:
+                    # Insert the rest of the line as new line
+                    if j < len(document.body[i]) - 1:
+                        document.body.insert(i+1, document.body[i][j+1:])
+                    # Delete the accented character
+                    document.body[i] = document.body[i][:j]
+                    # Finally add the InsetLaTeXAccent
+                    document.body[i] += "\\i \\%s{}" % inverse_special_accent_map[accent]
+                    # The rest of the line is handled as line i + 1
+                    break
+            elif j > 0 and document.body[i][j] in inverse_accent_map:
+                accented_char = document.body[i][j-1]
+                if accented_char == ' ':
+                    # Conform to LyX output
+                    accented_char = ''
+                elif accented_char in inverse_accented_map:
+                    accented_char = inverse_accented_map[accented_char]
+                accent = document.body[i][j]
+                try:
+                    dummy = unicodedata.normalize("NFC", accented_char + accent).encode(encoding_stack[-1])
+                except UnicodeEncodeError:
+                    # Insert the rest of the line as new line
+                    if j < len(document.body[i]) - 1:
+                        document.body.insert(i+1, document.body[i][j+1:])
+                    # Delete the accented characters
+                    document.body[i] = document.body[i][:j-1]
+                    # Finally add the InsetLaTeXAccent
+                    document.body[i] += "\\i \\%s{%s}" % (inverse_accent_map[accent], accented_char)
+                    # The rest of the line is handled as line i + 1
+                    break
+        i = i + 1
+
+    # Normalize to "Normal form C" (NFC, pre-composed characters) again
+    for i in range(len(document.body)):
+        document.body[i] = unicodedata.normalize("NFC", document.body[i])
+
+
+def normalize_font_whitespace_259(document):
+    """ Move whitespace at the start or end of a font change outside of it.
+    Before format 259 the font change was ignored for such whitespace.
+    All font properties except the language are handled here. """
+
+    # property -> value that resets it
+    default_values = {
+        "\\family": "default",
+        "\\series": "default",
+        "\\shape": "default",
+        "\\emph": "default",
+        "\\bar": "default",
+        "\\color": "none"
+    }
+    return normalize_font_whitespace(document, default_values)
+
+def normalize_font_whitespace_274(document):
+    """ Move whitespace at the start or end of a language change outside of
+    it. Font changes were ignored for such whitespace before format 259
+    (sic). Format 259 corrected this for most font properties, but the
+    language was forgotten, so the same conversion is applied to language
+    changes here. """
+
+    # property -> value that resets it
+    default_values = {}
+    default_values["\\lang"] = "default"
+    return normalize_font_whitespace(document, default_values)
+
+def get_paragraph_language(document, i):
+    """ Return the language of the paragraph that contains line i of the
+    document body: the argument of the \\lang command if that is the first
+    thing in the paragraph, the language of the document otherwise. """
+
+    body = document.body
+    layout_start = find_beginning_of_layout(body, i)
+    first_text_line = find_nonempty_line(body, layout_start + 1)
+    tokens = body[first_text_line].split()
+
+    # No language change at the paragraph start
+    if len(tokens) < 2 or tokens[0] != "\\lang":
+        return document.language
+    return tokens[1]
+	
+def normalize_font_whitespace(document, char_properties):
+    """ Before format 259 the font changes were ignored if a
+    whitespace was the first or last character in the sequence, this function
+    transfers the whitespace outside. Only a change in one of the properties
+    in the provided char_properties is handled by this function.
+
+    char_properties maps the property command (e.g. "\\series") to the value
+    that resets the property. If it contains "\\lang", that entry is
+    overwritten in place with the language of the current paragraph.
+    Nothing is done unless the backend of the document is latex. """
+
+    if document.backend != "latex":
+        return
+
+    lines = document.body
+
+    # Properties that currently differ from their default: property -> value
+    changes = {}
+
+    i = 0
+    while i < len(lines):
+        words = lines[i].split()
+
+        if len(words) > 0 and words[0] == "\\begin_layout":
+            # a new paragraph resets all font changes
+            changes.clear()
+            # also reset the default language to be the paragraph's language
+            if "\\lang" in char_properties.keys():
+                char_properties["\\lang"] = \
+                    get_paragraph_language(document, i + 1)
+
+        elif len(words) > 1 and words[0] in char_properties.keys():
+            # we have a font change
+            if char_properties[words[0]] == words[1]:
+                # property gets reset
+                if words[0] in changes.keys():
+                    del changes[words[0]]
+                defaultproperty = True
+            else:
+                # property gets set
+                changes[words[0]] = words[1]
+                defaultproperty = False
+
+            # We need to explicitly reset all changed properties if we find
+            # a space below, because LyX 1.4 would output the space after
+            # closing the previous change and before starting the new one,
+            # and closing a font change means to close all properties, not
+            # just the changed one.
+
+            # NOTE(review): for i == 0 lines[i-1] is the last line of the
+            # body (negative index), and lines[i+1] / lines[i+2] below are
+            # not checked against the end of the body -- presumably a font
+            # change is never the first or last line; confirm.
+            if lines[i-1] and lines[i-1][-1] == " ":
+                lines[i-1] = lines[i-1][:-1]
+                # a space before the font change
+                # added_lines is built around the space: resets are put in
+                # front of it, the still active changes behind it.
+                added_lines = [" "]
+                for k in changes.keys():
+                    # exclude property k because that is already in lines[i]
+                    if k != words[0]:
+                        added_lines[1:1] = ["%s %s" % (k, changes[k])]
+                for k in changes.keys():
+                    # exclude property k because that must be added below anyway
+                    if k != words[0]:
+                        added_lines[0:0] = ["%s %s" % (k, char_properties[k])]
+                if defaultproperty:
+                    # Property is reset in lines[i], so add the new stuff afterwards
+                    lines[i+1:i+1] = added_lines
+                else:
+                    # Reset property for the space
+                    added_lines[0:0] = ["%s %s" % (words[0], char_properties[words[0]])]
+                    lines[i:i] = added_lines
+                # Skip the inserted lines
+                i = i + len(added_lines)
+
+            elif lines[i+1] and lines[i+1][0] == " " and (len(changes) > 0 or not defaultproperty):
+                # a space after the font change
+                if (lines[i+1] == " " and lines[i+2]):
+                    next_words = lines[i+2].split()
+                    if len(next_words) > 0 and next_words[0] == words[0]:
+                        # a single blank with a property different from the
+                        # previous and the next line must not be changed
+                        i = i + 2
+                        continue
+                lines[i+1] = lines[i+1][1:]
+                # Same construction as above: resets in front of the space,
+                # active changes behind it.
+                added_lines = [" "]
+                for k in changes.keys():
+                    # exclude property k because that is already in lines[i]
+                    if k != words[0]:
+                        added_lines[1:1] = ["%s %s" % (k, changes[k])]
+                for k in changes.keys():
+                    # exclude property k because that must be added below anyway
+                    if k != words[0]:
+                        added_lines[0:0] = ["%s %s" % (k, char_properties[k])]
+                # Reset property for the space
+                added_lines[0:0] = ["%s %s" % (words[0], char_properties[words[0]])]
+                lines[i:i] = added_lines
+                # Skip the inserted lines
+                i = i + len(added_lines)
+
+        i = i + 1
+
+
+def revert_utf8x(document):
+    " Set utf8x encoding to utf8. "
+    pos = find_token(document.header, "\\inputencoding", 0)
+    if pos != -1:
+        if get_value(document.header, "\\inputencoding", pos) == "utf8x":
+            document.header[pos] = "\\inputencoding utf8"
+    else:
+        # No encoding given at all
+        document.header.append("\\inputencoding auto")
+    # Keep the cached value of the document in sync with the header
+    document.inputencoding = get_value(document.header, "\\inputencoding", 0)
+
+
+def revert_utf8plain(document):
+    " Set utf8plain encoding to utf8. "
+    pos = find_token(document.header, "\\inputencoding", 0)
+    if pos != -1:
+        if get_value(document.header, "\\inputencoding", pos) == "utf8-plain":
+            document.header[pos] = "\\inputencoding utf8"
+    else:
+        # No encoding given at all
+        document.header.append("\\inputencoding auto")
+    # Keep the cached value of the document in sync with the header
+    document.inputencoding = get_value(document.header, "\\inputencoding", 0)
+
+
+def revert_beamer_alert(document):
+    " Revert beamer's \\alert inset back to ERT. "
+    i = 0
+    while 1:
+        i = find_token(document.body, "\\begin_inset CharStyle Alert", i)
+        if i == -1:
+            return
+        document.body[i] = "\\begin_inset ERT"
+        # The inset text is the line right after the first \begin_layout.
+        k = find_token(document.body, "\\begin_layout", i + 1)
+        if k == -1 or k + 1 >= len(document.body):
+            # Truncated inset: warn instead of running off the end of body.
+            document.warning("Malformed LyX document: Could not find layout of Alert inset.")
+            return
+        # Insert the \alert command around that line
+        document.body[k + 1] = "\\alert{" + document.body[k + 1] + '}'
+        i = k + 1
+
+
+def revert_beamer_structure(document):
+    " Revert beamer's \\structure inset back to ERT. "
+    i = 0
+    while 1:
+        i = find_token(document.body, "\\begin_inset CharStyle Structure", i)
+        if i == -1:
+            return
+        document.body[i] = "\\begin_inset ERT"
+        # The inset text is the line right after the first \begin_layout.
+        k = find_token(document.body, "\\begin_layout", i + 1)
+        if k == -1 or k + 1 >= len(document.body):
+            document.warning("Malformed LyX document: Could not find layout of Structure inset.")
+            return
+        # Insert the \structure command around that line
+        document.body[k + 1] = "\\structure{" + document.body[k + 1] + '}'
+        i = k + 1
+
+
+def convert_changes(document):
+    " Force \\output_changes to false when \\tracking_changes is false. "
+    header = document.header
+    track_pos = find_token(header, '\\tracking_changes', 0)
+    if track_pos == -1:
+        document.warning("Malformed lyx document: Missing '\\tracking_changes'.")
+        return
+    output_pos = find_token(header, '\\output_changes', 0)
+    if output_pos == -1:
+        document.warning("Malformed lyx document: Missing '\\output_changes'.")
+        return
+    tracking_off = get_value(header, "\\tracking_changes", track_pos) == "false"
+    if tracking_off and get_value(header, "\\output_changes", output_pos) == "true":
+        header[output_pos] = "\\output_changes false"
+
+
+def revert_ascii(document):
+    " Replace the input encoding ascii by auto (and add 'auto' if none is set). "
+    header = document.header
+    pos = find_token(header, "\\inputencoding", 0)
+    if pos == -1:
+        header.append("\\inputencoding auto")
+    elif get_value(header, "\\inputencoding", pos) == "ascii":
+        header[pos] = "\\inputencoding auto"
+    # refresh the cached value from the (possibly rewritten) header
+    document.inputencoding = get_value(header, "\\inputencoding", 0)
+
+
+def normalize_language_name(document):
+    " Rename the languages brazil and portuges to brazilian and portuguese. "
+    lang = {"brazil": "brazilian", "portuges": "portuguese"}
+    if document.language in lang:
+        document.language = lang[document.language]
+        i = find_token(document.header, "\\language", 0)
+        if i != -1: # header[-1] would silently clobber the last header line
+            document.header[i] = "\\language %s" % document.language
+
+
+def revert_language_name(document):
+    " Rename the languages brazilian and portuguese back to brazil and portuges. "
+    lang = {"brazilian": "brazil", "portuguese": "portuges"}
+    if document.language in lang:
+        document.language = lang[document.language]
+        i = find_token(document.header, "\\language", 0)
+        if i != -1: # header[-1] would silently clobber the last header line
+            document.header[i] = "\\language %s" % document.language
+
+#
+#  \textclass cv -> \textclass simplecv
+def convert_cv_textclass(document):
+    " Rename the textclass cv to simplecv. "
+    if document.textclass == "cv": document.textclass = "simplecv"
+
+
+def revert_cv_textclass(document):
+    " Rename the textclass simplecv back to cv. "
+    if document.textclass == "simplecv": document.textclass = "cv"
+
+
+#
+# add scaleBeforeRotation graphics param
+def convert_graphics_rotation(document):
+    " Add the scaleBeforeRotation parameter to rotated and scaled graphics insets. "
+    i = 0
+    while 1:
+        i = find_token(document.body, "\\begin_inset Graphics", i)
+        if i == -1:
+            return
+        j = find_end_of_inset(document.body, i+1)
+        if j == -1:
+            # should not happen
+            document.warning("Malformed LyX document: Could not find end of graphics inset.")
+        # Only insets with rotateAngle and one of width, height or scale need the flag.
+        k = find_token(document.body, "\trotateAngle", i + 1, j)
+        l = find_tokens(document.body, ["\twidth", "\theight", "\tscale"], i + 1, j)
+        if (k != -1 and l != -1):
+            # with a leading tab: revert_graphics_rotation searches for "\tscaleBeforeRotation"
+            document.body.insert(j, '\tscaleBeforeRotation')
+        i = i + 1
+
+
+#
+# remove scaleBeforeRotation graphics param
+def revert_graphics_rotation(document):
+    " Remove the scaleBeforeRotation parameter from graphics insets. "
+    i = 0
+    while 1:
+        i = find_token(document.body, "\\begin_inset Graphics", i)
+        if i == -1:
+            return
+        j = find_end_of_inset(document.body, i + 1)
+        if j == -1:
+            # should not happen
+            document.warning("Malformed LyX document: Could not find end of graphics inset.")
+        # If there's a scaleBeforeRotation param, just remove that
+        # (convert_graphics_rotation may have written it without the leading tab)
+        k = find_tokens(document.body, ["\tscaleBeforeRotation", "scaleBeforeRotation"], i + 1, j)
+        if k != -1:
+            del document.body[k]
+        else:
+            # if not, and if we have rotateAngle and width or height or scale,
+            # we have to put the rotateAngle value to special
+            rotateAngle = get_value(document.body, 'rotateAngle', i + 1, j)
+            special = get_value(document.body, 'special', i + 1, j)
+            k = find_tokens(document.body, ["\twidth", "\theight", "\tscale"], i + 1, j)
+            # rotation without scaling: nothing to do, go on with the next inset
+            if rotateAngle != "" and k != -1:
+                if special == "":
+                    document.body.insert(j-1, '\tspecial angle=%s' % rotateAngle)
+                else:
+                    l = find_token(document.body, "\tspecial", i + 1, j)
+                    document.body[l] = document.body[l].replace(special, 'angle=%s,%s' % (rotateAngle, special))
+                k = find_token(document.body, "\trotateAngle", i + 1, j)
+                if k != -1:
+                    del document.body[k]
+        i = i + 1
+
+
+
+def convert_tableborder(document):
+    " Remove the '|' in front of '>{' on every line that also has a left line. "
+    # LyX ignored the "|" and doubled the border; since that is fixed the "|" has to go.
+    i = 0
+    while i < len(document.body):
+        h = document.body[i].find("leftline=\"true\"")
+        k = document.body[i].find("|>{")
+        # the two tokens have to be in one line
+        if (h != -1 and k != -1):
+            # delete the "|" only; the rest of the line is kept up to its last character
+            document.body[i] = document.body[i][:k] + document.body[i][k+1:]
+        i = i + 1
+
+
+def revert_tableborder(document):
+    " Put a '|' in front of the first '>{' on every line that has a left line. "
+    body = document.body
+    for n, line in enumerate(body):
+        cut = line.find(">{")
+        # both tokens have to be on the same line
+        if cut == -1 or line.find("leftline=\"true\"") == -1:
+            continue
+        # add the "|"
+        body[n] = line[:cut] + '|' + line[cut:]
+
+
+def revert_armenian(document):
+    " Revert armenian to english with the armtex package, armscii8 to auto. "
+    # set inputencoding from armscii8 to auto
+    if document.inputencoding == "armscii8":
+        pos = find_token(document.header, "\\inputencoding", 0)
+        if pos != -1:
+            document.header[pos] = "\\inputencoding auto"
+
+    # everything below only concerns armenian documents
+    if document.language != "armenian":
+        return
+
+    # the preamble counts as existing if any of its lines has a "\" or a "%"
+    has_preamble = False
+    for line in document.preamble:
+        if line.find("\\") != -1 or line.find("%") != -1:
+            has_preamble = True
+            break
+    if has_preamble:
+        # set the armtex entry as the first preamble line
+        document.preamble[0:0] = ["\\usepackage{armtex}"]
+    else:
+        # create the preamble when it doesn't exist
+        document.preamble.append('\\usepackage{armtex}')
+
+    # Set document language from armenian to english
+    document.language = "english"
+    pos = find_token(document.header, "\\language", 0)
+    if pos != -1:
+        document.header[pos] = "\\language english"
+
+
+def revert_CJK(document):
+    " Set CJK encodings to default and languages chinese, japanese and korean to english. "
+    cjk_encodings = ["Bg5", "Bg5+", "GB", "GBt", "GBK", "JIS",
+                     "KS", "SJIS", "UTF8", "EUC-TW", "EUC-JP"]
+    cjk_languages = ["chinese-simplified", "chinese-traditional", "japanese", "korean"]
+    header = document.header
+    pos = find_token(header, "\\inputencoding", 0)
+    if pos == -1:
+        header.append("\\inputencoding auto")
+    elif get_value(header, "\\inputencoding", pos) in cjk_encodings:
+        header[pos] = "\\inputencoding default"
+    document.inputencoding = get_value(header, "\\inputencoding", 0)
+
+    # the CJK languages are replaced by english
+    if document.language not in cjk_languages:
+        return
+    document.language = "english"
+    pos = find_token(header, "\\language", 0)
+    if pos != -1:
+        header[pos] = "\\language english"
+
+
+def revert_preamble_listings_params(document):
+    r" Revert the header option \listings_params to an \lstset in the preamble. "
+    i = find_token(document.header, "\\listings_params", 0)
+    if i != -1:
+        # everything after the token is the value: quoted parameters may contain blanks
+        params = document.header.pop(i)[len("\\listings_params"):].strip().strip('"')
+        document.preamble.extend(['\\usepackage{listings}', '\\lstset{%s}' % params])
+
+
+def revert_listings_inset(document):
+    r''' Revert listings inset to \lstinline or \begin, \end lstlisting, translate
+FROM
+
+\begin_inset listings
+lstparams "language=Delphi"
+inline true
+status open
+
+\begin_layout Standard
+var i = 10;
+\end_layout
+
+\end_inset
+
+TO
+
+\begin_inset ERT
+status open
+\begin_layout Standard
+
+
+\backslash
+lstinline[language=Delphi]{var i = 10;}
+\end_layout
+
+\end_inset
+
+There can be a caption inset in this inset
+
+\begin_layout Standard
+\begin_inset Caption
+
+\begin_layout Standard
+before label
+\begin_inset LatexCommand label
+name "lst:caption"
+
+\end_inset
+
+after label
+\end_layout
+
+\end_inset
+
+
+\end_layout
+
+'''
+    i = 0
+    while True:
+        i = find_token(document.body, '\\begin_inset listings', i)
+        if i == -1:
+            break
+        else:
+            if not '\\usepackage{listings}' in document.preamble:
+                document.preamble.append('\\usepackage{listings}')
+        j = find_end_of_inset(document.body, i + 1)
+        if j == -1:
+            # this should not happen
+            break
+        inline = 'false'
+        params = ''
+        status = 'open'
+        # the three lines after \begin_inset are scanned for the parameters (k is only set by a status line)
+        for line in range(i + 1, i + 4):
+            if document.body[line].startswith('inline'):
+                inline = document.body[line].split()[1]
+            if document.body[line].startswith('lstparams'):
+                params = document.body[line].split()[1].strip('"')
+            if document.body[line].startswith('status'):
+                status = document.body[line].split()[1].strip()
+                k = line + 1
+        # caption? NOTE(review): the search starts at i but is not limited to j, so it could find a caption behind this inset -- confirm
+        caption = ''
+        label = ''
+        cap = find_token(document.body, '\\begin_inset Caption', i)
+        if cap != -1:
+            cap_end = find_end_of_inset(document.body, cap + 1)
+            if cap_end == -1:
+                # this should not happen
+                break
+            # label?
+            lbl = find_token(document.body, '\\begin_inset LatexCommand label', cap + 1)
+            if lbl != -1:
+                lbl_end = find_end_of_inset(document.body, lbl + 1)
+                if lbl_end == -1:
+                    # this should not happen
+                    break
+            else:
+                lbl = cap_end
+                lbl_end = cap_end
+            for line in document.body[lbl : lbl_end + 1]:
+                if line.startswith('name '):
+                    label = line.split()[1].strip('"')
+                    break
+            for line in document.body[cap : lbl ] + document.body[lbl_end + 1 : cap_end + 1]:
+                if not line.startswith('\\'):
+                    caption += line.strip()
+            k = cap_end + 1
+        inlinecode = ''
+        # the code for lstinline is the line right before the end of the first default layout
+        inlinecode = document.body[find_end_of_layout(document.body, 
+            find_token(document.body,  '\\begin_layout %s' % document.default_layout, i + 1) +1 ) - 1]
+        if len(caption) > 0:
+            if len(params) == 0:
+                params = 'caption={%s}' % caption
+            else:
+                params += ',caption={%s}' % caption
+        if len(label) > 0:
+            if len(params) == 0:
+                params = 'label={%s}' % label
+            else:
+                params += ',label={%s}' % label
+        if len(params) > 0:
+            params = '[%s]' % params
+            params = params.replace('\\', '\\backslash\n')
+        if inline == 'true':
+            document.body[i:(j+1)] = [r'\begin_inset ERT',
+                                      'status %s' % status,
+                                      r'\begin_layout %s' % document.default_layout,
+                                      '', 
+                                      '',
+                                      r'\backslash',
+                                      'lstinline%s{%s}' % (params, inlinecode),
+                                      r'\end_layout',
+                                      '',
+                                      r'\end_inset']
+        else:
+            document.body[i: j+1] =  [r'\begin_inset ERT',
+                                      'status %s' % status,
+                                      '',
+                                      r'\begin_layout %s' % document.default_layout,
+                                      '',
+                                      '',
+                                      r'\backslash',
+                                      r'begin{lstlisting}%s' % params,
+                                      r'\end_layout',
+                                      '',
+                                      r'\begin_layout %s' % document.default_layout,
+                                    ] + document.body[k : j - 1] + \
+                                     ['',
+                                      r'\begin_layout %s' % document.default_layout,
+                                      '',
+                                      r'\backslash',
+                                      'end{lstlisting}',
+                                      r'\end_layout',
+                                      '',
+                                      r'\end_inset']
+            
+
+def revert_include_listings(document):
+    r''' Revert lstinputlisting Include option , translate
+\begin_inset Include \lstinputlisting{file}[opt]
+preview false
+
+\end_inset
+
+TO
+
+\begin_inset ERT
+status open
+
+\begin_layout Standard
+
+
+\backslash
+lstinputlisting[opt]{file}
+\end_layout
+
+\end_inset
+    '''
+
+    i = 0
+    while True:
+        i = find_token(document.body, r'\begin_inset Include \lstinputlisting', i)
+        if i == -1:
+            break
+        if not '\\usepackage{listings}' in document.preamble:
+            document.preamble.append('\\usepackage{listings}')
+        j = find_end_of_inset(document.body, i + 1)
+        if j == -1:
+            # this should not happen
+            break
+        # parse \lstinputlisting{file}[options]; file is everything up to the closing brace
+        cmd, filename, option = '', '', ''
+        found = re.match(r'\\(lstinputlisting){([^}]*)}(.*)', document.body[i].split(None, 2)[2])
+        if found:
+            cmd, filename, option = found.groups()
+        option = option.replace('\\', '\\backslash\n')
+        document.body[i : j + 1] = [r'\begin_inset ERT',
+                                    'status open',
+                                    '',
+                                    r'\begin_layout %s' % document.default_layout,
+                                    '',
+                                    '',
+                                    r'\backslash',
+                                    '%s%s{%s}' % (cmd, option, filename),
+                                    r'\end_layout',
+                                    '',
+                                    r'\end_inset']
+
+
+def revert_ext_font_sizes(document):
+    " Move the font sizes 10, 11 and 12 of the ext* classes to the class options. "
+    if document.backend != "latex" or not document.textclass.startswith("ext"):
+        return
+    header = document.header
+    size = get_value(header, '\\paperfontsize', 0)
+    if size not in ('10', '11', '12'):
+        return
+    size_option = size + 'pt'
+    header[find_token(header, '\\paperfontsize', 0)] = '\\paperfontsize default'
+    # append to the existing class options or add them right after \textclass
+    pos = find_token(header, '\\options', 0)
+    if pos != -1:
+        header[pos] += ',%s' % size_option
+    else:
+        pos = find_token(header, '\\textclass', 0) + 1
+        header.insert(pos, '\\options %s' % size_option)
+
+
+def convert_ext_font_sizes(document):
+    """ Move the font size of the ext* classes from \\options to \\paperfontsize.
+
+    Nothing is done unless the backend is latex, the textclass name starts
+    with "ext", \\paperfontsize is "default" and \\options holds an entry
+    that is exactly 10pt, 11pt or 12pt. Only the first such entry is moved.
+    """
+    if document.backend != "latex" or not document.textclass.startswith("ext"):
+        return
+
+    header = document.header
+    if get_value(header, '\\paperfontsize', 0) != 'default':
+        return
+
+    opt_pos = find_token(header, '\\options', 0)
+    if opt_pos == -1:
+        return
+
+    # entries are compared verbatim with the three known sizes
+    options = get_value(header, '\\options', opt_pos).split(',')
+    sizes = [opt for opt in options if opt in ('10pt', '11pt', '12pt')]
+    if not sizes:
+        return
+    # only the first size entry is taken out of the options
+    options.remove(sizes[0])
+
+    # "11pt" becomes "\paperfontsize 11"
+    size_pos = find_token(header, '\\paperfontsize', 0)
+    header[size_pos] = '\\paperfontsize %s' % sizes[0][:-2]
+
+    # drop the \options line altogether when the size was its only entry
+    if options:
+        header[opt_pos] = '\\options %s' % ','.join(options)
+    else:
+        del header[opt_pos]
+
+
+def revert_separator_layout(document):
+    r'''Revert --Separator-- to a lyx note
+From
+
+\begin_layout --Separator--
+something
+\end_layout
+
+to
+
+\begin_layout Standard
+\begin_inset Note Note
+status open
+
+\begin_layout Standard
+Separate Environment
+\end_layout
+
+\end_inset
+something
+
+\end_layout
+
+    '''
+
+    body = document.body
+    layout = r'\begin_layout %s' % document.default_layout
+    # the note that replaces the separator; the former content follows it
+    note = [layout,
+            r'\begin_inset Note Note',
+            'status open',
+            '',
+            layout,
+            'Separate Environment',
+            r'\end_layout',
+            '',
+            r'\end_inset']
+
+    start = find_token(body, r'\begin_layout --Separator--', 0)
+    while start != -1:
+        end = find_end_of_layout(body, start + 1)
+        if end == -1:
+            # this should not happen
+            break
+        # body[start] becomes a default layout, so the next search may begin there
+        body[start : end + 1] = note + body[start + 1 : end] + ['', r'\end_layout']
+        start = find_token(body, r'\begin_layout --Separator--', start)
+
+
+def convert_arabic (document):
+    " Rename the language arabic to arabic_arabtex in the header and in the body. "
+    if document.language == "arabic":
+        document.language = "arabic_arabtex"
+        i = find_token(document.header, "\\language", 0)
+        if i != -1:
+            document.header[i] = "\\language arabic_arabtex"
+    # any body line containing "\lang arabic" is replaced by the new language switch
+    i = 0
+    while i < len(document.body):
+        if document.body[i].find("\\lang arabic") != -1:
+            document.body[i] = '\\lang arabic_arabtex'
+        i = i + 1
+
+
+def revert_arabic (document):
+    " Rename the language arabic_arabtex back to arabic in the header and in the body. "
+    if document.language == "arabic_arabtex":
+        document.language = "arabic"
+        i = find_token(document.header, "\\language", 0)
+        if i != -1:
+            document.header[i] = "\\language arabic"
+    # any body line containing "\lang arabic_arabtex" is replaced by the old language switch
+    i = 0
+    while i < len(document.body):
+        if document.body[i].find("\\lang arabic_arabtex") != -1:
+            document.body[i] = '\\lang arabic'
+        i = i + 1
+
+
+##
+# Conversion hub: lists of [number, [functions]] entries, ascending for
+# convert and descending for revert (presumably file format numbers -- confirm)
+
+supported_versions = ["1.5.0","1.5"]
+convert = [[246, []],
+           [247, [convert_font_settings]],
+           [248, []],
+           [249, [convert_utf8]],
+           [250, []],
+           [251, []],
+           [252, [convert_commandparams, convert_bibitem]],
+           [253, []],
+           [254, [convert_esint]],
+           [255, []],
+           [256, []],
+           [257, [convert_caption]],
+           [258, [convert_lyxline]],
+           [259, [convert_accent, normalize_font_whitespace_259]],
+           [260, []],
+           [261, [convert_changes]],
+           [262, []],
+           [263, [normalize_language_name]],
+           [264, [convert_cv_textclass]],
+           [265, [convert_tableborder]],
+           [266, []],
+           [267, []],
+           [268, []],
+           [269, []],
+           [270, []],
+           [271, [convert_ext_font_sizes]],
+           [272, []],
+           [273, []],
+           [274, [normalize_font_whitespace_274]],
+           [275, [convert_graphics_rotation]],
+           [276, [convert_arabic]]
+          ]
+
+revert =  [
+           [275, [revert_arabic]],
+           [274, [revert_graphics_rotation]],
+           [273, []],
+           [272, [revert_separator_layout]],
+           [271, [revert_preamble_listings_params, revert_listings_inset, revert_include_listings]],
+           [270, [revert_ext_font_sizes]],
+           [269, [revert_beamer_alert, revert_beamer_structure]],
+           [268, [revert_preamble_listings_params, revert_listings_inset, revert_include_listings]],
+           [267, [revert_CJK]],
+           [266, [revert_utf8plain]],
+           [265, [revert_armenian]],
+           [264, [revert_tableborder]],
+           [263, [revert_cv_textclass]],
+           [262, [revert_language_name]],
+           [261, [revert_ascii]],
+           [260, []],
+           [259, [revert_utf8x]],
+           [258, []],
+           [257, []],
+           [256, [revert_caption]],
+           [255, [revert_encodings]],
+           [254, [revert_clearpage, revert_cleardoublepage]],
+           [253, [revert_esint]],
+           [252, [revert_nomenclature, revert_printnomenclature]],
+           [251, [revert_commandparams]],
+           [250, [revert_cs_label]],
+           [249, []],
+           [248, [revert_accent, revert_utf8, revert_unicode]],
+           [247, [revert_booktabs]],
+           [246, [revert_font_settings]],
+           [245, [revert_framed]]]
+
+
+if __name__ == "__main__":
+    pass
diff --git a/lib/lyx2lyx/parser_tools.py b/lib/lyx2lyx/parser_tools.py
index c204cd73a3..78459d21d9 100644
--- a/lib/lyx2lyx/parser_tools.py
+++ b/lib/lyx2lyx/parser_tools.py
@@ -1,6 +1,6 @@
 # This file is part of lyx2lyx
-# -*- coding: iso-8859-1 -*-
-# Copyright (C) 2002-2004 Dekel Tsur <dekel@lyx.org>, José Matos <jamatos@lyx.org>
+# -*- coding: utf-8 -*-
+# Copyright (C) 2002-2004 Dekel Tsur <dekel@lyx.org>, José Matos <jamatos@lyx.org>
 #
 # This program is free software; you can redistribute it and/or
 # modify it under the terms of the GNU General Public License
@@ -16,65 +16,93 @@
 # along with this program; if not, write to the Free Software
 # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
 
-import string
-import re
+" This module offers several free functions to help parse lines."
 
+# Utilities for one line
 def check_token(line, token):
-    if line[:len(token)] == token:
-        return 1
-    return 0
+    """ check_token(line, token) -> bool
+
+    Return True if token is present in line and is the first element
+    else returns False."""
+
+    return line[:len(token)] == token
 
 
-# We need to check that the char after the token is space, but I think
-# we can ignore this
-def find_token(lines, token, start, end = 0):
+def is_nonempty_line(line):
+    """ is_nonempty_line(line) -> bool
+
+    Return False if line is either empty or consists only of blanks
+    (space characters; a tab counts as content), else return True."""
+    return line != " "*len(line)
+
+
+# Utilities for a list of lines
+def find_token(lines, token, start, end = 0, exact = False):
+    """ find_token(lines, token, start[[, end], exact]) -> int
+
+    Return the lowest line where token is found, and is the first
+    element, in lines[start, end].
+
+    Return -1 on failure."""
+
     if end == 0:
         end = len(lines)
     m = len(token)
     for i in xrange(start, end):
-        if lines[i][:m] == token:
-            return i
-    return -1
-
-
-def find_token_exact(lines, token, start, end = 0):
-    if end == 0:
-        end = len(lines)
-    for i in xrange(start, end):
-        x = string.split(lines[i])
-        y = string.split(token)
-        if len(x) < len(y):
-            continue
-        if x[:len(y)] == y:
-            return i
-    return -1
-
-
-def find_tokens(lines, tokens, start, end = 0):
-    if end == 0:
-        end = len(lines)
-    for i in xrange(start, end):
-        for token in tokens:
-            if lines[i][:len(token)] == token:
-                return i
-    return -1
-
-
-def find_tokens_exact(lines, tokens, start, end = 0):
-    if end == 0:
-        end = len(lines)
-    for i in xrange(start, end):
-        for token in tokens:
-            x = string.split(lines[i])
-            y = string.split(token)
+        if exact:
+            x = lines[i].split()
+            y = token.split()
             if len(x) < len(y):
                 continue
             if x[:len(y)] == y:
                 return i
+        else:
+            if lines[i][:m] == token:
+                return i
     return -1
 
 
+def find_token_exact(lines, token, start, end = 0):
+    return find_token(lines, token, start, end, True)
+
+
+def find_tokens(lines, tokens, start, end = 0, exact = False):
+    """ find_tokens(lines, tokens, start[[, end], exact]) -> int
+
+    Return the lowest line where one token in tokens is found, and is
+    the first element, in lines[start, end].
+
+    Return -1 on failure."""
+    if end == 0:
+        end = len(lines)
+
+    for i in xrange(start, end):
+        for token in tokens:
+            if exact:
+                x = lines[i].split()
+                y = token.split()
+                if len(x) < len(y):
+                    continue
+                if x[:len(y)] == y:
+                    return i            
+            else:
+                if lines[i][:len(token)] == token:
+                    return i
+    return -1
+
+
+def find_tokens_exact(lines, tokens, start, end = 0):
+    return find_tokens(lines, tokens, start, end, True)
+
+
 def find_re(lines, rexp, start, end = 0):
+    """ find_token_re(lines, rexp, start[, end]) -> int
+
+    Return the lowest line where rexp, a regular expression, is found
+    in lines[start, end].
+
+    Return -1 on failure."""
+
     if end == 0:
         end = len(lines)
     for i in xrange(start, end):
@@ -84,6 +112,12 @@ def find_re(lines, rexp, start, end = 0):
 
 
 def find_token_backwards(lines, token, start):
+    """ find_token_backwards(lines, token, start) -> int
+
+    Return the highest line where token is found, and is the first
+    element, in lines[start, end].
+
+    Return -1 on failure."""
     m = len(token)
     for i in xrange(start, -1, -1):
         line = lines[i]
@@ -93,6 +127,12 @@ def find_token_backwards(lines, token, start):
 
 
 def find_tokens_backwards(lines, tokens, start):
+    """ find_tokens_backwards(lines, token, start) -> int
+
+    Return the highest line where token is found, and is the first
+    element, in lines[end, start].
+
+    Return -1 on failure."""
     for i in xrange(start, -1, -1):
         line = lines[i]
         for token in tokens:
@@ -101,82 +141,43 @@ def find_tokens_backwards(lines, tokens, start):
     return -1
 
 
-def get_value(lines, token, start, end = 0):
+def get_value(lines, token, start, end = 0, default = ""):
+    """ get_value(lines, token, start[[, end], default]) -> string
+
+    Return the word following token on the first line, in lines, where
+    token is the first element; default if the line or the word is missing."""
+
     i = find_token_exact(lines, token, start, end)
     if i == -1:
-        return ""
-    if len(string.split(lines[i])) > 1:
-        return string.split(lines[i])[1]
+        return default
+    if len(lines[i].split()) > 1:
+        return lines[i].split()[1]
     else:
-        return ""
+        return default
 
 
-def get_layout(line, default_layout):
-    tokens = string.split(line)
-    if len(tokens) > 1:
-        return tokens[1]
-    return default_layout
+def del_token(lines, token, start, end):
+    """ del_token(lines, token, start, end) -> int
 
+    Find the lower line in lines where token is the first element and
+    delete that line.
 
-def del_token(lines, token, i, j):
-    k = find_token_exact(lines, token, i, j)
+    Returns the number of lines remaining."""
+
+    k = find_token_exact(lines, token, start, end)
     if k == -1:
-        return j
+        return end
     else:
         del lines[k]
-        return j-1
+        return end - 1
 
 
-# Finds the paragraph that contains line i.
-def get_paragraph(lines, i, format):
-    if format < 225:
-        begin_layout = "\\layout"
-    else:
-        begin_layout = "\\begin_layout"
-    while i != -1:
-        i = find_tokens_backwards(lines, ["\\end_inset", begin_layout], i)
-        if i == -1: return -1
-        if check_token(lines[i], begin_layout):
-            return i
-        i = find_beginning_of_inset(lines, i)
-    return -1
-
-
-# Finds the paragraph after the paragraph that contains line i.
-def get_next_paragraph(lines, i, format):
-    if format < 225:
-        tokens = ["\\begin_inset", "\\layout", "\\end_float", "\\the_end"]
-    elif format < 236:
-        tokens = ["\\begin_inset", "\\begin_layout", "\\end_float", "\\end_document"]
-    else:
-        tokens = ["\\begin_inset", "\\begin_layout", "\\end_float", "\\end_body", "\\end_document"]
-    while i != -1:
-        i = find_tokens(lines, tokens, i)
-        if not check_token(lines[i], "\\begin_inset"):
-            return i
-        i = find_end_of_inset(lines, i)
-    return -1
-
-
-def find_end_of(lines, i, start_token, end_token):
-    count = 1
-    n = len(lines)
-    while i < n:
-        i = find_tokens(lines, [end_token, start_token], i+1)
-        if check_token(lines[i], start_token):
-            count = count+1
-        else:
-            count = count-1
-        if count == 0:
-            return i
-    return -1
-
-
-# Finds the matching \end_inset
 def find_beginning_of(lines, i, start_token, end_token):
     count = 1
     while i > 0:
         i = find_tokens_backwards(lines, [start_token, end_token], i-1)
+        if i == -1:
+            return -1
         if check_token(lines[i], end_token):
             count = count+1
         else:
@@ -186,38 +187,20 @@ def find_beginning_of(lines, i, start_token, end_token):
     return -1
 
 
-# Finds the matching \end_inset
-def find_end_of_inset(lines, i):
-    return find_end_of(lines, i, "\\begin_inset", "\\end_inset")
-
-
-# Finds the matching \end_inset
-def find_beginning_of_inset(lines, i):
-    return find_beginning_of(lines, i, "\\begin_inset", "\\end_inset")
-
-
-def find_end_of_tabular(lines, i):
-    return find_end_of(lines, i, "<lyxtabular", "</lyxtabular")
-
-
-def get_tabular_lines(lines, i):
-    result = []
-    i = i+1
-    j = find_end_of_tabular(lines, i)
-    if j == -1:
-        return []
-
-    while i <= j:
-        if check_token(lines[i], "\\begin_inset"):
-            i = find_end_of_inset(lines, i)+1
+def find_end_of(lines, i, start_token, end_token):
+    count = 1
+    n = len(lines)
+    while i < n:
+        i = find_tokens(lines, [end_token, start_token], i+1)
+        if i == -1:
+            return -1
+        if check_token(lines[i], start_token):
+            count = count+1
         else:
-            result.append(i)
-            i = i+1
-    return result
-
-
-def is_nonempty_line(line):
-    return line != " "*len(line)
+            count = count-1
+        if count == 0:
+            return i
+    return -1
 
 
 def find_nonempty_line(lines, start, end = 0):
diff --git a/lib/lyx2lyx/profiling.py b/lib/lyx2lyx/profiling.py
index d249675a14..b97bc22d1b 100755
--- a/lib/lyx2lyx/profiling.py
+++ b/lib/lyx2lyx/profiling.py
@@ -1,6 +1,6 @@
 #! /usr/bin/env python
-# -*- coding: iso-8859-1 -*-
-# Copyright (C) 2004 José Matos <jamatos@lyx.org>
+# -*- coding: utf-8 -*-
+# Copyright (C) 2004 José Matos <jamatos@lyx.org>
 #
 # This program is free software; you can redistribute it and/or
 # modify it under the terms of the GNU General Public License
diff --git a/lib/unicodesymbols b/lib/unicodesymbols
new file mode 100644
index 0000000000..a582cc15c9
--- /dev/null
+++ b/lib/unicodesymbols
@@ -0,0 +1,1399 @@
+#
+# file unicodesymbols
+# This file is part of LyX, the document processor.
+# Licence details can be found in the file COPYING.
+#
+# author Georg Baum
+# author Uwe Stöhr
+#
+# Full author contact details are available in file CREDITS.
+
+# This file is a database of LaTeX commands for unicode characters.
+# These commands will be used by LyX for LaTeX export for all characters
+# that are not representable in the chosen encoding.
+
+# If you change this file please keep the order and indentation!
+# You can use development/tools/unicodesymbols.py to add stubs for more
+# symbols.
+# Only add commands that give correct output; do not add hacks that merely look "similar".
+# Commands that modify other parts of the text should not be added either.
+
+# syntax:
+# ucs4 command                    preamble flags
+# preamble can either be a feature known by the LaTeXFeatures class (e.g.
+# tipa), or a LaTeX command (e.g. \\usepackage{bla}).
+# Known flags:
+# - combining This is a combining char that will get combined with a base char
+# - force     Always output replacement command
+
+0x00a0 "~"                        "" "" # NO-BREAK SPACE
+0x00a1 "\\textexclamdown"         "" "" # INVERTED EXCLAMATION MARK
+0x00a2 "\\textcent"               "textcomp" "" # CENT SIGN
+0x00a3 "\\pounds"                 "" "" # £ POUND SIGN
+0x00a4 "\\textcurrency"           "textcomp" "" # CURRENCY SYMBOL
+0x00a5 "\\textyen"                "textcomp" "" # YEN SIGN
+0x00a6 "\\textbrokenbar"          "textcomp" "" # BROKEN BAR
+0x00a7 "\\textsection"            "textcomp" "" # SECTION SIGN
+0x00a8 "\\textasciidieresis"      "textcomp" "" # DIAERESIS
+0x00a9 "\\textcopyright"          "textcomp" "" # COPYRIGHT SIGN
+0x00aa "\\textordfeminine"        "textcomp" "" # FEMININE ORDINAL INDICATOR
+0x00ab "\\guillemotleft"          "" "" # LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
+0x00ac "\\textlnot"               "textcomp" "force" # ¬ NOT SIGN
+0x00ad "\\-"                      "" "" # SOFT HYPHEN
+0x00ae "\\textregistered"         "textcomp" "" # REGISTERED SIGN
+0x00af "\\textasciimacron"        "textcomp" "" # MACRON
+0x00b0 "\\textdegree"             "textcomp" "" # DEGREE SIGN
+0x00b1 "\\textpm"                 "textcomp" "force" # ± PLUS-MINUS SIGN
+0x00b2 "\\texttwosuperior"        "textcomp" "force" # ² SUPERSCRIPT TWO
+0x00b3 "\\textthreesuperior"      "textcomp" "force" # ³ SUPERSCRIPT THREE
+0x00b4 "\\textasciiacute"         "textcomp" "" # ACUTE ACCENT
+0x00b5 "\\textmu"                 "textcomp" "force" # µ MICRO SIGN
+0x00b6 "\\textparagraph"          "textcomp" "" # PILCROW SIGN # not equal to \textpilcrow
+0x00b7 "\\textperiodcentered"     "" "" # MIDDLE DOT
+0x00b8 "\\c\\ "                   "" "" # CEDILLA (command from latin1.def)
+0x00b9 "\\textonesuperior"        "textcomp" "force" # ¹ SUPERSCRIPT ONE
+0x00ba "\\textordmasculine"       "textcomp" "" # MASCULINE ORDINAL INDICATOR
+0x00bb "\\guillemotright"         "" "" # RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
+0x00bc "\\textonequarter"         "textcomp" "" # 1/4 FRACTION
+0x00bd "\\textonehalf"            "textcomp" "" # 1/2 FRACTION
+0x00be "\\textthreequarters"      "textcomp" "" # 3/4 FRACTION
+0x00bf "\\textquestiondown"       "" "" # INVERTED QUESTION MARK
+0x00c0 "\\`{A}"                   "" "" # LATIN CAPITAL LETTER A WITH GRAVE
+0x00c1 "\\'{A}"                   "" "" # LATIN CAPITAL LETTER A WITH ACUTE
+0x00c2 "\\^{A}"                   "" "" # LATIN CAPITAL LETTER A WITH CIRCUMFLEX
+0x00c3 "\\~{A}"                   "" "" # LATIN CAPITAL LETTER A WITH TILDE
+0x00c4 "\\\"{A}"                  "" "" # LATIN CAPITAL LETTER A WITH DIAERESIS
+0x00c5 "\\r{A}"                   "" "" # LATIN CAPITAL LETTER A WITH RING ABOVE
+0x00c6 "\\AE"                     "" "" # LATIN CAPITAL LETTER AE
+0x00c7 "\\c{C}"                   "" "" # LATIN CAPITAL LETTER C WITH CEDILLA
+0x00c8 "\\`{E}"                   "" "" # LATIN CAPITAL LETTER E WITH GRAVE
+0x00c9 "\\'{E}"                   "" "" # LATIN CAPITAL LETTER E WITH ACUTE
+0x00ca "\\^{E}"                   "" "" # LATIN CAPITAL LETTER E WITH CIRCUMFLEX
+0x00cb "\\\"{E}"                  "" "" # LATIN CAPITAL LETTER E WITH DIAERESIS
+0x00cc "\\`{I}"                   "" "" # LATIN CAPITAL LETTER I WITH GRAVE
+0x00cd "\\'{I}"                   "" "" # LATIN CAPITAL LETTER I WITH ACUTE
+0x00ce "\\^{I}"                   "" "" # LATIN CAPITAL LETTER I WITH CIRCUMFLEX
+0x00cf "\\\"{I}"                  "" "" # LATIN CAPITAL LETTER I WITH DIAERESIS
+0x00d0 "\\DH"                     "" "" # LATIN CAPITAL LETTER ETH
+0x00d1 "\\~{N}"                   "" "" # LATIN CAPITAL LETTER N WITH TILDE
+0x00d2 "\\`{O}"                   "" "" # LATIN CAPITAL LETTER O WITH GRAVE
+0x00d3 "\\'{O}"                   "" "" # LATIN CAPITAL LETTER O WITH ACUTE
+0x00d4 "\\^{O}"                   "" "" # LATIN CAPITAL LETTER O WITH CIRCUMFLEX
+0x00d5 "\\~{O}"                   "" "" # LATIN CAPITAL LETTER O WITH TILDE
+0x00d6 "\\\"{O}"                  "" "" # LATIN CAPITAL LETTER O WITH DIAERESIS
+0x00d7 "\\texttimes"              "textcomp" "force" # × MULTIPLICATION SIGN
+0x00d8 "\\O"                      "" "" # LATIN CAPITAL LETTER O WITH STROKE
+0x00d9 "\\`{U}"                   "" "" # LATIN CAPITAL LETTER U WITH GRAVE
+0x00da "\\'{U}"                   "" "" # LATIN CAPITAL LETTER U WITH ACUTE
+0x00db "\\^{U}"                   "" "" # LATIN CAPITAL LETTER U WITH CIRCUMFLEX
+0x00dc "\\\"{U}"                  "" "" # LATIN CAPITAL LETTER U WITH DIAERESIS
+0x00dd "\\'{Y}"                   "" "" # LATIN CAPITAL LETTER Y WITH ACUTE
+0x00de "\\TH"                     "" "" # LATIN CAPITAL LETTER THORN
+0x00df "\\ss"                     "" "" # LATIN SMALL LETTER SHARP S
+0x00e0 "\\`{a}"                   "" "" # LATIN SMALL LETTER A WITH GRAVE
+0x00e1 "\\'{a}"                   "" "" # LATIN SMALL LETTER A WITH ACUTE
+0x00e2 "\\^{a}"                   "" "" # LATIN SMALL LETTER A WITH CIRCUMFLEX
+0x00e3 "\\~{a}"                   "" "" # LATIN SMALL LETTER A WITH TILDE
+0x00e4 "\\\"{a}"                  "" "" # LATIN SMALL LETTER A WITH DIAERESIS
+0x00e5 "\\r{a}"                   "" "" # LATIN SMALL LETTER A WITH RING ABOVE
+0x00e6 "\\ae"                     "" "" # LATIN SMALL LETTER AE
+0x00e7 "\\c{c}"                   "" "" # LATIN SMALL LETTER C WITH CEDILLA
+0x00e8 "\\`{e}"                   "" "" # LATIN SMALL LETTER E WITH GRAVE
+0x00e9 "\\'{e}"                   "" "" # LATIN SMALL LETTER E WITH ACUTE
+0x00ea "\\^{e}"                   "" "" # LATIN SMALL LETTER E WITH CIRCUMFLEX
+0x00eb "\\\"{e}"                  "" "" # LATIN SMALL LETTER E WITH DIAERESIS
+0x00ec "\\`{\\i}"                 "" "" # LATIN SMALL LETTER I WITH GRAVE
+0x00ed "\\'{\\i}"                 "" "" # LATIN SMALL LETTER I WITH ACUTE
+0x00ee "\\^{\\i}"                 "" "" # LATIN SMALL LETTER I WITH CIRCUMFLEX
+0x00ef "\\\"{\\i}"                "" "" # LATIN SMALL LETTER I WITH DIAERESIS
+0x00f0 "\\dh"                     "" "" # LATIN SMALL LETTER ETH
+0x00f1 "\\~{n}"                   "" "" # LATIN SMALL LETTER N WITH TILDE
+0x00f2 "\\`{o}"                   "" "" # LATIN SMALL LETTER O WITH GRAVE
+0x00f3 "\\'{o}"                   "" "" # LATIN SMALL LETTER O WITH ACUTE
+0x00f4 "\\^{o}"                   "" "" # LATIN SMALL LETTER O WITH CIRCUMFLEX
+0x00f5 "\\~{o}"                   "" "" # LATIN SMALL LETTER O WITH TILDE
+0x00f6 "\\\"{o}"                  "" "" # LATIN SMALL LETTER O WITH DIAERESIS
+0x00f7 "\\textdiv"                "textcomp" "force" # ÷ DIVISION SIGN
+0x00f8 "\\o"                      "" "" # LATIN SMALL LETTER O WITH STROKE
+0x00f9 "\\`{u}"                   "" "" # LATIN SMALL LETTER U WITH GRAVE
+0x00fa "\\'{u}"                   "" "" # LATIN SMALL LETTER U WITH ACUTE
+0x00fb "\\^{u}"                   "" "" # LATIN SMALL LETTER U WITH CIRCUMFLEX
+0x00fc "\\\"{u}"                  "" "" # LATIN SMALL LETTER U WITH DIAERESIS
+0x00fd "\\'{y}"                   "" "" # LATIN SMALL LETTER Y WITH ACUTE
+0x00fe "\\th"                     "" "" # LATIN SMALL LETTER THORN
+0x00ff "\\\"{y}"                  "" "" # LATIN SMALL LETTER Y WITH DIAERESIS
+0x0100 "\\={A}"                   "" "" # LATIN CAPITAL LETTER A WITH MACRON
+0x0101 "\\={a}"                   "" "" # LATIN SMALL LETTER A WITH MACRON
+0x0102 "\\u{A}"                   "" "" # LATIN CAPITAL LETTER A WITH BREVE
+0x0103 "\\u{a}"                   "" "" # LATIN SMALL LETTER A WITH BREVE
+0x0104 "\\k{A}"                   "" "" # LATIN CAPITAL LETTER A WITH OGONEK
+0x0105 "\\k{a}"                   "" "" # LATIN SMALL LETTER A WITH OGONEK
+0x0106 "\\'{C}"                   "" "" # LATIN CAPITAL LETTER C WITH ACUTE
+0x0107 "\\'{c}"                   "" "" # LATIN SMALL LETTER C WITH ACUTE
+0x0108 "\\^{C}"                   "" "" # LATIN CAPITAL LETTER C WITH CIRCUMFLEX
+0x0109 "\\^{c}"                   "" "" # LATIN SMALL LETTER C WITH CIRCUMFLEX
+0x010a "\\.{C}"                   "" "" # LATIN CAPITAL LETTER C WITH DOT ABOVE
+0x010b "\\.{c}"                   "" "" # LATIN SMALL LETTER C WITH DOT ABOVE
+0x010c "\\v{C}"                   "" "" # LATIN CAPITAL LETTER C WITH CARON
+0x010d "\\v{c}"                   "" "" # LATIN SMALL LETTER C WITH CARON
+0x010e "\\v{D}"                   "" "" # LATIN CAPITAL LETTER D WITH CARON
+0x010f "\\v{d}"                   "" "" # LATIN SMALL LETTER D WITH CARON
+0x0110 "\\DJ"                     "" "" # LATIN CAPITAL LETTER D WITH STROKE
+0x0111 "\\dj"                     "" "" # LATIN SMALL LETTER D WITH STROKE
+0x0112 "\\={E}"                   "" "" # LATIN CAPITAL LETTER E WITH MACRON
+0x0113 "\\={e}"                   "" "" # LATIN SMALL LETTER E WITH MACRON
+0x0114 "\\u{E}"                   "" "" # LATIN CAPITAL LETTER E WITH BREVE
+0x0115 "\\u{e}"                   "" "" # LATIN SMALL LETTER E WITH BREVE
+0x0116 "\\.{E}"                   "" "" # LATIN CAPITAL LETTER E WITH DOT ABOVE
+0x0117 "\\.{e}"                   "" "" # LATIN SMALL LETTER E WITH DOT ABOVE
+0x0118 "\\k{E}"                   "" "" # LATIN CAPITAL LETTER E WITH OGONEK
+0x0119 "\\k{e}"                   "" "" # LATIN SMALL LETTER E WITH OGONEK
+0x011a "\\v{E}"                   "" "" # LATIN CAPITAL LETTER E WITH CARON
+0x011b "\\v{e}"                   "" "" # LATIN SMALL LETTER E WITH CARON
+0x011c "\\^{G}"                   "" "" # LATIN CAPITAL LETTER G WITH CIRCUMFLEX
+0x011d "\\^{g}"                   "" "" # LATIN SMALL LETTER G WITH CIRCUMFLEX
+0x011e "\\u{G}"                   "" "" # LATIN CAPITAL LETTER G WITH BREVE
+0x011f "\\u{g}"                   "" "" # LATIN SMALL LETTER G WITH BREVE
+0x0120 "\\.{G}"                   "" "" # LATIN CAPITAL LETTER G WITH DOT ABOVE
+0x0121 "\\.{g}"                   "" "" # LATIN SMALL LETTER G WITH DOT ABOVE
+0x0122 "\\c{G}"                   "" "" # LATIN CAPITAL LETTER G WITH CEDILLA
+0x0123 "\\c{g}"                   "" "" # LATIN SMALL LETTER G WITH CEDILLA
+0x0124 "\\^{H}"                   "" "" # LATIN CAPITAL LETTER H WITH CIRCUMFLEX
+0x0125 "\\^{h}"                   "" "" # LATIN SMALL LETTER H WITH CIRCUMFLEX
+#0x0126 ""                         "" "" # LATIN CAPITAL LETTER H WITH STROKE
+#0x0127 ""                         "" "" # LATIN SMALL LETTER H WITH STROKE
+0x0128 "\\~{I}"                   "" "" # LATIN CAPITAL LETTER I WITH TILDE
+0x0129 "\\~{\\i}"                 "" "" # LATIN SMALL LETTER I WITH TILDE
+0x012a "\\={I}"                   "" "" # LATIN CAPITAL LETTER I WITH MACRON
+0x012b "\\={\\i}"                 "" "" # LATIN SMALL LETTER I WITH MACRON
+0x012c "\\u{I}"                   "" "" # LATIN CAPITAL LETTER I WITH BREVE
+0x012d "\\u{\\i}"                 "" "" # LATIN SMALL LETTER I WITH BREVE
+0x012e "\\k{I}"                   "" "" # LATIN CAPITAL LETTER I WITH OGONEK
+0x012f "\\k{i}"                   "" "" # LATIN SMALL LETTER I WITH OGONEK
+0x0130 "\\.{I}"                   "" "" # LATIN CAPITAL LETTER I WITH DOT ABOVE
+0x0131 "\\i"                      "" "" # LATIN SMALL LETTER DOTLESS I
+#0x0132 ""                         "" "" # LATIN CAPITAL LIGATURE IJ
+#0x0133 ""                         "" "" # LATIN SMALL LIGATURE IJ
+0x0134 "\\^{J}"                   "" "" # LATIN CAPITAL LETTER J WITH CIRCUMFLEX
+0x0135 "\\^{\\j}"                 "" "" # LATIN SMALL LETTER J WITH CIRCUMFLEX
+0x0136 "\\c{K}"                   "" "" # LATIN CAPITAL LETTER K WITH CEDILLA
+0x0137 "\\c{k}"                   "" "" # LATIN SMALL LETTER K WITH CEDILLA
+#0x0138 ""                         "" "" # LATIN SMALL LETTER KRA
+0x0139 "\\'{L}"                   "" "" # LATIN CAPITAL LETTER L WITH ACUTE
+0x013a "\\'{l}"                   "" "" # LATIN SMALL LETTER L WITH ACUTE
+0x013b "\\c{L}"                   "" "" # LATIN CAPITAL LETTER L WITH CEDILLA
+0x013c "\\c{l}"                   "" "" # LATIN SMALL LETTER L WITH CEDILLA
+0x013d "\\v{L}"                   "" "" # LATIN CAPITAL LETTER L WITH CARON
+0x013e "\\v{l}"                   "" "" # LATIN SMALL LETTER L WITH CARON
+#0x013f ""                         "" "" # LATIN CAPITAL LETTER L WITH MIDDLE DOT
+#0x0140 ""                         "" "" # LATIN SMALL LETTER L WITH MIDDLE DOT
+0x0141 "\\L"                      "" "" # LATIN CAPITAL LETTER L WITH STROKE
+0x0142 "\\l"                      "" "" # LATIN SMALL LETTER L WITH STROKE
+0x0143 "\\'{N}"                   "" "" # LATIN CAPITAL LETTER N WITH ACUTE
+0x0144 "\\'{n}"                   "" "" # LATIN SMALL LETTER N WITH ACUTE
+0x0145 "\\c{N}"                   "" "" # LATIN CAPITAL LETTER N WITH CEDILLA
+0x0146 "\\c{n}"                   "" "" # LATIN SMALL LETTER N WITH CEDILLA
+0x0147 "\\v{N}"                   "" "" # LATIN CAPITAL LETTER N WITH CARON
+0x0148 "\\v{n}"                   "" "" # LATIN SMALL LETTER N WITH CARON
+#0x0149 ""                         "" "" # LATIN SMALL LETTER N PRECEDED BY APOSTROPHE
+0x014a "\\NG"                     "" "" # LATIN CAPITAL LETTER ENG
+0x014b "\\ng"                     "" "" # LATIN SMALL LETTER ENG
+0x014c "\\={O}"                   "" "" # LATIN CAPITAL LETTER O WITH MACRON
+0x014d "\\={o}"                   "" "" # LATIN SMALL LETTER O WITH MACRON
+0x014e "\\u{O}"                   "" "" # LATIN CAPITAL LETTER O WITH BREVE
+0x014f "\\u{o}"                   "" "" # LATIN SMALL LETTER O WITH BREVE
+0x0150 "\\H{O}"                   "" "" # LATIN CAPITAL LETTER O WITH DOUBLE ACUTE
+0x0151 "\\H{o}"                   "" "" # LATIN SMALL LETTER O WITH DOUBLE ACUTE
+0x0152 "\\OE"                     "" "" # LATIN CAPITAL LIGATURE OE
+0x0153 "\\oe"                     "" "" # LATIN SMALL LIGATURE OE
+0x0154 "\\'{R}"                   "" "" # LATIN CAPITAL LETTER R WITH ACUTE
+0x0155 "\\'{r}"                   "" "" # LATIN SMALL LETTER R WITH ACUTE
+0x0156 "\\c{R}"                   "" "" # LATIN CAPITAL LETTER R WITH CEDILLA
+0x0157 "\\c{r}"                   "" "" # LATIN SMALL LETTER R WITH CEDILLA
+0x0158 "\\v{R}"                   "" "" # LATIN CAPITAL LETTER R WITH CARON
+0x0159 "\\v{r}"                   "" "" # LATIN SMALL LETTER R WITH CARON
+0x015a "\\'{S}"                   "" "" # LATIN CAPITAL LETTER S WITH ACUTE
+0x015b "\\'{s}"                   "" "" # LATIN SMALL LETTER S WITH ACUTE
+0x015c "\\^{S}"                   "" "" # LATIN CAPITAL LETTER S WITH CIRCUMFLEX
+0x015d "\\^{s}"                   "" "" # LATIN SMALL LETTER S WITH CIRCUMFLEX
+0x015e "\\c{S}"                   "" "" # LATIN CAPITAL LETTER S WITH CEDILLA
+0x015f "\\c{s}"                   "" "" # LATIN SMALL LETTER S WITH CEDILLA
+0x0160 "\\v{S}"                   "" "" # LATIN CAPITAL LETTER S WITH CARON
+0x0161 "\\v{s}"                   "" "" # LATIN SMALL LETTER S WITH CARON
+0x0162 "\\c{T}"                   "" "" # LATIN CAPITAL LETTER T WITH CEDILLA
+0x0163 "\\c{t}"                   "" "" # LATIN SMALL LETTER T WITH CEDILLA
+0x0164 "\\v{T}"                   "" "" # LATIN CAPITAL LETTER T WITH CARON
+0x0165 "\\v{t}"                   "" "" # LATIN SMALL LETTER T WITH CARON
+#0x0166 ""                         "" "" # LATIN CAPITAL LETTER T WITH STROKE
+#0x0167 ""                         "" "" # LATIN SMALL LETTER T WITH STROKE
+0x0168 "\\~{U}"                   "" "" # LATIN CAPITAL LETTER U WITH TILDE
+0x0169 "\\~{u}"                   "" "" # LATIN SMALL LETTER U WITH TILDE
+0x016a "\\={U}"                   "" "" # LATIN CAPITAL LETTER U WITH MACRON
+0x016b "\\={u}"                   "" "" # LATIN SMALL LETTER U WITH MACRON
+0x016c "\\u{U}"                   "" "" # LATIN CAPITAL LETTER U WITH BREVE
+0x016d "\\u{u}"                   "" "" # LATIN SMALL LETTER U WITH BREVE
+0x016e "\\r{U}"                   "" "" # LATIN CAPITAL LETTER U WITH RING ABOVE
+0x016f "\\r{u}"                   "" "" # LATIN SMALL LETTER U WITH RING ABOVE
+0x0170 "\\H{U}"                   "" "" # LATIN CAPITAL LETTER U WITH DOUBLE ACUTE
+0x0171 "\\H{u}"                   "" "" # LATIN SMALL LETTER U WITH DOUBLE ACUTE
+0x0172 "\\k{U}"                   "" "" # LATIN CAPITAL LETTER U WITH OGONEK
+0x0173 "\\k{u}"                   "" "" # LATIN SMALL LETTER U WITH OGONEK
+0x0174 "\\^{W}"                   "" "" # LATIN CAPITAL LETTER W WITH CIRCUMFLEX
+0x0175 "\\^{w}"                   "" "" # LATIN SMALL LETTER W WITH CIRCUMFLEX
+0x0176 "\\^{Y}"                   "" "" # LATIN CAPITAL LETTER Y WITH CIRCUMFLEX
+0x0177 "\\^{y}"                   "" "" # LATIN SMALL LETTER Y WITH CIRCUMFLEX
+0x0178 "\\\"{Y}"                  "" "" # LATIN CAPITAL LETTER Y WITH DIAERESIS
+0x0179 "\\'{Z}"                   "" "" # LATIN CAPITAL LETTER Z WITH ACUTE
+0x017a "\\'{z}"                   "" "" # LATIN SMALL LETTER Z WITH ACUTE
+0x017b "\\.{Z}"                   "" "" # LATIN CAPITAL LETTER Z WITH DOT ABOVE
+0x017c "\\.{z}"                   "" "" # LATIN SMALL LETTER Z WITH DOT ABOVE
+0x017d "\\v{Z}"                   "" "" # LATIN CAPITAL LETTER Z WITH CARON
+0x017e "\\v{z}"                   "" "" # LATIN SMALL LETTER Z WITH CARON
+#0x017f ""                         "" "" # LATIN SMALL LETTER LONG S
+#0x0180 ""                         "" "" # LATIN SMALL LETTER B WITH STROKE
+#0x0181 ""                         "" "" # LATIN CAPITAL LETTER B WITH HOOK
+#0x0182 ""                         "" "" # LATIN CAPITAL LETTER B WITH TOPBAR
+#0x0183 ""                         "" "" # LATIN SMALL LETTER B WITH TOPBAR
+#0x0184 ""                         "" "" # LATIN CAPITAL LETTER TONE SIX
+#0x0185 ""                         "" "" # LATIN SMALL LETTER TONE SIX
+#0x0186 ""                         "" "" # LATIN CAPITAL LETTER OPEN O
+#0x0187 ""                         "" "" # LATIN CAPITAL LETTER C WITH HOOK
+#0x0188 ""                         "" "" # LATIN SMALL LETTER C WITH HOOK
+#0x0189 ""                         "" "" # LATIN CAPITAL LETTER AFRICAN D
+#0x018a ""                         "" "" # LATIN CAPITAL LETTER D WITH HOOK
+#0x018b ""                         "" "" # LATIN CAPITAL LETTER D WITH TOPBAR
+#0x018c ""                         "" "" # LATIN SMALL LETTER D WITH TOPBAR
+#0x018d ""                         "" "" # LATIN SMALL LETTER TURNED DELTA
+#0x018e ""                         "" "" # LATIN CAPITAL LETTER REVERSED E
+#0x018f ""                         "" "" # LATIN CAPITAL LETTER SCHWA
+#0x0190 ""                         "" "" # LATIN CAPITAL LETTER OPEN E
+#0x0191 ""                         "" "" # LATIN CAPITAL LETTER F WITH HOOK
+0x0192 "\\textflorin"             "textcomp" "" # LATIN SMALL LETTER F WITH HOOK
+#0x0193 ""                         "" "" # LATIN CAPITAL LETTER G WITH HOOK
+#0x0194 ""                         "" "" # LATIN CAPITAL LETTER GAMMA
+#0x0195 ""                         "" "" # LATIN SMALL LETTER HV
+#0x0196 ""                         "" "" # LATIN CAPITAL LETTER IOTA
+#0x0197 ""                         "" "" # LATIN CAPITAL LETTER I WITH STROKE
+#0x0198 ""                         "" "" # LATIN CAPITAL LETTER K WITH HOOK
+#0x0199 ""                         "" "" # LATIN SMALL LETTER K WITH HOOK
+#0x019a ""                         "" "" # LATIN SMALL LETTER L WITH BAR
+#0x019b ""                         "" "" # LATIN SMALL LETTER LAMBDA WITH STROKE
+#0x019c ""                         "" "" # LATIN CAPITAL LETTER TURNED M
+#0x019d ""                         "" "" # LATIN CAPITAL LETTER N WITH LEFT HOOK
+#0x019e ""                         "" "" # LATIN SMALL LETTER N WITH LONG RIGHT LEG
+#0x019f ""                         "" "" # LATIN CAPITAL LETTER O WITH MIDDLE TILDE
+#0x01a0 ""                         "" "" # LATIN CAPITAL LETTER O WITH HORN
+#0x01a1 ""                         "" "" # LATIN SMALL LETTER O WITH HORN
+#0x01a2 ""                         "" "" # LATIN CAPITAL LETTER OI
+#0x01a3 ""                         "" "" # LATIN SMALL LETTER OI
+#0x01a4 ""                         "" "" # LATIN CAPITAL LETTER P WITH HOOK
+#0x01a5 ""                         "" "" # LATIN SMALL LETTER P WITH HOOK
+#0x01a6 ""                         "" "" # LATIN LETTER YR
+#0x01a7 ""                         "" "" # LATIN CAPITAL LETTER TONE TWO
+#0x01a8 ""                         "" "" # LATIN SMALL LETTER TONE TWO
+#0x01a9 ""                         "" "" # LATIN CAPITAL LETTER ESH
+#0x01aa ""                         "" "" # LATIN LETTER REVERSED ESH LOOP
+#0x01ab ""                         "" "" # LATIN SMALL LETTER T WITH PALATAL HOOK
+#0x01ac ""                         "" "" # LATIN CAPITAL LETTER T WITH HOOK
+#0x01ad ""                         "" "" # LATIN SMALL LETTER T WITH HOOK
+#0x01ae ""                         "" "" # LATIN CAPITAL LETTER T WITH RETROFLEX HOOK
+#0x01af ""                         "" "" # LATIN CAPITAL LETTER U WITH HORN
+#0x01b0 ""                         "" "" # LATIN SMALL LETTER U WITH HORN
+#0x01b1 ""                         "" "" # LATIN CAPITAL LETTER UPSILON
+#0x01b2 ""                         "" "" # LATIN CAPITAL LETTER V WITH HOOK
+#0x01b3 ""                         "" "" # LATIN CAPITAL LETTER Y WITH HOOK
+#0x01b4 ""                         "" "" # LATIN SMALL LETTER Y WITH HOOK
+#0x01b5 ""                         "" "" # LATIN CAPITAL LETTER Z WITH STROKE
+#0x01b6 ""                         "" "" # LATIN SMALL LETTER Z WITH STROKE
+#0x01b7 ""                         "" "" # LATIN CAPITAL LETTER EZH
+#0x01b8 ""                         "" "" # LATIN CAPITAL LETTER EZH REVERSED
+#0x01b9 ""                         "" "" # LATIN SMALL LETTER EZH REVERSED
+#0x01ba ""                         "" "" # LATIN SMALL LETTER EZH WITH TAIL
+#0x01bb ""                         "" "" # LATIN LETTER TWO WITH STROKE
+#0x01bc ""                         "" "" # LATIN CAPITAL LETTER TONE FIVE
+#0x01bd ""                         "" "" # LATIN SMALL LETTER TONE FIVE
+#0x01be ""                         "" "" # LATIN LETTER INVERTED GLOTTAL STOP WITH STROKE
+#0x01bf ""                         "" "" # LATIN LETTER WYNN
+#0x01c0 ""                         "" "" # LATIN LETTER DENTAL CLICK
+#0x01c1 ""                         "" "" # LATIN LETTER LATERAL CLICK
+#0x01c2 ""                         "" "" # LATIN LETTER ALVEOLAR CLICK
+#0x01c3 ""                         "" "" # LATIN LETTER RETROFLEX CLICK
+#0x01c4 ""                         "" "" # LATIN CAPITAL LETTER DZ WITH CARON
+#0x01c5 ""                         "" "" # LATIN CAPITAL LETTER D WITH SMALL LETTER Z WITH CARON
+#0x01c6 ""                         "" "" # LATIN SMALL LETTER DZ WITH CARON
+#0x01c7 ""                         "" "" # LATIN CAPITAL LETTER LJ
+#0x01c8 ""                         "" "" # LATIN CAPITAL LETTER L WITH SMALL LETTER J
+#0x01c9 ""                         "" "" # LATIN SMALL LETTER LJ
+#0x01ca ""                         "" "" # LATIN CAPITAL LETTER NJ
+#0x01cb ""                         "" "" # LATIN CAPITAL LETTER N WITH SMALL LETTER J
+#0x01cc ""                         "" "" # LATIN SMALL LETTER NJ
+0x01cd "\\v{A}"                   "" "" # LATIN CAPITAL LETTER A WITH CARON
+0x01ce "\\v{a}"                   "" "" # LATIN SMALL LETTER A WITH CARON
+0x01cf "\\v{I}"                   "" "" # LATIN CAPITAL LETTER I WITH CARON
+0x01d0 "\\v{\\i}"                 "" "" # LATIN SMALL LETTER I WITH CARON
+0x01d1 "\\v{O}"                   "" "" # LATIN CAPITAL LETTER O WITH CARON
+0x01d2 "\\v{o}"                   "" "" # LATIN SMALL LETTER O WITH CARON
+0x01d3 "\\v{U}"                   "" "" # LATIN CAPITAL LETTER U WITH CARON
+0x01d4 "\\v{u}"                   "" "" # LATIN SMALL LETTER U WITH CARON
+#0x01d5 ""                         "" "" # LATIN CAPITAL LETTER U WITH DIAERESIS AND MACRON
+#0x01d6 ""                         "" "" # LATIN SMALL LETTER U WITH DIAERESIS AND MACRON
+#0x01d7 ""                         "" "" # LATIN CAPITAL LETTER U WITH DIAERESIS AND ACUTE
+#0x01d8 ""                         "" "" # LATIN SMALL LETTER U WITH DIAERESIS AND ACUTE
+#0x01d9 ""                         "" "" # LATIN CAPITAL LETTER U WITH DIAERESIS AND CARON
+#0x01da ""                         "" "" # LATIN SMALL LETTER U WITH DIAERESIS AND CARON
+#0x01db ""                         "" "" # LATIN CAPITAL LETTER U WITH DIAERESIS AND GRAVE
+#0x01dc ""                         "" "" # LATIN SMALL LETTER U WITH DIAERESIS AND GRAVE
+#0x01dd ""                         "" "" # LATIN SMALL LETTER TURNED E
+#0x01de ""                         "" "" # LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON
+#0x01df ""                         "" "" # LATIN SMALL LETTER A WITH DIAERESIS AND MACRON
+#0x01e0 ""                         "" "" # LATIN CAPITAL LETTER A WITH DOT ABOVE AND MACRON
+#0x01e1 ""                         "" "" # LATIN SMALL LETTER A WITH DOT ABOVE AND MACRON
+0x01e2 "\\={\\AE}"                "" "" # LATIN CAPITAL LETTER AE WITH MACRON
+0x01e3 "\\={\\ae}"                "" "" # LATIN SMALL LETTER AE WITH MACRON
+#0x01e4 ""                         "" "" # LATIN CAPITAL LETTER G WITH STROKE
+#0x01e5 ""                         "" "" # LATIN SMALL LETTER G WITH STROKE
+0x01e6 "\\v{G}"                   "" "" # LATIN CAPITAL LETTER G WITH CARON
+0x01e7 "\\v{g}"                   "" "" # LATIN SMALL LETTER G WITH CARON
+0x01e8 "\\v{K}"                   "" "" # LATIN CAPITAL LETTER K WITH CARON
+0x01e9 "\\v{k}"                   "" "" # LATIN SMALL LETTER K WITH CARON
+0x01ea "\\k{O}"                   "" "" # LATIN CAPITAL LETTER O WITH OGONEK
+0x01eb "\\k{o}"                   "" "" # LATIN SMALL LETTER O WITH OGONEK
+#0x01ec ""                         "" "" # LATIN CAPITAL LETTER O WITH OGONEK AND MACRON
+#0x01ed ""                         "" "" # LATIN SMALL LETTER O WITH OGONEK AND MACRON
+#0x01ee ""                         "" "" # LATIN CAPITAL LETTER EZH WITH CARON
+#0x01ef ""                         "" "" # LATIN SMALL LETTER EZH WITH CARON
+0x01f0 "\\v{\\j}"                 "" "" # LATIN SMALL LETTER J WITH CARON
+0x01ce "\\v{a}"                   "" "" # LATIN SMALL LETTER A WITH CARON
+#0x01f1 ""                         "" "" # LATIN CAPITAL LETTER DZ
+#0x01f2 ""                         "" "" # LATIN CAPITAL LETTER D WITH SMALL LETTER Z
+#0x01f3 ""                         "" "" # LATIN SMALL LETTER DZ
+0x01f4 "\\'{G}"                   "" "" # LATIN CAPITAL LETTER G WITH ACUTE
+0x01f5 "\\'{g}"                   "" "" # LATIN SMALL LETTER G WITH ACUTE
+#0x01f6 ""                         "" "" # LATIN CAPITAL LETTER HWAIR
+#0x01f7 ""                         "" "" # LATIN CAPITAL LETTER WYNN
+0x01f8 "\\`{N}"                   "" "" # LATIN CAPITAL LETTER N WITH GRAVE
+0x01f9 "\\`{n}"                   "" "" # LATIN SMALL LETTER N WITH GRAVE
+#0x01fa ""                         "" "" # LATIN CAPITAL LETTER A WITH RING ABOVE AND ACUTE
+#0x01fb ""                         "" "" # LATIN SMALL LETTER A WITH RING ABOVE AND ACUTE
+0x01fc "\\'{\\AE}"                "" "" # LATIN CAPITAL LETTER AE WITH ACUTE
+0x01fd "\\'{\\ae}"                "" "" # LATIN SMALL LETTER AE WITH ACUTE
+#0x01fe ""                         "" "" # LATIN CAPITAL LETTER O WITH STROKE AND ACUTE
+#0x01ff ""                         "" "" # LATIN SMALL LETTER O WITH STROKE AND ACUTE
+0x0200 "\\textdoublegrave{A}"     "tipa" "" # LATIN CAPITAL LETTER A WITH DOUBLE GRAVE
+0x0201 "\\textdoublegrave{a}"     "tipa" "" # LATIN SMALL LETTER A WITH DOUBLE GRAVE
+#0x0202 ""                         "" "" # LATIN CAPITAL LETTER A WITH INVERTED BREVE
+#0x0203 ""                         "" "" # LATIN SMALL LETTER A WITH INVERTED BREVE
+0x0204 "\\textdoublegrave{E}"     "tipa" "" # LATIN CAPITAL LETTER E WITH DOUBLE GRAVE
+0x0205 "\\textdoublegrave{e}"     "tipa" "" # LATIN SMALL LETTER E WITH DOUBLE GRAVE
+#0x0206 ""                         "" "" # LATIN CAPITAL LETTER E WITH INVERTED BREVE
+#0x0207 ""                         "" "" # LATIN SMALL LETTER E WITH INVERTED BREVE
+0x0208 "\\textdoublegrave{I}"     "tipa" "" # LATIN CAPITAL LETTER I WITH DOUBLE GRAVE
+0x0209 "\\textdoublegrave{\\i}"   "tipa" "" # LATIN SMALL LETTER I WITH DOUBLE GRAVE
+#0x020a ""                         "" "" # LATIN CAPITAL LETTER I WITH INVERTED BREVE
+#0x020b ""                         "" "" # LATIN SMALL LETTER I WITH INVERTED BREVE
+0x020c "\\textdoublegrave{O}"     "tipa" "" # LATIN CAPITAL LETTER O WITH DOUBLE GRAVE
+0x020d "\\textdoublegrave{o}"     "tipa" "" # LATIN SMALL LETTER O WITH DOUBLE GRAVE
+#0x020e ""                         "" "" # LATIN CAPITAL LETTER O WITH INVERTED BREVE
+#0x020f ""                         "" "" # LATIN SMALL LETTER O WITH INVERTED BREVE
+0x0210 "\\textdoublegrave{R}"     "tipa" "" # LATIN CAPITAL LETTER R WITH DOUBLE GRAVE
+0x0211 "\\textdoublegrave{r}"     "tipa" "" # LATIN SMALL LETTER R WITH DOUBLE GRAVE
+#0x0212 ""                         "" "" # LATIN CAPITAL LETTER R WITH INVERTED BREVE
+#0x0213 ""                         "" "" # LATIN SMALL LETTER R WITH INVERTED BREVE
+0x0214 "\\textdoublegrave{U}"     "tipa" "" # LATIN CAPITAL LETTER U WITH DOUBLE GRAVE
+0x0215 "\\textdoublegrave{u}"     "tipa" "" # LATIN SMALL LETTER U WITH DOUBLE GRAVE
+#0x0216 ""                         "" "" # LATIN CAPITAL LETTER U WITH INVERTED BREVE
+#0x0217 ""                         "" "" # LATIN SMALL LETTER U WITH INVERTED BREVE
+#0x0218 ""                         "" "" # LATIN CAPITAL LETTER S WITH COMMA BELOW
+#0x0219 ""                         "" "" # LATIN SMALL LETTER S WITH COMMA BELOW
+#0x021a ""                         "" "" # LATIN CAPITAL LETTER T WITH COMMA BELOW
+#0x021b ""                         "" "" # LATIN SMALL LETTER T WITH COMMA BELOW
+#0x021c ""                         "" "" # LATIN CAPITAL LETTER YOGH
+#0x021d ""                         "" "" # LATIN SMALL LETTER YOGH
+0x021e "\\v{H}"                   "" "" # LATIN CAPITAL LETTER H WITH CARON
+0x021f "\\v{h}"                   "" "" # LATIN SMALL LETTER H WITH CARON
+#0x0220 ""                         "" "" # LATIN CAPITAL LETTER N WITH LONG RIGHT LEG
+#0x0222 ""                         "" "" # LATIN CAPITAL LETTER OU
+#0x0223 ""                         "" "" # LATIN SMALL LETTER OU
+#0x0224 ""                         "" "" # LATIN CAPITAL LETTER Z WITH HOOK
+#0x0225 ""                         "" "" # LATIN SMALL LETTER Z WITH HOOK
+0x0226 "\\.{A}"                   "" "" # LATIN CAPITAL LETTER A WITH DOT ABOVE
+0x0227 "\\.{a}"                   "" "" # LATIN SMALL LETTER A WITH DOT ABOVE
+0x0228 "\\c{E}"                   "" "" # LATIN CAPITAL LETTER E WITH CEDILLA
+0x0229 "\\c{e}"                   "" "" # LATIN SMALL LETTER E WITH CEDILLA
+#0x022a ""                         "" "" # LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON
+#0x022b ""                         "" "" # LATIN SMALL LETTER O WITH DIAERESIS AND MACRON
+#0x022c ""                         "" "" # LATIN CAPITAL LETTER O WITH TILDE AND MACRON
+#0x022d ""                         "" "" # LATIN SMALL LETTER O WITH TILDE AND MACRON
+0x022e "\\.{O}"                   "" "" # LATIN CAPITAL LETTER O WITH DOT ABOVE
+0x022f "\\.{o}"                   "" "" # LATIN SMALL LETTER O WITH DOT ABOVE
+#0x0230 ""                         "" "" # LATIN CAPITAL LETTER O WITH DOT ABOVE AND MACRON
+#0x0231 ""                         "" "" # LATIN SMALL LETTER O WITH DOT ABOVE AND MACRON
+0x0232 "\\={Y}"                   "" "" # LATIN CAPITAL LETTER Y WITH MACRON
+0x0233 "\\={y}"                   "" "" # LATIN SMALL LETTER Y WITH MACRON
+0x0237 "\\j"                      "" "" # LATIN SMALL LETTER DOTLESS J
+0x0250 "\\textturna"              "tipa" "" # LATIN SMALL LETTER TURNED A
+#0x0251 ""                         "" "" # LATIN SMALL LETTER ALPHA
+#0x0252 ""                         "" "" # LATIN SMALL LETTER TURNED ALPHA
+#0x0253 ""                         "" "" # LATIN SMALL LETTER B WITH HOOK
+#0x0254 ""                         "" "" # LATIN SMALL LETTER OPEN O
+#0x0255 ""                         "" "" # LATIN SMALL LETTER C WITH CURL
+#0x0256 ""                         "" "" # LATIN SMALL LETTER D WITH TAIL
+#0x0257 ""                         "" "" # LATIN SMALL LETTER D WITH HOOK
+0x0258 "\\textreve"               "tipa" "" # LATIN SMALL LETTER REVERSED E
+0x0259 "\\textschwa"              "tipa" "" # LATIN SMALL LETTER SCHWA
+0x025a "\\textrhookschwa"         "tipa" "" # LATIN SMALL LETTER SCHWA WITH HOOK
+#0x025b ""                         "" "" # LATIN SMALL LETTER OPEN E
+#0x025c ""                         "" "" # LATIN SMALL LETTER REVERSED OPEN E
+#0x025d ""                         "" "" # LATIN SMALL LETTER REVERSED OPEN E WITH HOOK
+#0x025e ""                         "" "" # LATIN SMALL LETTER CLOSED REVERSED OPEN E
+#0x025f ""                         "" "" # LATIN SMALL LETTER DOTLESS J WITH STROKE
+#0x0260 ""                         "" "" # LATIN SMALL LETTER G WITH HOOK
+#0x0261 ""                         "" "" # LATIN SMALL LETTER SCRIPT G
+#0x0262 ""                         "" "" # LATIN LETTER SMALL CAPITAL G
+#0x0263 ""                         "" "" # LATIN SMALL LETTER GAMMA
+#0x0264 ""                         "" "" # LATIN SMALL LETTER RAMS HORN
+0x0265 "\\textturnh"              "tipa" "" # LATIN SMALL LETTER TURNED H
+#0x0266 ""                         "" "" # LATIN SMALL LETTER H WITH HOOK
+#0x0267 ""                         "" "" # LATIN SMALL LETTER HENG WITH HOOK
+#0x0268 ""                         "" "" # LATIN SMALL LETTER I WITH STROKE
+#0x0269 ""                         "" "" # LATIN SMALL LETTER IOTA
+#0x026a ""                         "" "" # LATIN LETTER SMALL CAPITAL I
+#0x026b ""                         "" "" # LATIN SMALL LETTER L WITH MIDDLE TILDE
+#0x026c ""                         "" "" # LATIN SMALL LETTER L WITH BELT
+#0x026d ""                         "" "" # LATIN SMALL LETTER L WITH RETROFLEX HOOK
+#0x026e ""                         "" "" # LATIN SMALL LETTER LEZH
+0x026f "\\textturnm"              "tipa" "" # LATIN SMALL LETTER TURNED M
+0x0270 "\\textturnmrleg"          "tipa" "" # LATIN SMALL LETTER TURNED M WITH LONG LEG
+#0x0271 ""                         "" "" # LATIN SMALL LETTER M WITH HOOK
+#0x0272 ""                         "" "" # LATIN SMALL LETTER N WITH LEFT HOOK
+#0x0273 ""                         "" "" # LATIN SMALL LETTER N WITH RETROFLEX HOOK
+#0x0274 ""                         "" "" # LATIN LETTER SMALL CAPITAL N
+#0x0275 ""                         "" "" # LATIN SMALL LETTER BARRED O
+#0x0276 ""                         "" "" # LATIN LETTER SMALL CAPITAL OE
+#0x0277 ""                         "" "" # LATIN SMALL LETTER CLOSED OMEGA
+#0x0278 ""                         "" "" # LATIN SMALL LETTER PHI
+0x0279 "\\textturnr"              "tipa" "" # LATIN SMALL LETTER TURNED R
+0x027a "\\textturnlonglegr"       "tipa" "" # LATIN SMALL LETTER TURNED R WITH LONG LEG
+0x027b "\\textturnrrtail"         "tipa" "" # LATIN SMALL LETTER TURNED R WITH HOOK
+#0x027c ""                         "" "" # LATIN SMALL LETTER R WITH LONG LEG
+#0x027d ""                         "" "" # LATIN SMALL LETTER R WITH TAIL
+#0x027e ""                         "" "" # LATIN SMALL LETTER R WITH FISHHOOK
+#0x027f ""                         "" "" # LATIN SMALL LETTER REVERSED R WITH FISHHOOK
+#0x0280 ""                         "" "" # LATIN LETTER SMALL CAPITAL R
+#0x0281 ""                         "" "" # LATIN LETTER SMALL CAPITAL INVERTED R
+#0x0282 ""                         "" "" # LATIN SMALL LETTER S WITH HOOK
+#0x0283 ""                         "" "" # LATIN SMALL LETTER ESH
+#0x0284 ""                         "" "" # LATIN SMALL LETTER DOTLESS J WITH STROKE AND HOOK
+#0x0285 ""                         "" "" # LATIN SMALL LETTER SQUAT REVERSED ESH
+#0x0286 ""                         "" "" # LATIN SMALL LETTER ESH WITH CURL
+0x0287 "\\textturnt"              "tipa" "" # LATIN SMALL LETTER TURNED T
+#0x0288 ""                         "" "" # LATIN SMALL LETTER T WITH RETROFLEX HOOK
+#0x0289 ""                         "" "" # LATIN SMALL LETTER U BAR
+#0x028a ""                         "" "" # LATIN SMALL LETTER UPSILON
+#0x028b ""                         "" "" # LATIN SMALL LETTER V WITH HOOK
+0x028c "\\textturnv"              "tipa" "" # LATIN SMALL LETTER TURNED V
+0x028d "\\textturnw"              "tipa" "" # LATIN SMALL LETTER TURNED W
+0x028e "\\textturny"              "tipa" "" # LATIN SMALL LETTER TURNED Y
+#0x028f ""                         "" "" # LATIN LETTER SMALL CAPITAL Y
+#0x0290 ""                         "" "" # LATIN SMALL LETTER Z WITH RETROFLEX HOOK
+#0x0291 ""                         "" "" # LATIN SMALL LETTER Z WITH CURL
+#0x0292 ""                         "" "" # LATIN SMALL LETTER EZH
+#0x0293 ""                         "" "" # LATIN SMALL LETTER EZH WITH CURL
+0x0294 "\\textglotstop"           "tipa" "" # LATIN LETTER GLOTTAL STOP
+#0x0295 ""                         "" "" # LATIN LETTER PHARYNGEAL VOICED FRICATIVE
+0x0296 "\\textinvglotstop"        "tipa" "" # LATIN LETTER INVERTED GLOTTAL STOP
+#0x0297 ""                         "" "" # LATIN LETTER STRETCHED C
+#0x0298 ""                         "" "" # LATIN LETTER BILABIAL CLICK
+#0x0299 ""                         "" "" # LATIN LETTER SMALL CAPITAL B
+#0x029a ""                         "" "" # LATIN SMALL LETTER CLOSED OPEN E
+#0x029b ""                         "" "" # LATIN LETTER SMALL CAPITAL G WITH HOOK
+#0x029c ""                         "" "" # LATIN LETTER SMALL CAPITAL H
+#0x029d ""                         "" "" # LATIN SMALL LETTER J WITH CROSSED-TAIL
+0x029e "\\textturnk"              "tipa" "" # LATIN SMALL LETTER TURNED K
+#0x029f ""                         "" "" # LATIN LETTER SMALL CAPITAL L
+#0x02a0 ""                         "" "" # LATIN SMALL LETTER Q WITH HOOK
+#0x02a1 ""                         "" "" # LATIN LETTER GLOTTAL STOP WITH STROKE
+#0x02a2 ""                         "" "" # LATIN LETTER REVERSED GLOTTAL STOP WITH STROKE
+#0x02a3 ""                         "" "" # LATIN SMALL LETTER DZ DIGRAPH
+#0x02a4 ""                         "" "" # LATIN SMALL LETTER DEZH DIGRAPH
+#0x02a5 ""                         "" "" # LATIN SMALL LETTER DZ DIGRAPH WITH CURL
+#0x02a6 ""                         "" "" # LATIN SMALL LETTER TS DIGRAPH
+#0x02a7 ""                         "" "" # LATIN SMALL LETTER TESH DIGRAPH
+#0x02a8 ""                         "" "" # LATIN SMALL LETTER TC DIGRAPH WITH CURL
+#0x02a9 ""                         "" "" # LATIN SMALL LETTER FENG DIGRAPH
+#0x02aa ""                         "" "" # LATIN SMALL LETTER LS DIGRAPH
+#0x02ab ""                         "" "" # LATIN SMALL LETTER LZ DIGRAPH
+#0x02ac ""                         "" "" # LATIN LETTER BILABIAL PERCUSSIVE
+#0x02ad ""                         "" "" # LATIN LETTER BIDENTAL PERCUSSIVE
+#0x02b0 ""                         "" "" # MODIFIER LETTER SMALL H
+#0x02b1 ""                         "" "" # MODIFIER LETTER SMALL H WITH HOOK
+#0x02b2 ""                         "" "" # MODIFIER LETTER SMALL J
+#0x02b3 ""                         "" "" # MODIFIER LETTER SMALL R
+#0x02b4 ""                         "" "" # MODIFIER LETTER SMALL TURNED R
+#0x02b5 ""                         "" "" # MODIFIER LETTER SMALL TURNED R WITH HOOK
+#0x02b6 ""                         "" "" # MODIFIER LETTER SMALL CAPITAL INVERTED R
+#0x02b7 ""                         "" "" # MODIFIER LETTER SMALL W
+#0x02b8 ""                         "" "" # MODIFIER LETTER SMALL Y
+#0x02b9 ""                         "" "" # MODIFIER LETTER PRIME
+#0x02ba ""                         "" "" # MODIFIER LETTER DOUBLE PRIME
+#0x02bb ""                         "" "" # MODIFIER LETTER TURNED COMMA
+#0x02bc ""                         "" "" # MODIFIER LETTER APOSTROPHE
+#0x02bd ""                         "" "" # MODIFIER LETTER REVERSED COMMA
+#0x02be ""                         "" "" # MODIFIER LETTER RIGHT HALF RING
+#0x02bf ""                         "" "" # MODIFIER LETTER LEFT HALF RING
+#0x02c0 ""                         "" "" # MODIFIER LETTER GLOTTAL STOP
+#0x02c1 ""                         "" "" # MODIFIER LETTER REVERSED GLOTTAL STOP
+#0x02c2 ""                         "" "" # MODIFIER LETTER LEFT ARROWHEAD
+#0x02c3 ""                         "" "" # MODIFIER LETTER RIGHT ARROWHEAD
+#0x02c4 ""                         "" "" # MODIFIER LETTER UP ARROWHEAD
+#0x02c5 ""                         "" "" # MODIFIER LETTER DOWN ARROWHEAD
+#0x02c6 ""                         "" "" # MODIFIER LETTER CIRCUMFLEX ACCENT
+0x02c7 "\\v{ }"                   "" "" # CARON
+#0x02c8 ""                         "" "" # MODIFIER LETTER VERTICAL LINE
+#0x02c9 ""                         "" "" # MODIFIER LETTER MACRON
+#0x02ca ""                         "" "" # MODIFIER LETTER ACUTE ACCENT
+#0x02cb ""                         "" "" # MODIFIER LETTER GRAVE ACCENT
+#0x02cc ""                         "" "" # MODIFIER LETTER LOW VERTICAL LINE
+#0x02cd ""                         "" "" # MODIFIER LETTER LOW MACRON
+#0x02ce ""                         "" "" # MODIFIER LETTER LOW GRAVE ACCENT
+#0x02cf ""                         "" "" # MODIFIER LETTER LOW ACUTE ACCENT
+#0x02d0 ""                         "" "" # MODIFIER LETTER TRIANGULAR COLON
+#0x02d1 ""                         "" "" # MODIFIER LETTER HALF TRIANGULAR COLON
+#0x02d2 ""                         "" "" # MODIFIER LETTER CENTRED RIGHT HALF RING
+#0x02d3 ""                         "" "" # MODIFIER LETTER CENTRED LEFT HALF RING
+#0x02d4 ""                         "" "" # MODIFIER LETTER UP TACK
+#0x02d5 ""                         "" "" # MODIFIER LETTER DOWN TACK
+#0x02d6 ""                         "" "" # MODIFIER LETTER PLUS SIGN
+#0x02d7 ""                         "" "" # MODIFIER LETTER MINUS SIGN
+0x02d8 "\\u{ }"                   "" "" # BREVE
+0x02d9 "\\.{ }"                   "" "" # DOT ABOVE
+0x02da "\\r{ }"                   "" "" # RING ABOVE
+0x02db "\\k{ }"                   "" "" # OGONEK
+0x02dc "\\~{ }"                   "" "" # SMALL TILDE
+0x02dd "\\H{ }"                   "" "" # DOUBLE ACUTE ACCENT
+#0x02de ""                         "" "" # MODIFIER LETTER RHOTIC HOOK
+#0x02df ""                         "" "" # MODIFIER LETTER CROSS ACCENT
+#0x02e0 ""                         "" "" # MODIFIER LETTER SMALL GAMMA
+#0x02e1 ""                         "" "" # MODIFIER LETTER SMALL L
+#0x02e2 ""                         "" "" # MODIFIER LETTER SMALL S
+#0x02e3 ""                         "" "" # MODIFIER LETTER SMALL X
+#0x02e4 ""                         "" "" # MODIFIER LETTER SMALL REVERSED GLOTTAL STOP
+#0x02e5 ""                         "" "" # MODIFIER LETTER EXTRA-HIGH TONE BAR
+#0x02e6 ""                         "" "" # MODIFIER LETTER HIGH TONE BAR
+#0x02e7 ""                         "" "" # MODIFIER LETTER MID TONE BAR
+#0x02e8 ""                         "" "" # MODIFIER LETTER LOW TONE BAR
+#0x02e9 ""                         "" "" # MODIFIER LETTER EXTRA-LOW TONE BAR
+#0x02ea ""                         "" "" # MODIFIER LETTER YIN DEPARTING TONE MARK
+#0x02eb ""                         "" "" # MODIFIER LETTER YANG DEPARTING TONE MARK
+#0x02ec ""                         "" "" # MODIFIER LETTER VOICING
+#0x02ed ""                         "" "" # MODIFIER LETTER UNASPIRATED
+#0x02ee ""                         "" "" # MODIFIER LETTER DOUBLE APOSTROPHE
+0x0300 "\\`"                      "" "combining" # COMBINING GRAVE ACCENT
+0x0301 "\\'"                      "" "combining" # COMBINING ACUTE ACCENT
+0x0302 "\\^"                      "" "combining" # COMBINING CIRCUMFLEX ACCENT
+0x0303 "\\~"                      "" "combining" # COMBINING TILDE
+0x0304 "\\="                      "" "combining" # COMBINING MACRON
+#0x0305 ""                         "" "combining" # COMBINING OVERLINE
+0x0306 "\\u"                      "" "combining" # COMBINING BREVE
+0x0307 "\\."                      "" "combining" # COMBINING DOT ABOVE
+0x0308 "\\\""                     "" "combining" # COMBINING DIAERESIS
+#0x0309 ""                         "" "combining" # COMBINING HOOK ABOVE
+0x030a "\\r"                      "" "combining" # COMBINING RING ABOVE
+0x030b "\\H"                      "" "combining" # COMBINING DOUBLE ACUTE ACCENT
+0x030c "\\v"                      "" "combining" # COMBINING CARON
+0x030d "\\textvbaraccent"         "tipa" "combining" # COMBINING VERTICAL LINE ABOVE
+0x030e "\\textdoublevbaraccent"   "tipa" "combining" # COMBINING DOUBLE VERTICAL LINE ABOVE
+0x030f "\\textdoublegrave"        "tipa" "combining" # COMBINING DOUBLE GRAVE ACCENT
+0x0310 "\\textdotbreve"           "tipa" "combining" # COMBINING CANDRABINDU
+0x0311 "\\textroundcap"           "tipa" "combining" # COMBINING INVERTED BREVE
+#0x0312 ""                         "" "combining" # COMBINING TURNED COMMA ABOVE
+#0x0313 ""                         "" "combining" # COMBINING COMMA ABOVE
+#0x0314 ""                         "" "combining" # COMBINING REVERSED COMMA ABOVE
+#0x0315 ""                         "" "combining" # COMBINING COMMA ABOVE RIGHT
+0x0316 "\\textsubgrave"           "tipa" "combining" # COMBINING GRAVE ACCENT BELOW
+0x0317 "\\textsubacute"           "tipa" "combining" # COMBINING ACUTE ACCENT BELOW
+0x0318 "\\textadvancing"          "tipa" "combining" # COMBINING LEFT TACK BELOW
+0x0319 "\\textretracting"         "tipa" "combining" # COMBINING RIGHT TACK BELOW
+#0x031a ""                         "" "combining" # COMBINING LEFT ANGLE ABOVE
+#0x031b ""                         "" "combining" # COMBINING HORN
+0x031c "\\textsublhalfring"       "tipa" "combining" # COMBINING LEFT HALF RING BELOW
+0x031d "\\textraising"            "tipa" "combining" # COMBINING UP TACK BELOW
+0x031e "\\textlowering"           "tipa" "combining" # COMBINING DOWN TACK BELOW
+0x031f "\\textsubplus"            "tipa" "combining" # COMBINING PLUS SIGN BELOW
+0x0320 "\\b"                      "" "combining" # COMBINING MINUS SIGN BELOW
+#0x0321 ""                         "" "combining" # COMBINING PALATALIZED HOOK BELOW
+#0x0322 ""                         "" "combining" # COMBINING RETROFLEX HOOK BELOW
+0x0323 "\\d"                      "" "combining" # COMBINING DOT BELOW
+0x0324 "\\textsubumlaut"          "tipa" "combining" # COMBINING DIAERESIS BELOW
+0x0325 "\\textsubring"            "tipa" "combining" # COMBINING RING BELOW
+#0x0326 ""                         "" "combining" # COMBINING COMMA BELOW
+0x0327 "\\c"                      "" "combining" # COMBINING CEDILLA
+0x0328 "\\k"                      "" "combining" # COMBINING OGONEK
+0x0329 "\\textsyllabic"           "tipa" "combining" # COMBINING VERTICAL LINE BELOW
+0x032a "\\textsubbridge"          "tipa" "combining" # COMBINING BRIDGE BELOW
+0x032b "\\textsubw"               "tipa" "combining" # COMBINING INVERTED DOUBLE ARCH BELOW
+0x032c "\\textsubwedge"           "tipa" "combining" # COMBINING CARON BELOW
+0x032d "\\textsubcircum"          "tipa" "combining" # COMBINING CIRCUMFLEX ACCENT BELOW
+#0x032e ""                         "" "combining" # COMBINING BREVE BELOW
+0x032f "\\textsubarch"            "tipa" "combining" # COMBINING INVERTED BREVE BELOW
+0x0330 "\\textsubtilde"           "tipa" "combining" # COMBINING TILDE BELOW
+#0x0331 ""                         "" "combining" # COMBINING MACRON BELOW
+#0x0332 ""                         "" "combining" # COMBINING LOW LINE
+#0x0333 ""                         "" "combining" # COMBINING DOUBLE LOW LINE
+0x0334 "\\textsuperimposetilde"   "tipa" "combining" # COMBINING TILDE OVERLAY
+#0x0335 ""                         "" "combining" # COMBINING SHORT STROKE OVERLAY
+#0x0336 ""                         "" "combining" # COMBINING LONG STROKE OVERLAY
+#0x0337 ""                         "" "combining" # COMBINING SHORT SOLIDUS OVERLAY
+#0x0338 ""                         "" "combining" # COMBINING LONG SOLIDUS OVERLAY
+0x0339 "\\textsubrhalfring"       "tipa" "combining" # COMBINING RIGHT HALF RING BELOW
+0x033a "\\textinvsubbridge"       "tipa" "combining" # COMBINING INVERTED BRIDGE BELOW
+0x033b "\\textsubsquare"          "tipa" "combining" # COMBINING SQUARE BELOW
+0x033c "\\textseagull"            "tipa" "combining" # COMBINING SEAGULL BELOW
+0x033d "\\textovercross"          "tipa" "combining" # COMBINING X ABOVE
+#0x033e ""                         "" "combining" # COMBINING VERTICAL TILDE
+#0x033f ""                         "" "combining" # COMBINING DOUBLE OVERLINE
+#0x0340 ""                         "" "combining" # COMBINING GRAVE TONE MARK
+#0x0341 ""                         "" "combining" # COMBINING ACUTE TONE MARK
+#0x0342 ""                         "" "combining" # COMBINING GREEK PERISPOMENI
+#0x0343 ""                         "" "combining" # COMBINING GREEK KORONIS
+#0x0344 ""                         "" "combining" # COMBINING GREEK DIALYTIKA TONOS
+#0x0345 ""                         "" "combining" # COMBINING GREEK YPOGEGRAMMENI
+0x0346 "\\overbridge"             "tipa" "combining" # COMBINING BRIDGE ABOVE
+0x0347 "\\subdoublebar"           "tipa" "combining" # COMBINING EQUALS SIGN BELOW
+0x0348 "\\subdoublevert"          "tipa" "combining" # COMBINING DOUBLE VERTICAL LINE BELOW
+0x0349 "\\subcorner"              "tipa" "combining" # COMBINING LEFT ANGLE BELOW
+0x034a "\\crtilde"                "tipa" "combining" # COMBINING NOT TILDE ABOVE
+0x034b "\\dottedtilde"            "tipa" "combining" # COMBINING HOMOTHETIC ABOVE
+0x034c "\\doubletilde"            "tipa" "combining" # COMBINING ALMOST EQUAL TO ABOVE
+0x034d "\\spreadlips"             "tipa" "combining" # COMBINING LEFT RIGHT ARROW BELOW
+0x034e "\\whistle"                "tipa" "combining" # COMBINING UPWARDS ARROW BELOW
+#0x034f ""                         "" "" # COMBINING GRAPHEME JOINER
+#0x0360 ""                         "" "combining" # COMBINING DOUBLE TILDE
+0x0361 "\\t"                      "" "combining" # COMBINING DOUBLE INVERTED BREVE (ligature tie)
+#0x0362 ""                         "" "combining" # COMBINING DOUBLE RIGHTWARDS ARROW BELOW
+#0x0363 ""                         "" "combining" # COMBINING LATIN SMALL LETTER A
+#0x0364 ""                         "" "combining" # COMBINING LATIN SMALL LETTER E
+#0x0365 ""                         "" "combining" # COMBINING LATIN SMALL LETTER I
+#0x0366 ""                         "" "combining" # COMBINING LATIN SMALL LETTER O
+#0x0367 ""                         "" "combining" # COMBINING LATIN SMALL LETTER U
+#0x0368 ""                         "" "combining" # COMBINING LATIN SMALL LETTER C
+#0x0369 ""                         "" "combining" # COMBINING LATIN SMALL LETTER D
+#0x036a ""                         "" "combining" # COMBINING LATIN SMALL LETTER H
+#0x036b ""                         "" "combining" # COMBINING LATIN SMALL LETTER M
+#0x036c ""                         "" "combining" # COMBINING LATIN SMALL LETTER R
+#0x036d ""                         "" "combining" # COMBINING LATIN SMALL LETTER T
+#0x036e ""                         "" "combining" # COMBINING LATIN SMALL LETTER V
+#0x036f ""                         "" "combining" # COMBINING LATIN SMALL LETTER X
+0x0e3f "\\textbaht"               "textcomp" "" # THAI CURRENCY SYMBOL BAHT
+0x1e00 "\\textsubring{A}"         "tipa" "" # LATIN CAPITAL LETTER A WITH RING BELOW
+0x1e01 "\\textsubring{a}"         "tipa" "" # LATIN SMALL LETTER A WITH RING BELOW
+0x1e02 "\\.{B}"                   "" "" # LATIN CAPITAL LETTER B WITH DOT ABOVE
+0x1e03 "\\.{b}"                   "" "" # LATIN SMALL LETTER B WITH DOT ABOVE
+0x1e04 "\\d{B}"                   "" "" # LATIN CAPITAL LETTER B WITH DOT BELOW
+0x1e05 "\\d{b}"                   "" "" # LATIN SMALL LETTER B WITH DOT BELOW
+#0x1e06 ""                         "" "" # LATIN CAPITAL LETTER B WITH LINE BELOW
+#0x1e07 ""                         "" "" # LATIN SMALL LETTER B WITH LINE BELOW
+#0x1e08 ""                         "" "" # LATIN CAPITAL LETTER C WITH CEDILLA AND ACUTE
+#0x1e09 ""                         "" "" # LATIN SMALL LETTER C WITH CEDILLA AND ACUTE
+0x1e0a "\\.{D}"                   "" "" # LATIN CAPITAL LETTER D WITH DOT ABOVE
+0x1e0b "\\.{d}"                   "" "" # LATIN SMALL LETTER D WITH DOT ABOVE
+0x1e0c "\\d{D}"                   "" "" # LATIN CAPITAL LETTER D WITH DOT BELOW
+0x1e0d "\\d{d}"                   "" "" # LATIN SMALL LETTER D WITH DOT BELOW
+#0x1e0e ""                         "" "" # LATIN CAPITAL LETTER D WITH LINE BELOW
+#0x1e0f ""                         "" "" # LATIN SMALL LETTER D WITH LINE BELOW
+0x1e10 "\\c{D}"                   "" "" # LATIN CAPITAL LETTER D WITH CEDILLA
+0x1e11 "\\c{d}"                   "" "" # LATIN SMALL LETTER D WITH CEDILLA
+0x1e12 "\\textsubcircum{D}"       "tipa" "" # LATIN CAPITAL LETTER D WITH CIRCUMFLEX BELOW
+0x1e13 "\\textsubcircum{d}"       "tipa" "" # LATIN SMALL LETTER D WITH CIRCUMFLEX BELOW
+#0x1e14 ""                         "" "" # LATIN CAPITAL LETTER E WITH MACRON AND GRAVE
+#0x1e15 ""                         "" "" # LATIN SMALL LETTER E WITH MACRON AND GRAVE
+#0x1e16 ""                         "" "" # LATIN CAPITAL LETTER E WITH MACRON AND ACUTE
+#0x1e17 ""                         "" "" # LATIN SMALL LETTER E WITH MACRON AND ACUTE
+0x1e18 "\\textsubcircum{E}"       "tipa" "" # LATIN CAPITAL LETTER E WITH CIRCUMFLEX BELOW
+0x1e19 "\\textsubcircum{e}"       "tipa" "" # LATIN SMALL LETTER E WITH CIRCUMFLEX BELOW
+0x1e1a "\\textsubtilde{E}"        "tipa" "" # LATIN CAPITAL LETTER E WITH TILDE BELOW
+0x1e1b "\\textsubtilde{e}"        "tipa" "" # LATIN SMALL LETTER E WITH TILDE BELOW
+#0x1e1c ""                         "" "" # LATIN CAPITAL LETTER E WITH CEDILLA AND BREVE
+#0x1e1d ""                         "" "" # LATIN SMALL LETTER E WITH CEDILLA AND BREVE
+0x1e1e "\\.{F}"                   "" "" # LATIN CAPITAL LETTER F WITH DOT ABOVE
+0x1e1f "\\.{f}"                   "" "" # LATIN SMALL LETTER F WITH DOT ABOVE
+#0x1e20 ""                         "" "" # LATIN CAPITAL LETTER G WITH MACRON
+#0x1e21 ""                         "" "" # LATIN SMALL LETTER G WITH MACRON
+0x1e22 "\\.{H}"                   "" "" # LATIN CAPITAL LETTER H WITH DOT ABOVE
+0x1e23 "\\.{h}"                   "" "" # LATIN SMALL LETTER H WITH DOT ABOVE
+0x1e24 "\\d{H}"                   "" "" # LATIN CAPITAL LETTER H WITH DOT BELOW
+0x1e25 "\\d{h}"                   "" "" # LATIN SMALL LETTER H WITH DOT BELOW
+0x1e26 "\\\"{H}"                  "" "" # LATIN CAPITAL LETTER H WITH DIAERESIS
+0x1e27 "\\\"{h}"                  "" "" # LATIN SMALL LETTER H WITH DIAERESIS
+0x1e28 "\\c{H}"                   "" "" # LATIN CAPITAL LETTER H WITH CEDILLA
+0x1e29 "\\c{h}"                   "" "" # LATIN SMALL LETTER H WITH CEDILLA
+#0x1e2a ""                         "" "" # LATIN CAPITAL LETTER H WITH BREVE BELOW
+#0x1e2b ""                         "" "" # LATIN SMALL LETTER H WITH BREVE BELOW
+0x1e2c "\\textsubtilde{I}"        "tipa" "" # LATIN CAPITAL LETTER I WITH TILDE BELOW
+0x1e2d "\\textsubtilde{i}"        "tipa" "" # LATIN SMALL LETTER I WITH TILDE BELOW
+#0x1e2e ""                         "" "" # LATIN CAPITAL LETTER I WITH DIAERESIS AND ACUTE
+#0x1e2f ""                         "" "" # LATIN SMALL LETTER I WITH DIAERESIS AND ACUTE
+0x1e30 "\\'{K}"                   "" "" # LATIN CAPITAL LETTER K WITH ACUTE
+0x1e31 "\\'{k}"                   "" "" # LATIN SMALL LETTER K WITH ACUTE
+0x1e32 "\\d{K}"                   "" "" # LATIN CAPITAL LETTER K WITH DOT BELOW
+0x1e33 "\\d{k}"                   "" "" # LATIN SMALL LETTER K WITH DOT BELOW
+#0x1e34 ""                         "" "" # LATIN CAPITAL LETTER K WITH LINE BELOW
+#0x1e35 ""                         "" "" # LATIN SMALL LETTER K WITH LINE BELOW
+0x1e36 "\\d{L}"                   "" "" # LATIN CAPITAL LETTER L WITH DOT BELOW
+0x1e37 "\\d{l}"                   "" "" # LATIN SMALL LETTER L WITH DOT BELOW
+#0x1e38 ""                         "" "" # LATIN CAPITAL LETTER L WITH DOT BELOW AND MACRON
+#0x1e39 ""                         "" "" # LATIN SMALL LETTER L WITH DOT BELOW AND MACRON
+#0x1e3a ""                         "" "" # LATIN CAPITAL LETTER L WITH LINE BELOW
+#0x1e3b ""                         "" "" # LATIN SMALL LETTER L WITH LINE BELOW
+0x1e3c "\\textsubcircum{L}"       "tipa" "" # LATIN CAPITAL LETTER L WITH CIRCUMFLEX BELOW
+0x1e3d "\\textsubcircum{l}"       "tipa" "" # LATIN SMALL LETTER L WITH CIRCUMFLEX BELOW
+0x1e3e "\\'{M}"                   "" "" # LATIN CAPITAL LETTER M WITH ACUTE
+0x1e3f "\\'{m}"                   "" "" # LATIN SMALL LETTER M WITH ACUTE
+0x1e40 "\\.{M}"                   "" "" # LATIN CAPITAL LETTER M WITH DOT ABOVE
+0x1e41 "\\.{m}"                   "" "" # LATIN SMALL LETTER M WITH DOT ABOVE
+0x1e42 "\\d{M}"                   "" "" # LATIN CAPITAL LETTER M WITH DOT BELOW
+0x1e43 "\\d{m}"                   "" "" # LATIN SMALL LETTER M WITH DOT BELOW
+0x1e44 "\\.{N}"                   "" "" # LATIN CAPITAL LETTER N WITH DOT ABOVE
+0x1e45 "\\.{n}"                   "" "" # LATIN SMALL LETTER N WITH DOT ABOVE
+0x1e46 "\\d{N}"                   "" "" # LATIN CAPITAL LETTER N WITH DOT BELOW
+0x1e47 "\\d{n}"                   "" "" # LATIN SMALL LETTER N WITH DOT BELOW
+#0x1e48 ""                         "" "" # LATIN CAPITAL LETTER N WITH LINE BELOW
+#0x1e49 ""                         "" "" # LATIN SMALL LETTER N WITH LINE BELOW
+0x1e4a "\\textsubcircum{N}"       "tipa" "" # LATIN CAPITAL LETTER N WITH CIRCUMFLEX BELOW
+0x1e4b "\\textsubcircum{n}"       "tipa" "" # LATIN SMALL LETTER N WITH CIRCUMFLEX BELOW
+#0x1e4c ""                         "" "" # LATIN CAPITAL LETTER O WITH TILDE AND ACUTE
+#0x1e4d ""                         "" "" # LATIN SMALL LETTER O WITH TILDE AND ACUTE
+#0x1e4e ""                         "" "" # LATIN CAPITAL LETTER O WITH TILDE AND DIAERESIS
+#0x1e4f ""                         "" "" # LATIN SMALL LETTER O WITH TILDE AND DIAERESIS
+#0x1e50 ""                         "" "" # LATIN CAPITAL LETTER O WITH MACRON AND GRAVE
+#0x1e51 ""                         "" "" # LATIN SMALL LETTER O WITH MACRON AND GRAVE
+#0x1e52 ""                         "" "" # LATIN CAPITAL LETTER O WITH MACRON AND ACUTE
+#0x1e53 ""                         "" "" # LATIN SMALL LETTER O WITH MACRON AND ACUTE
+0x1e54 "\\'{P}"                   "" "" # LATIN CAPITAL LETTER P WITH ACUTE
+0x1e55 "\\'{p}"                   "" "" # LATIN SMALL LETTER P WITH ACUTE
+0x1e56 "\\.{P}"                   "" "" # LATIN CAPITAL LETTER P WITH DOT ABOVE
+0x1e57 "\\.{p}"                   "" "" # LATIN SMALL LETTER P WITH DOT ABOVE
+0x1e58 "\\.{R}"                   "" "" # LATIN CAPITAL LETTER R WITH DOT ABOVE
+0x1e59 "\\.{r}"                   "" "" # LATIN SMALL LETTER R WITH DOT ABOVE
+0x1e5a "\\d{R}"                   "" "" # LATIN CAPITAL LETTER R WITH DOT BELOW
+0x1e5b "\\d{r}"                   "" "" # LATIN SMALL LETTER R WITH DOT BELOW
+#0x1e5c ""                         "" "" # LATIN CAPITAL LETTER R WITH DOT BELOW AND MACRON
+#0x1e5d ""                         "" "" # LATIN SMALL LETTER R WITH DOT BELOW AND MACRON
+#0x1e5e ""                         "" "" # LATIN CAPITAL LETTER R WITH LINE BELOW
+#0x1e5f ""                         "" "" # LATIN SMALL LETTER R WITH LINE BELOW
+0x1e60 "\\.{S}"                   "" "" # LATIN CAPITAL LETTER S WITH DOT ABOVE
+0x1e61 "\\.{s}"                   "" "" # LATIN SMALL LETTER S WITH DOT ABOVE
+0x1e62 "\\d{S}"                   "" "" # LATIN CAPITAL LETTER S WITH DOT BELOW
+0x1e63 "\\d{s}"                   "" "" # LATIN SMALL LETTER S WITH DOT BELOW
+#0x1e64 ""                         "" "" # LATIN CAPITAL LETTER S WITH ACUTE AND DOT ABOVE
+#0x1e65 ""                         "" "" # LATIN SMALL LETTER S WITH ACUTE AND DOT ABOVE
+#0x1e66 ""                         "" "" # LATIN CAPITAL LETTER S WITH CARON AND DOT ABOVE
+#0x1e67 ""                         "" "" # LATIN SMALL LETTER S WITH CARON AND DOT ABOVE
+#0x1e68 ""                         "" "" # LATIN CAPITAL LETTER S WITH DOT BELOW AND DOT ABOVE
+#0x1e69 ""                         "" "" # LATIN SMALL LETTER S WITH DOT BELOW AND DOT ABOVE
+0x1e6a "\\.{T}"                   "" "" # LATIN CAPITAL LETTER T WITH DOT ABOVE
+0x1e6b "\\.{t}"                   "" "" # LATIN SMALL LETTER T WITH DOT ABOVE
+0x1e6c "\\d{T}"                   "" "" # LATIN CAPITAL LETTER T WITH DOT BELOW
+0x1e6d "\\d{t}"                   "" "" # LATIN SMALL LETTER T WITH DOT BELOW
+#0x1e6e ""                         "" "" # LATIN CAPITAL LETTER T WITH LINE BELOW
+#0x1e6f ""                         "" "" # LATIN SMALL LETTER T WITH LINE BELOW
+0x1e70 "\\textsubcircum{T}"       "tipa" "" # LATIN CAPITAL LETTER T WITH CIRCUMFLEX BELOW
+0x1e71 "\\textsubcircum{t}"       "tipa" "" # LATIN SMALL LETTER T WITH CIRCUMFLEX BELOW
+#0x1e72 ""                         "" "" # LATIN CAPITAL LETTER U WITH DIAERESIS BELOW
+#0x1e73 ""                         "" "" # LATIN SMALL LETTER U WITH DIAERESIS BELOW
+0x1e74 "\\textsubtilde{U}"        "tipa" "" # LATIN CAPITAL LETTER U WITH TILDE BELOW
+0x1e75 "\\textsubtilde{u}"        "tipa" "" # LATIN SMALL LETTER U WITH TILDE BELOW
+0x1e76 "\\textsubcircum{U}"       "tipa" "" # LATIN CAPITAL LETTER U WITH CIRCUMFLEX BELOW
+0x1e77 "\\textsubcircum{u}"       "tipa" "" # LATIN SMALL LETTER U WITH CIRCUMFLEX BELOW
+#0x1e78 ""                         "" "" # LATIN CAPITAL LETTER U WITH TILDE AND ACUTE
+#0x1e79 ""                         "" "" # LATIN SMALL LETTER U WITH TILDE AND ACUTE
+#0x1e7a ""                         "" "" # LATIN CAPITAL LETTER U WITH MACRON AND DIAERESIS
+#0x1e7b ""                         "" "" # LATIN SMALL LETTER U WITH MACRON AND DIAERESIS
+0x1e7c "\\~{V}"                   "" "" # LATIN CAPITAL LETTER V WITH TILDE
+0x1e7d "\\~{v}"                   "" "" # LATIN SMALL LETTER V WITH TILDE
+0x1e7e "\\d{V}"                   "" "" # LATIN CAPITAL LETTER V WITH DOT BELOW
+0x1e7f "\\d{v}"                   "" "" # LATIN SMALL LETTER V WITH DOT BELOW
+0x1e80 "\\`{W}"                   "" "" # LATIN CAPITAL LETTER W WITH GRAVE
+0x1e81 "\\`{w}"                   "" "" # LATIN SMALL LETTER W WITH GRAVE
+0x1e82 "\\'{W}"                   "" "" # LATIN CAPITAL LETTER W WITH ACUTE
+0x1e83 "\\'{w}"                   "" "" # LATIN SMALL LETTER W WITH ACUTE
+0x1e84 "\\\"{W}"                  "" "" # LATIN CAPITAL LETTER W WITH DIAERESIS
+0x1e85 "\\\"{w}"                  "" "" # LATIN SMALL LETTER W WITH DIAERESIS
+0x1e86 "\\.{W}"                   "" "" # LATIN CAPITAL LETTER W WITH DOT ABOVE
+0x1e87 "\\.{w}"                   "" "" # LATIN SMALL LETTER W WITH DOT ABOVE
+0x1e88 "\\d{W}"                   "" "" # LATIN CAPITAL LETTER W WITH DOT BELOW
+0x1e89 "\\d{w}"                   "" "" # LATIN SMALL LETTER W WITH DOT BELOW
+0x1e8a "\\.{X}"                   "" "" # LATIN CAPITAL LETTER X WITH DOT ABOVE
+0x1e8b "\\.{x}"                   "" "" # LATIN SMALL LETTER X WITH DOT ABOVE
+0x1e8c "\\\"{X}"                  "" "" # LATIN CAPITAL LETTER X WITH DIAERESIS
+0x1e8d "\\\"{x}"                  "" "" # LATIN SMALL LETTER X WITH DIAERESIS
+0x1e8e "\\.{Y}"                   "" "" # LATIN CAPITAL LETTER Y WITH DOT ABOVE
+0x1e8f "\\.{y}"                   "" "" # LATIN SMALL LETTER Y WITH DOT ABOVE
+0x1e90 "\\^{Z}"                   "" "" # LATIN CAPITAL LETTER Z WITH CIRCUMFLEX
+0x1e91 "\\^{z}"                   "" "" # LATIN SMALL LETTER Z WITH CIRCUMFLEX
+0x1e92 "\\d{Z}"                   "" "" # LATIN CAPITAL LETTER Z WITH DOT BELOW
+0x1e93 "\\d{z}"                   "" "" # LATIN SMALL LETTER Z WITH DOT BELOW
+#0x1e94 ""                         "" "" # LATIN CAPITAL LETTER Z WITH LINE BELOW
+#0x1e95 ""                         "" "" # LATIN SMALL LETTER Z WITH LINE BELOW
+#0x1e96 ""                         "" "" # LATIN SMALL LETTER H WITH LINE BELOW
+0x1e97 "\\\"{t}"                  "" "" # LATIN SMALL LETTER T WITH DIAERESIS
+0x1e98 "\\r{w}"                   "" "" # LATIN SMALL LETTER W WITH RING ABOVE
+0x1e99 "\\r{y}"                   "" "" # LATIN SMALL LETTER Y WITH RING ABOVE
+#0x1e9a ""                         "" "" # LATIN SMALL LETTER A WITH RIGHT HALF RING
+#0x1e9b ""                         "" "" # LATIN SMALL LETTER LONG S WITH DOT ABOVE
+0x1ea0 "\\d{A}"                   "" "" # LATIN CAPITAL LETTER A WITH DOT BELOW
+0x1ea1 "\\d{a}"                   "" "" # LATIN SMALL LETTER A WITH DOT BELOW
+#0x1ea2 ""                         "" "" # LATIN CAPITAL LETTER A WITH HOOK ABOVE
+#0x1ea3 ""                         "" "" # LATIN SMALL LETTER A WITH HOOK ABOVE
+#0x1ea4 ""                         "" "" # LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND ACUTE
+#0x1ea5 ""                         "" "" # LATIN SMALL LETTER A WITH CIRCUMFLEX AND ACUTE
+#0x1ea6 ""                         "" "" # LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND GRAVE
+#0x1ea7 ""                         "" "" # LATIN SMALL LETTER A WITH CIRCUMFLEX AND GRAVE
+#0x1ea8 ""                         "" "" # LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND HOOK ABOVE
+#0x1ea9 ""                         "" "" # LATIN SMALL LETTER A WITH CIRCUMFLEX AND HOOK ABOVE
+#0x1eaa ""                         "" "" # LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND TILDE
+#0x1eab ""                         "" "" # LATIN SMALL LETTER A WITH CIRCUMFLEX AND TILDE
+#0x1eac ""                         "" "" # LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND DOT BELOW
+#0x1ead ""                         "" "" # LATIN SMALL LETTER A WITH CIRCUMFLEX AND DOT BELOW
+#0x1eae ""                         "" "" # LATIN CAPITAL LETTER A WITH BREVE AND ACUTE
+#0x1eaf ""                         "" "" # LATIN SMALL LETTER A WITH BREVE AND ACUTE
+#0x1eb0 ""                         "" "" # LATIN CAPITAL LETTER A WITH BREVE AND GRAVE
+#0x1eb1 ""                         "" "" # LATIN SMALL LETTER A WITH BREVE AND GRAVE
+#0x1eb2 ""                         "" "" # LATIN CAPITAL LETTER A WITH BREVE AND HOOK ABOVE
+#0x1eb3 ""                         "" "" # LATIN SMALL LETTER A WITH BREVE AND HOOK ABOVE
+#0x1eb4 ""                         "" "" # LATIN CAPITAL LETTER A WITH BREVE AND TILDE
+#0x1eb5 ""                         "" "" # LATIN SMALL LETTER A WITH BREVE AND TILDE
+#0x1eb6 ""                         "" "" # LATIN CAPITAL LETTER A WITH BREVE AND DOT BELOW
+#0x1eb7 ""                         "" "" # LATIN SMALL LETTER A WITH BREVE AND DOT BELOW
+0x1eb8 "\\d{E}"                   "" "" # LATIN CAPITAL LETTER E WITH DOT BELOW
+0x1eb9 "\\d{e}"                   "" "" # LATIN SMALL LETTER E WITH DOT BELOW
+#0x1eba ""                         "" "" # LATIN CAPITAL LETTER E WITH HOOK ABOVE
+#0x1ebb ""                         "" "" # LATIN SMALL LETTER E WITH HOOK ABOVE
+0x1ebc "\\~{E}"                   "" "" # LATIN CAPITAL LETTER E WITH TILDE
+0x1ebd "\\~{e}"                   "" "" # LATIN SMALL LETTER E WITH TILDE
+#0x1ebe ""                         "" "" # LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND ACUTE
+#0x1ebf ""                         "" "" # LATIN SMALL LETTER E WITH CIRCUMFLEX AND ACUTE
+#0x1ec0 ""                         "" "" # LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND GRAVE
+#0x1ec1 ""                         "" "" # LATIN SMALL LETTER E WITH CIRCUMFLEX AND GRAVE
+#0x1ec2 ""                         "" "" # LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND HOOK ABOVE
+#0x1ec3 ""                         "" "" # LATIN SMALL LETTER E WITH CIRCUMFLEX AND HOOK ABOVE
+#0x1ec4 ""                         "" "" # LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND TILDE
+#0x1ec5 ""                         "" "" # LATIN SMALL LETTER E WITH CIRCUMFLEX AND TILDE
+#0x1ec6 ""                         "" "" # LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND DOT BELOW
+#0x1ec7 ""                         "" "" # LATIN SMALL LETTER E WITH CIRCUMFLEX AND DOT BELOW
+#0x1ec8 ""                         "" "" # LATIN CAPITAL LETTER I WITH HOOK ABOVE
+#0x1ec9 ""                         "" "" # LATIN SMALL LETTER I WITH HOOK ABOVE
+0x1eca "\\d{I}"                   "" "" # LATIN CAPITAL LETTER I WITH DOT BELOW
+0x1ecb "\\d{i}"                   "" "" # LATIN SMALL LETTER I WITH DOT BELOW
+0x1ecc "\\d{O}"                   "" "" # LATIN CAPITAL LETTER O WITH DOT BELOW
+0x1ecd "\\d{o}"                   "" "" # LATIN SMALL LETTER O WITH DOT BELOW
+#0x1ece ""                         "" "" # LATIN CAPITAL LETTER O WITH HOOK ABOVE
+#0x1ecf ""                         "" "" # LATIN SMALL LETTER O WITH HOOK ABOVE
+#0x1ed0 ""                         "" "" # LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND ACUTE
+#0x1ed1 ""                         "" "" # LATIN SMALL LETTER O WITH CIRCUMFLEX AND ACUTE
+#0x1ed2 ""                         "" "" # LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND GRAVE
+#0x1ed3 ""                         "" "" # LATIN SMALL LETTER O WITH CIRCUMFLEX AND GRAVE
+#0x1ed4 ""                         "" "" # LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND HOOK ABOVE
+#0x1ed5 ""                         "" "" # LATIN SMALL LETTER O WITH CIRCUMFLEX AND HOOK ABOVE
+#0x1ed6 ""                         "" "" # LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND TILDE
+#0x1ed7 ""                         "" "" # LATIN SMALL LETTER O WITH CIRCUMFLEX AND TILDE
+#0x1ed8 ""                         "" "" # LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND DOT BELOW
+#0x1ed9 ""                         "" "" # LATIN SMALL LETTER O WITH CIRCUMFLEX AND DOT BELOW
+#0x1eda ""                         "" "" # LATIN CAPITAL LETTER O WITH HORN AND ACUTE
+#0x1edb ""                         "" "" # LATIN SMALL LETTER O WITH HORN AND ACUTE
+#0x1edc ""                         "" "" # LATIN CAPITAL LETTER O WITH HORN AND GRAVE
+#0x1edd ""                         "" "" # LATIN SMALL LETTER O WITH HORN AND GRAVE
+#0x1ede ""                         "" "" # LATIN CAPITAL LETTER O WITH HORN AND HOOK ABOVE
+#0x1edf ""                         "" "" # LATIN SMALL LETTER O WITH HORN AND HOOK ABOVE
+#0x1ee0 ""                         "" "" # LATIN CAPITAL LETTER O WITH HORN AND TILDE
+#0x1ee1 ""                         "" "" # LATIN SMALL LETTER O WITH HORN AND TILDE
+#0x1ee2 ""                         "" "" # LATIN CAPITAL LETTER O WITH HORN AND DOT BELOW
+#0x1ee3 ""                         "" "" # LATIN SMALL LETTER O WITH HORN AND DOT BELOW
+0x1ee4 "\\d{U}"                   "" "" # LATIN CAPITAL LETTER U WITH DOT BELOW
+0x1ee5 "\\d{u}"                   "" "" # LATIN SMALL LETTER U WITH DOT BELOW
+#0x1ee6 ""                         "" "" # LATIN CAPITAL LETTER U WITH HOOK ABOVE
+#0x1ee7 ""                         "" "" # LATIN SMALL LETTER U WITH HOOK ABOVE
+#0x1ee8 ""                         "" "" # LATIN CAPITAL LETTER U WITH HORN AND ACUTE
+#0x1ee9 ""                         "" "" # LATIN SMALL LETTER U WITH HORN AND ACUTE
+#0x1eea ""                         "" "" # LATIN CAPITAL LETTER U WITH HORN AND GRAVE
+#0x1eeb ""                         "" "" # LATIN SMALL LETTER U WITH HORN AND GRAVE
+#0x1eec ""                         "" "" # LATIN CAPITAL LETTER U WITH HORN AND HOOK ABOVE
+#0x1eed ""                         "" "" # LATIN SMALL LETTER U WITH HORN AND HOOK ABOVE
+#0x1eee ""                         "" "" # LATIN CAPITAL LETTER U WITH HORN AND TILDE
+#0x1eef ""                         "" "" # LATIN SMALL LETTER U WITH HORN AND TILDE
+#0x1ef0 ""                         "" "" # LATIN CAPITAL LETTER U WITH HORN AND DOT BELOW
+#0x1ef1 ""                         "" "" # LATIN SMALL LETTER U WITH HORN AND DOT BELOW
+0x1ef2 "\\`{Y}"                   "" "" # LATIN CAPITAL LETTER Y WITH GRAVE
+0x1ef3 "\\`{y}"                   "" "" # LATIN SMALL LETTER Y WITH GRAVE
+0x1ef4 "\\d{Y}"                   "" "" # LATIN CAPITAL LETTER Y WITH DOT BELOW
+0x1ef5 "\\d{y}"                   "" "" # LATIN SMALL LETTER Y WITH DOT BELOW
+#0x1ef6 ""                         "" "" # LATIN CAPITAL LETTER Y WITH HOOK ABOVE
+#0x1ef7 ""                         "" "" # LATIN SMALL LETTER Y WITH HOOK ABOVE
+0x1ef8 "\\~{Y}"                   "" "" # LATIN CAPITAL LETTER Y WITH TILDE
+0x1ef9 "\\~{y}"                   "" "" # LATIN SMALL LETTER Y WITH TILDE
+# general punctuation
+0x2010 "-"                        "" "" # HYPHEN # identical in LaTeX to FIGURE DASH
+0x2012 "-"                        "" "" # FIGURE DASH
+0x2013 "\\textendash"             "" "" # EN DASH
+0x2014 "\\textemdash"             "" "" # EM DASH
+# use the following macro for the character HORIZONTAL BAR
+0x2015 "\\LyXbar" "\\newcommand*\\LyXbar{\\rule[0.585ex]{1.2em}{0.25pt}}" ""
+0x2016 "\\textbardbl"             "textcomp" "" # DOUBLE VERTICAL LINE
+#0x2017 ""                         "" "" # DOUBLE LOW LINE
+0x2018 "\\textquoteleft"          "" "" # LEFT SINGLE QUOTATION MARK
+0x2019 "\\textquoteright"         "" "" # RIGHT SINGLE QUOTATION MARK
+0x201a "\\quotesinglbase"         "" "" # SINGLE LOW-9 QUOTATION MARK
+#0x201b ""                         "" "" # SINGLE HIGH-REVERSED-9 QUOTATION MARK
+0x201c "\\textquotedblleft"       "" "" # LEFT DOUBLE QUOTATION MARK
+0x201d "\\textquotedblright"      "" "" # RIGHT DOUBLE QUOTATION MARK
+0x201e "\\quotedblbase"           "" "" # DOUBLE LOW-9 QUOTATION MARK
+#0x201f ""                         "" "" # DOUBLE LOW-REVERSED-9 QUOTATION MARK
+0x2020 "\\dag"                    "" "" # DAGGER
+0x2021 "\\ddag"                   "" "" # DOUBLE DAGGER
+0x2022 "\\textbullet"             "textcomp" "" # BULLET
+0x2023 "\\textifsymbol[ifgeo]{116}" "ifsym" "" # TRIANGULAR BULLET # → 0x25b8
+0x2024 "."                        "" "" # ONE DOT LEADER # → FULL STOP
+0x2025 ".\\,."                    "" "" # TWO DOT LEADER
+0x2026 "\\ldots"                  "" "" # HORIZONTAL ELLIPSIS
+#0x2027 ""                         "" "" # HYPHENATION POINT
+0x2030 "\\textperthousand"        "textcomp" "" # PER MILLE SIGN
+0x2031 "\\textpertenthousand"     "textcomp" "" # PER TEN THOUSAND SIGN
+0x2032 "\\textasciiacute"         "textcomp" "" # PRIME
+0x2033 "\\textacutedbl"           "textcomp" "" # DOUBLE PRIME
+#0x2034 ""                         "" "" # TRIPLE PRIME
+0x2035 "\\textasciigrave"         "textcomp" "" # REVERSED PRIME
+0x2036 "\\textgravedbl"           "textcomp" "" # REVERSED DOUBLE PRIME
+#0x2037 ""                         "" "" # REVERSED TRIPLE PRIME
+0x2038 "\\^{}"                    "" "" # CARET
+0x2039 "\\guilsinglleft"          "" "" # SINGLE LEFT-POINTING ANGLE QUOTATION MARK
+0x203a "\\guilsinglright"         "" "" # SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
+0x203b "\\textreferencemark"      "textcomp" "" # REFERENCE MARK
+0x203c "!!"                       "" "" # DOUBLE EXCLAMATION MARK # → 2×EXCLAMATION MARK
+0x203d "\\textinterrobang"        "textcomp" "" # INTERROBANG
+# use the following macro for the character OVERLINE
+0x203e "\\LyXoverline" "\\newcommand*\\LyXoverline{\\raisebox{2.6ex}{\\_}}" ""
+0x2044 "\\textfractionsolidus"    "textcomp" "" # FRACTION SLASH
+0x2045 "\\textlquill"             "textcomp" "" # LEFT SQUARE BRACKET WITH QUILL
+0x2046 "\\textrquill"             "textcomp" "" # RIGHT SQUARE BRACKET WITH QUILL
+0x2047 "??"                       "" "" # DOUBLE QUESTION MARK # → 2×QUESTION MARK
+0x2048 "?!"                       "" "" # QUESTION EXCLAMATION MARK
+0x2049 "!?"                       "" "" # EXCLAMATION QUESTION MARK
+0x2052 "\\textdiscount"           "textcomp" "" # COMMERCIAL MINUS SIGN
+0x205d "\\vdots"                  "" "" # TRICOLON # → VERTICAL ELLIPSIS
+# currency symbols
+0x20a1 "\\textcolonmonetary"      "textcomp" "" # COLON SIGN
+0x20a3 "\\textfrenchfranc"        "textcomp" "" # FRENCH FRANC SIGN
+0x20a4 "\\textlira"               "textcomp" "" # LIRA SIGN
+0x20a6 "\\textnaira"              "textcomp" "" # NAIRA SIGN
+#0x20a7 ""                         "" "" # PESETA SIGN
+0x20a9 "\\textwon"                "textcomp" "" # WON SIGN
+#0x20aa ""                         "" "" # NEW SHEQEL SIGN
+0x20ab "\\textdong"               "textcomp" "" # DONG SIGN
+0x20ac "\\texteuro"               "textcomp" "" # EURO SIGN
+0x20b1 "\\textpeso"               "textcomp" "" # PESO SIGN
+0x20b2 "\\textguarani"            "textcomp" "" # GUARANI SIGN
+# letterlike symbols
+# use the following macro for the character ACCOUNT OF
+0x2100 "\\LyXaccountof" "\\newcommand*\\LyXaccountof{\\mbox{\\raisebox{.8ex}{a}\\kern-.175em\\raisebox{.2ex}{/}\\kern-.18em\\raisebox{-.2ex}{c}}}" ""
+# use the following macro for the character ADDRESSED TO THE SUBJECT
+0x2101 "\\LyXaddressed" "\\newcommand*\\LyXaddressed{\\mbox{\\raisebox{.8ex}{a}\\kern-.175em\\raisebox{.2ex}{/}\\kern-.18em\\raisebox{-.2ex}{s}}}" ""
+0x2102 "\\ensuremath{\\mathbb{C}}" "amssymb" "" # DOUBLE-STRUCK CAPITAL C
+0x2103 "\\textcelsius"            "textcomp" "" # DEGREE CELSIUS
+# use the following macro for the character CARE OF
+0x2105 "\\LyXcareof" "\\newcommand*\\LyXcareof{\\mbox{\\raisebox{.8ex}{c}\\kern-.175em\\raisebox{.2ex}{/}\\kern-.18em\\raisebox{-.2ex}{o}}}" ""
+# use the following macro for the character CADA UNA
+0x2106 "\\LyXcadauna" "\\newcommand*\\LyXcadauna{\\mbox{\\raisebox{.8ex}{c}\\kern-.175em\\raisebox{.2ex}{/}\\kern-.18em\\raisebox{-.2ex}{u}}}" ""
+0x2109 "°{}F"                     "" "" # DEGREE FAHRENHEIT
+0x210a "\\ensuremath{\\mathscr{g}}" "mathrsfs" "" # SCRIPT SMALL G
+0x210b "\\ensuremath{\\mathscr{H}}" "mathrsfs" "" # SCRIPT CAPITAL H
+0x210c "\\ensuremath{\\mathfrak{H}}" "amssymb" "" # BLACK-LETTER CAPITAL H
+0x210d "\\ensuremath{\\mathbb{H}}" "amssymb" "" # DOUBLE-STRUCK CAPITAL H
+0x210e "\\ensuremath{h}"          "" "" # PLANCK CONSTANT
+0x210f "\\ensuremath{\\hbar}"     "amssymb" "" # PLANCK CONSTANT OVER TWO PI
+0x2110 "\\ensuremath{\\mathscr{I}}" "mathrsfs" "" # SCRIPT CAPITAL I
+0x2111 "\\ensuremath{\\mathfrak{I}}" "amssymb" "" # BLACK-LETTER CAPITAL I
+0x2112 "\\ensuremath{\\mathscr{L}}" "mathrsfs" "" # SCRIPT CAPITAL L
+0x2113 "\\ensuremath{\\ell}"      "" "" # SCRIPT SMALL L
+0x2115 "\\ensuremath{\\mathbb{N}}" "amssymb" "" # DOUBLE-STRUCK CAPITAL N
+0x2116 "\\textnumero"             "textcomp" "" # NUMERO SIGN
+0x2117 "\\textcircledP"           "textcomp" "" # SOUND RECORDING COPYRIGHT
+0x2118 "\\ensuremath{\\mathscr{P}}" "mathrsfs" "" # SCRIPT CAPITAL P
+0x2119 "\\ensuremath{\\mathbb{P}}" "amssymb" "" # DOUBLE-STRUCK CAPITAL P
+0x211a "\\ensuremath{\\mathbb{Q}}" "amssymb" "" # DOUBLE-STRUCK CAPITAL Q
+0x211b "\\ensuremath{\\mathscr{R}}" "mathrsfs" "" # SCRIPT CAPITAL R
+0x211c "\\ensuremath{\\mathfrak{R}}" "amssymb" "" # BLACK-LETTER CAPITAL R
+0x211d "\\ensuremath{\\mathbb{R}}" "amssymb" "" # DOUBLE-STRUCK CAPITAL R
+0x211e "\\textrecipe"             "textcomp" "" # PRESCRIPTION TAKE
+0x2120 "\\textservicemark"        "textcomp" "" # SERVICE MARK
+#0x2121 ""                         "" "" # TELEPHONE SIGN
+0x2122 "\\texttrademark"          "textcomp" "" # TRADE MARK SIGN
+0x2124 "\\ensuremath{\\mathbb{Z}}" "amssymb" "" # DOUBLE-STRUCK CAPITAL Z
+0x2126 "\\textohm"                "textcomp" "" # OHM SIGN
+0x2127 "\\textmho"                "textcomp" "" # INVERTED OHM SIGN
+0x2128 "\\ensuremath{\\mathfrak{Z}}" "amssymb" "" # BLACK-LETTER CAPITAL Z
+0x212a "K"                        "" "" # KELVIN SIGN
+0x212b "\\AA"                     "" "" # ANGSTROM SIGN
+0x212c "\\ensuremath{\\mathscr{B}}" "mathrsfs" "" # SCRIPT CAPITAL B
+0x212d "\\ensuremath{\\mathfrak{C}}" "amssymb" "" # BLACK-LETTER CAPITAL C
+0x212e "\\textestimated"          "textcomp" "" # ESTIMATED SYMBOL
+0x212f "\\ensuremath{\\mathscr{e}}" "mathrsfs" "" # SCRIPT SMALL E
+0x2130 "\\ensuremath{\\mathscr{E}}" "mathrsfs" "" # SCRIPT CAPITAL E
+0x2131 "\\ensuremath{\\mathscr{F}}" "mathrsfs" "" # SCRIPT CAPITAL F
+0x2133 "\\ensuremath{\\mathscr{M}}" "mathrsfs" "" # SCRIPT CAPITAL M
+0x2134 "\\ensuremath{\\mathscr{o}}" "mathrsfs" "" # SCRIPT SMALL O
+0x2135 "\\ensuremath{\\aleph}"    "amssymb" "" # ALEF SYMBOL
+0x2136 "\\ensuremath{\\beth}"     "amssymb" "" # BET SYMBOL
+0x2137 "\\ensuremath{\\gimel}"    "amssymb" "" # GIMEL SYMBOL
+0x2138 "\\ensuremath{\\daleth}"   "amssymb" "" # DALET SYMBOL
+#0x2139 ""                         "" "" # INFORMATION SOURCE
+#0x213b ""                         "" "" # FACSIMILE SIGN
+# use the following macro for the character AKTIESELSKAB
+0x214e "\\LyXaktie" "\\newcommand*\\LyXaktie{\\mbox{\\raisebox{.8ex}{A}\\kern-.175em\\raisebox{.2ex}{/}\\kern-.18em\\raisebox{-.2ex}{S}}}" ""
+# number forms
+# use the following macro for the character VULGAR FRACTION ONE THIRD
+0x2153 "\\LyXonethird" "\\newcommand*\\LyXonethird{\\mbox{\\raisebox{.8ex}{1}\\kern-.175em\\raisebox{.2ex}{/}\\kern-.18em\\raisebox{-.2ex}{3}}}" ""
+# use the following macro for the character VULGAR FRACTION TWO THIRDS
+0x2154 "\\LyXtwothirds" "\\newcommand*\\LyXtwothirds{\\mbox{\\raisebox{.8ex}{2}\\kern-.175em\\raisebox{.2ex}{/}\\kern-.18em\\raisebox{-.2ex}{3}}}" ""
+# use the following macro for the character VULGAR FRACTION ONE FIFTH
+0x2155 "\\LyXonefifth" "\\newcommand*\\LyXonefifth{\\mbox{\\raisebox{.8ex}{1}\\kern-.175em\\raisebox{.2ex}{/}\\kern-.18em\\raisebox{-.2ex}{5}}}" ""
+# use the following macro for the character VULGAR FRACTION TWO FIFTHS
+0x2156 "\\LyXtwofifths" "\\newcommand*\\LyXtwofifths{\\mbox{\\raisebox{.8ex}{2}\\kern-.175em\\raisebox{.2ex}{/}\\kern-.18em\\raisebox{-.2ex}{5}}}" ""
+# use the following macro for the character VULGAR FRACTION THREE FIFTHS
+0x2157 "\\LyXthreefifths" "\\newcommand*\\LyXthreefifths{\\mbox{\\raisebox{.8ex}{3}\\kern-.175em\\raisebox{.2ex}{/}\\kern-.18em\\raisebox{-.2ex}{5}}}" ""
+# use the following macro for the character VULGAR FRACTION FOUR FIFTHS
+0x2158 "\\LyXfourfifths" "\\newcommand*\\LyXfourfifths{\\mbox{\\raisebox{.8ex}{4}\\kern-.175em\\raisebox{.2ex}{/}\\kern-.18em\\raisebox{-.2ex}{5}}}" ""
+# use the following macro for the character VULGAR FRACTION ONE SIXTH
+0x2159 "\\LyXonesixth" "\\newcommand*\\LyXonesixth{\\mbox{\\raisebox{.8ex}{1}\\kern-.175em\\raisebox{.2ex}{/}\\kern-.18em\\raisebox{-.2ex}{6}}}" ""
+# use the following macro for the character VULGAR FRACTION FIVE SIXTHS
+0x215a "\\LyXfivesixths" "\\newcommand*\\LyXfivesixths{\\mbox{\\raisebox{.8ex}{5}\\kern-.175em\\raisebox{.2ex}{/}\\kern-.18em\\raisebox{-.2ex}{6}}}" ""
+# use the following macro for the character VULGAR FRACTION ONE EIGHTH
+0x215b "\\LyXoneeight" "\\newcommand*\\LyXoneeight{\\mbox{\\raisebox{.8ex}{1}\\kern-.175em\\raisebox{.2ex}{/}\\kern-.18em\\raisebox{-.2ex}{8}}}" ""
+# use the following macro for the character VULGAR FRACTION THREE EIGHTHS
+0x215c "\\LyXthreeeights" "\\newcommand*\\LyXthreeeights{\\mbox{\\raisebox{.8ex}{3}\\kern-.175em\\raisebox{.2ex}{/}\\kern-.18em\\raisebox{-.2ex}{8}}}" ""
+# use the following macro for the character VULGAR FRACTION FIVE EIGHTHS
+0x215d "\\LyXfiveeights" "\\newcommand*\\LyXfiveeights{\\mbox{\\raisebox{.8ex}{5}\\kern-.175em\\raisebox{.2ex}{/}\\kern-.18em\\raisebox{-.2ex}{8}}}" ""
+# use the following macro for the character VULGAR FRACTION SEVEN EIGHTHS
+0x215e "\\LyXseveneights" "\\newcommand*\\LyXseveneights{\\mbox{\\raisebox{.8ex}{7}\\kern-.175em\\raisebox{.2ex}{/}\\kern-.18em\\raisebox{-.2ex}{8}}}" ""
+# use the following macro for the character FRACTION NUMERATOR ONE
+0x215f "\\LyXnumeratorone" "\\newcommand*\\LyXnumeratorone{\\mbox{\\raisebox{.8ex}{1}\\kern-.175em\\raisebox{.2ex}{/}\\kern-.18em\\raisebox{-.2ex}{\\kern-.18em}}}" ""
+0x2160 "\\mbox{I}"                "" "" # ROMAN NUMERAL ONE
+0x2161 "\\mbox{II}"               "" "" # ROMAN NUMERAL TWO
+0x2162 "\\mbox{III}"              "" "" # ROMAN NUMERAL THREE
+0x2163 "\\mbox{IV}"               "" "" # ROMAN NUMERAL FOUR
+0x2164 "\\mbox{V}"                "" "" # ROMAN NUMERAL FIVE
+0x2165 "\\mbox{VI}"               "" "" # ROMAN NUMERAL SIX
+0x2166 "\\mbox{VII}"              "" "" # ROMAN NUMERAL SEVEN
+0x2167 "\\mbox{VIII}"             "" "" # ROMAN NUMERAL EIGHT
+0x2168 "\\mbox{IX}"               "" "" # ROMAN NUMERAL NINE
+0x2169 "\\mbox{X}"                "" "" # ROMAN NUMERAL TEN
+0x216a "\\mbox{XI}"               "" "" # ROMAN NUMERAL ELEVEN
+0x216b "\\mbox{XII}"              "" "" # ROMAN NUMERAL TWELVE
+0x216c "\\mbox{L}"                "" "" # ROMAN NUMERAL FIFTY
+0x216d "\\mbox{C}"                "" "" # ROMAN NUMERAL ONE HUNDRED
+0x216e "\\mbox{D}"                "" "" # ROMAN NUMERAL FIVE HUNDRED
+0x216f "\\mbox{M}"                "" "" # ROMAN NUMERAL ONE THOUSAND
+0x2170 "\\mbox{i}"                "" "" # SMALL ROMAN NUMERAL ONE
+0x2171 "\\mbox{ii}"               "" "" # SMALL ROMAN NUMERAL TWO
+0x2172 "\\mbox{iii}"              "" "" # SMALL ROMAN NUMERAL THREE
+0x2173 "\\mbox{iv}"               "" "" # SMALL ROMAN NUMERAL FOUR
+0x2174 "\\mbox{v}"                "" "" # SMALL ROMAN NUMERAL FIVE
+0x2175 "\\mbox{vi}"               "" "" # SMALL ROMAN NUMERAL SIX
+0x2176 "\\mbox{vii}"              "" "" # SMALL ROMAN NUMERAL SEVEN
+0x2177 "\\mbox{viii}"             "" "" # SMALL ROMAN NUMERAL EIGHT
+0x2178 "\\mbox{ix}"               "" "" # SMALL ROMAN NUMERAL NINE
+0x2179 "\\mbox{x}"                "" "" # SMALL ROMAN NUMERAL TEN
+0x217a "\\mbox{xi}"               "" "" # SMALL ROMAN NUMERAL ELEVEN
+0x217b "\\mbox{xii}"              "" "" # SMALL ROMAN NUMERAL TWELVE
+0x217c "\\mbox{l}"                "" "" # SMALL ROMAN NUMERAL FIFTY
+0x217d "\\mbox{c}"                "" "" # SMALL ROMAN NUMERAL ONE HUNDRED
+0x217e "\\mbox{d}"                "" "" # SMALL ROMAN NUMERAL FIVE HUNDRED
+0x217f "\\mbox{m}"                "" "" # SMALL ROMAN NUMERAL ONE THOUSAND
+# arrows
+0x2190 "\\textleftarrow"          "textcomp" "" # LEFTWARDS ARROW
+0x2191 "\\textuparrow"            "textcomp" "" # UPWARDS ARROW
+0x2192 "\\textrightarrow"         "textcomp" "" # RIGHTWARDS ARROW
+0x2193 "\\textdownarrow"          "textcomp" "" # DOWNWARDS ARROW
+0x2194 "\\ensuremath{\\leftrightarrow}" "" "" # LEFT RIGHT ARROW
+0x2195 "\\ensuremath{\\updownarrow}" "" "" # UP DOWN ARROW
+0x21a8 "{\\ascii\\ETB}"           "ascii" "" # UP DOWN ARROW WITH BASE
+# math symbols
+# besides textcomp only those used in Windows standard fonts
+0x2202 "\\ensuremath{\\partial}"  "" "" # PARTIAL DIFFERENTIAL
+0x2206 "\\ensuremath{\\Delta}"    "" "" # INCREMENT
+0x220f "\\ensuremath{\\prod}"     "" "" # N-ARY PRODUCT
+0x2211 "\\ensuremath{\\sum}"      "" "" # N-ARY SUMMATION
+0x2212 "\\textminus"              "textcomp" "" # MINUS SIGN
+0x2215 "\\ensuremath{\\slash}"    "" "" # DIVISION SLASH
+0x2217 "\\textasteriskcentered"   "textcomp" "" # ASTERISK OPERATOR
+0x2219 "\\ensuremath{\\centerdot}" "amssymb" "" # BULLET OPERATOR
+0x221a "\\textsurd"               "textcomp" "" # SQUARE ROOT
+0x221e "\\ensuremath{\\infty}"    "" "" # INFINITY
+# use the following macro for the character RIGHT ANGLE
+0x221f "\\LyXrightangle" "\\newcommand*\\LyXrightangle{{\\usefont{U}{msa}{m}{n}\\char120}}" ""
+0x2229 "\\ensuremath{\\bigcap}"   "" "" # INTERSECTION
+0x222b "\\ensuremath{\\int}"      "" "" # INTEGRAL
+0x2248 "\\ensuremath{\\approx}"   "" "" # ALMOST EQUAL TO
+0x2260 "\\ensuremath{\\neq}"      "" "" # NOT EQUAL TO
+0x2261 "\\ensuremath{\\equiv}"    "" "" # IDENTICAL TO
+0x2264 "\\ensuremath{\\le}"       "" "" # LESS-THAN OR EQUAL TO
+0x2265 "\\ensuremath{\\ge}"       "" "" # GREATER-THAN OR EQUAL TO
+# miscellaneous technical
+0x2302 "{\\ascii\\DEL}"           "ascii" "" # HOUSE
+0x2310 "\\ensuremath{\\invneg}"   "wasysym" "" # REVERSED NOT SIGN
+0x231a "\\Clocklogo"              "marvosym" "" # WATCH
+#0x2320 ""                         "" "" # TOP HALF INTEGRAL
+#0x2321 ""                         "" "" # BOTTOM HALF INTEGRAL
+0x2328 "\\Keyboard"               "marvosym" "" # KEYBOARD
+# control pictures
+0x2422 "\\textblank"              "textcomp" "" # BLANK SYMBOL
+0x2423 "\\textvisiblespace"       "textcomp" "" # OPEN BOX
+# box drawing
+0x2500 "\\textSFx"                "pmboxdraw" "" # BOX DRAWINGS LIGHT HORIZONTAL
+0x2502 "\\textSFxi"               "pmboxdraw" "" # BOX DRAWINGS LIGHT VERTICAL
+0x250c "\\textSFi"                "pmboxdraw" "" # BOX DRAWINGS LIGHT DOWN AND RIGHT
+0x2510 "\\textSFiii"              "pmboxdraw" "" # BOX DRAWINGS LIGHT DOWN AND LEFT
+0x2514 "\\textSFii"               "pmboxdraw" "" # BOX DRAWINGS LIGHT UP AND RIGHT
+0x2518 "\\textSFiv"               "pmboxdraw" "" # BOX DRAWINGS LIGHT UP AND LEFT
+0x251c "\\textSFviii"             "pmboxdraw" "" # BOX DRAWINGS LIGHT VERTICAL AND RIGHT
+0x2524 "\\textSFix"               "pmboxdraw" "" # BOX DRAWINGS LIGHT VERTICAL AND LEFT
+0x252c "\\textSFvi"               "pmboxdraw" "" # BOX DRAWINGS LIGHT DOWN AND HORIZONTAL
+0x2534 "\\textSFvii"              "pmboxdraw" "" # BOX DRAWINGS LIGHT UP AND HORIZONTAL
+0x253c "\\textSFv"                "pmboxdraw" "" # BOX DRAWINGS LIGHT VERTICAL AND HORIZONTAL
+0x2550 "\\textSFxliii"            "pmboxdraw" "" # BOX DRAWINGS DOUBLE HORIZONTAL
+0x2551 "\\textSFxxiv"             "pmboxdraw" "" # BOX DRAWINGS DOUBLE VERTICAL
+0x2552 "\\textSFli"               "pmboxdraw" "" # BOX DRAWINGS DOWN SINGLE AND RIGHT DOUBLE
+0x2553 "\\textSFlii"              "pmboxdraw" "" # BOX DRAWINGS DOWN DOUBLE AND RIGHT SINGLE
+0x2554 "\\textSFxxxix"            "pmboxdraw" "" # BOX DRAWINGS DOUBLE DOWN AND RIGHT
+0x2555 "\\textSFxxii"             "pmboxdraw" "" # BOX DRAWINGS DOWN SINGLE AND LEFT DOUBLE
+0x2556 "\\textSFxxi"              "pmboxdraw" "" # BOX DRAWINGS DOWN DOUBLE AND LEFT SINGLE
+0x2557 "\\textSFxxv"              "pmboxdraw" "" # BOX DRAWINGS DOUBLE DOWN AND LEFT
+0x2558 "\\textSFl"                "pmboxdraw" "" # BOX DRAWINGS UP SINGLE AND RIGHT DOUBLE
+0x2559 "\\textSFxlix"             "pmboxdraw" "" # BOX DRAWINGS UP DOUBLE AND RIGHT SINGLE
+0x255a "\\textSFxxxviii"          "pmboxdraw" "" # BOX DRAWINGS DOUBLE UP AND RIGHT
+0x255b "\\textSFxxviii"           "pmboxdraw" "" # BOX DRAWINGS UP SINGLE AND LEFT DOUBLE
+0x255c "\\textSFxxvii"            "pmboxdraw" "" # BOX DRAWINGS UP DOUBLE AND LEFT SINGLE
+0x255d "\\textSFxxvi"             "pmboxdraw" "" # BOX DRAWINGS DOUBLE UP AND LEFT
+0x255e "\\textSFxxxvi"            "pmboxdraw" "" # BOX DRAWINGS VERTICAL SINGLE AND RIGHT DOUBLE
+0x255f "\\textSFxxxvii"           "pmboxdraw" "" # BOX DRAWINGS VERTICAL DOUBLE AND RIGHT SINGLE
+0x2560 "\\textSFxlii"             "pmboxdraw" "" # BOX DRAWINGS DOUBLE VERTICAL AND RIGHT
+0x2561 "\\textSFxix"              "pmboxdraw" "" # BOX DRAWINGS VERTICAL SINGLE AND LEFT DOUBLE
+0x2562 "\\textSFxx"               "pmboxdraw" "" # BOX DRAWINGS VERTICAL DOUBLE AND LEFT SINGLE
+0x2563 "\\textSFxxiii"            "pmboxdraw" "" # BOX DRAWINGS DOUBLE VERTICAL AND LEFT
+0x2564 "\\textSFxlvii"            "pmboxdraw" "" # BOX DRAWINGS DOWN SINGLE AND HORIZONTAL DOUBLE
+0x2565 "\\textSFxlviii"           "pmboxdraw" "" # BOX DRAWINGS DOWN DOUBLE AND HORIZONTAL SINGLE
+0x2566 "\\textSFxli"              "pmboxdraw" "" # BOX DRAWINGS DOUBLE DOWN AND HORIZONTAL
+0x2567 "\\textSFxlv"              "pmboxdraw" "" # BOX DRAWINGS UP SINGLE AND HORIZONTAL DOUBLE
+0x2568 "\\textSFxlvi"             "pmboxdraw" "" # BOX DRAWINGS UP DOUBLE AND HORIZONTAL SINGLE
+0x2569 "\\textSFxl"               "pmboxdraw" "" # BOX DRAWINGS DOUBLE UP AND HORIZONTAL
+0x256a "\\textSFliv"              "pmboxdraw" "" # BOX DRAWINGS VERTICAL SINGLE AND HORIZONTAL DOUBLE
+0x256b "\\textSFliii"             "pmboxdraw" "" # BOX DRAWINGS VERTICAL DOUBLE AND HORIZONTAL SINGLE
+0x256c "\\textSFxliv"             "pmboxdraw" "" # BOX DRAWINGS DOUBLE VERTICAL AND HORIZONTAL
+# block elements
+0x2580 "\\textupblock"            "pmboxdraw" "" # UPPER HALF BLOCK
+0x2584 "\\textdnblock"            "pmboxdraw" "" # LOWER HALF BLOCK
+0x2588 "\\textblock"              "pmboxdraw" "" # FULL BLOCK
+0x258c "\\textlfblock"            "pmboxdraw" "" # LEFT HALF BLOCK
+0x2590 "\\textrtblock"            "pmboxdraw" "" # RIGHT HALF BLOCK
+0x2591 "\\textltshade"            "pmboxdraw" "" # LIGHT SHADE
+0x2592 "\\textshade"              "pmboxdraw" "" # MEDIUM SHADE
+0x2593 "\\textdkshade"            "pmboxdraw" "" # DARK SHADE
+# geometric shapes
+0x25a0 "\\textifsymbol[ifgeo]{80}" "ifsym" "" # BLACK SQUARE
+0x25a1 "\\textifsymbol[ifgeo]{32}" "ifsym" "" # WHITE SQUARE
+0x25aa "\\textifsymbol[ifgeo]{112}" "ifsym" "" # BLACK SMALL SQUARE
+0x25ab "\\textifsymbol[ifgeo]{64}" "ifsym" "" # WHITE SMALL SQUARE
+0x25ac "{\\ascii\\SYN}"           "ascii" "" # BLACK RECTANGLE
+0x25b2 "\\textifsymbol[ifgeo]{97}" "ifsym" "" # BLACK UP-POINTING TRIANGLE
+0x25b3 "\\textifsymbol[ifgeo]{49}" "ifsym" "" # WHITE UP-POINTING TRIANGLE
+0x25b4 "\\textifsymbol[ifgeo]{113}" "ifsym" "" # BLACK UP-POINTING SMALL TRIANGLE
+0x25b5 "\\textifsymbol[ifgeo]{65}" "ifsym" "" # WHITE UP-POINTING SMALL TRIANGLE
+0x25b6 "\\textifsymbol[ifgeo]{100}" "ifsym" "" # BLACK RIGHT-POINTING TRIANGLE
+0x25b7 "\\textifsymbol[ifgeo]{52}" "ifsym" "" # WHITE RIGHT-POINTING TRIANGLE
+0x25b8 "\\textifsymbol[ifgeo]{116}" "ifsym" "" # BLACK RIGHT-POINTING SMALL TRIANGLE
+0x25b9 "\\textifsymbol[ifgeo]{68}" "ifsym" "" # WHITE RIGHT-POINTING SMALL TRIANGLE
+0x25ba "\\RIGHTarrow"             "wasysym" "" # BLACK RIGHT-POINTING POINTER
+0x25bc "\\textifsymbol[ifgeo]{99}" "ifsym" "" # BLACK DOWN-POINTING TRIANGLE
+0x25bd "\\textifsymbol[ifgeo]{51}" "ifsym" "" # WHITE DOWN-POINTING TRIANGLE
+0x25be "\\textifsymbol[ifgeo]{115}" "ifsym" "" # BLACK DOWN-POINTING SMALL TRIANGLE
+0x25bf "\\textifsymbol[ifgeo]{67}" "ifsym" "" # WHITE DOWN-POINTING SMALL TRIANGLE
+0x25c0 "\\textifsymbol[ifgeo]{98}" "ifsym" "" # BLACK LEFT-POINTING TRIANGLE
+0x25c1 "\\textifsymbol[ifgeo]{50}" "ifsym" "" # WHITE LEFT-POINTING TRIANGLE
+0x25c2 "\\textifsymbol[ifgeo]{114}" "ifsym" "" # BLACK LEFT-POINTING SMALL TRIANGLE
+0x25c3 "\\textifsymbol[ifgeo]{66}" "ifsym" "" # WHITE LEFT-POINTING SMALL TRIANGLE
+0x25c4 "\\LEFTarrow"              "wasysym" "" # BLACK LEFT-POINTING POINTER
+0x25c6 "\\textifsymbol[ifgeo]{102}" "ifsym" "" # BLACK DIAMOND
+0x25c7 "\\textifsymbol[ifgeo]{54}" "ifsym" "" # WHITE DIAMOND
+0x25ca "\\ensuremath{\\lozenge}"  "amssymb" "" # LOZENGE
+0x25cb "\\Circle"                 "wasysym" "" # WHITE CIRCLE
+0x25cf "\\CIRCLE"                 "wasysym" "" # BLACK CIRCLE
+0x25d0 "\\LEFTcircle"             "wasysym" "" # CIRCLE WITH LEFT HALF BLACK
+0x25d1 "\\RIGHTcircle"            "wasysym" "" # CIRCLE WITH RIGHT HALF BLACK
+0x25d6 "\\LEFTCIRCLE"             "wasysym" "" # LEFT HALF BLACK CIRCLE
+0x25d7 "\\RIGHTCIRCLE"            "wasysym" "" # RIGHT HALF BLACK CIRCLE
+0x25d8 "{\\ascii\\BS}"            "ascii" "" # INVERSE BULLET
+0x25d9 "{\\ascii\\LF}"            "ascii" "" # INVERSE WHITE CIRCLE
+0x25e6 "\\textopenbullet"         "textcomp" "" # WHITE BULLET
+0x25ef "\\textbigcircle"          "textcomp" "" # LARGE CIRCLE
+0x25fb "\\textifsymbol[ifgeo]{48}" "ifsym" "" # WHITE MEDIUM SQUARE
+0x25fc "\\textifsymbol[ifgeo]{96}" "ifsym" "" # BLACK MEDIUM SQUARE
+# miscellaneous symbols
+0x2605 "\\FiveStar"               "bbding" "" # BLACK STAR
+0x2606 "\\FiveStarOpen"           "bbding" "" # WHITE STAR
+0x260e "\\Telefon"                "marvosym" "" # BLACK TELEPHONE
+0x2610 "\\Square"                 "wasysym" "" # BALLOT BOX
+0x2611 "\\CheckedBox"             "wasysym" "" # BALLOT BOX WITH CHECK
+0x2612 "\\XBox"                   "wasysym" "" # BALLOT BOX WITH X
+0x261a "\\HandCuffLeft"           "bbding" "" # BLACK LEFT POINTING INDEX
+0x261b "\\HandCuffRight"          "bbding" "" # BLACK RIGHT POINTING INDEX
+0x261c "\\HandLeft"               "bbding" "" # WHITE LEFT POINTING INDEX
+0x261e "\\HandRight"              "bbding" "" # WHITE RIGHT POINTING INDEX
+0x2622 "\\Radioactivity"          "marvosym" "" # RADIOACTIVE SIGN
+0x2623 "\\Biohazard"              "marvosym" "" # BIOHAZARD SIGN
+0x2625 "\\Ankh"                   "marvosym" "" # ANKH
+0x262f "\\Yinyang"                "marvosym" "" # YIN YANG
+0x2639 "\\frownie"                "wasysym" "" # WHITE FROWNING FACE
+0x263a "\\smiley"                 "wasysym" "" # WHITE SMILING FACE
+0x263b "\\blacksmiley"            "wasysym" "" # BLACK SMILING FACE
+0x263c "\\sun"                    "wasysym" "" # WHITE SUN WITH RAYS
+0x263d "\\rightmoon"              "wasysym" "" # FIRST QUARTER MOON
+0x263e "\\leftmoon"               "wasysym" "" # LAST QUARTER MOON
+0x263f "\\mercury"                "wasysym" "" # MERCURY
+0x2640 "\\female"                 "wasysym" "" # FEMALE SIGN
+0x2641 "\\earth"                  "wasysym" "" # EARTH
+0x2642 "\\male"                   "wasysym" "" # MALE SIGN
+0x2643 "\\jupiter"                "wasysym" "" # JUPITER
+0x2644 "\\saturn"                 "wasysym" "" # SATURN
+0x2645 "\\uranus"                 "wasysym" "" # URANUS
+0x2646 "\\neptune"                "wasysym" "" # NEPTUNE
+0x2647 "\\pluto"                  "wasysym" "" # PLUTO
+0x2648 "\\aries"                  "wasysym" "" # ARIES
+0x2649 "\\taurus"                 "wasysym" "" # TAURUS
+0x264a "\\gemini"                 "wasysym" "" # GEMINI
+0x264b "\\cancer"                 "wasysym" "" # CANCER
+0x264c "\\leo"                    "wasysym" "" # LEO
+0x264d "\\virgo"                  "wasysym" "" # VIRGO
+0x264e "\\libra"                  "wasysym" "" # LIBRA
+0x264f "\\scorpio"                "wasysym" "" # SCORPIUS
+0x2650 "\\sagittarius"            "wasysym" "" # SAGITTARIUS
+0x2651 "\\capricornus"            "wasysym" "" # CAPRICORN
+0x2652 "\\aquarius"               "wasysym" "" # AQUARIUS
+0x2653 "\\pisces"                 "wasysym" "" # PISCES
+0x2660 "\\ensuremath{\\spadesuit}" "" "" # BLACK SPADE SUIT
+0x2661 "\\ensuremath{\\heartsuit}" "" "" # WHITE HEART SUIT
+0x2662 "\\ensuremath{\\diamondsuit}" "" "" # WHITE DIAMOND SUIT
+0x2663 "\\ensuremath{\\clubsuit}" "" "" # BLACK CLUB SUIT
+0x2664 "\\ensuremath{\\varspadesuit}" "txfonts" "" # WHITE SPADE SUIT
+0x2665 "\\ensuremath{\\varheartsuit}" "txfonts" "" # BLACK HEART SUIT
+0x2666 "\\ensuremath{\\vardiamondsuit}" "txfonts" "" # BLACK DIAMOND SUIT
+0x2667 "\\ensuremath{\\varclubsuit}" "txfonts" "" # WHITE CLUB SUIT
+0x2669 "\\quarternote"            "wasysym" "" # QUARTER NOTE
+0x266a "\\textmusicalnote"        "textcomp" "" # EIGHTH NOTE
+0x266b "\\twonotes"               "wasysym" "" # BEAMED EIGHTH NOTES
+0x26a2 "\\FemaleFemale"           "marvosym" "" # DOUBLED FEMALE SIGN
+0x26a3 "\\MaleMale"               "marvosym" "" # DOUBLED MALE SIGN
+0x26a4 "\\FemaleMale"             "marvosym" "" # INTERLOCKED FEMALE AND MALE SIGN
+0x26a5 "\\Hermaphrodite"          "marvosym" "" # MALE AND FEMALE SIGN
+0x26ad "\\textmarried"            "textcomp" "" # MARRIAGE SYMBOL
+0x26ae "\\textdivorced"           "textcomp" "" # DIVORCE SYMBOL
+# dingbats
+0x2701 "\\ScissorRightBrokenBottom" "bbding" "" # UPPER BLADE SCISSORS
+0x2702 "\\ScissorRight"           "bbding" "" # BLACK SCISSORS
+0x2703 "\\ScissorRightBrokenTop"  "bbding" "" # LOWER BLADE SCISSORS
+0x2704 "\\ScissorHollowRight"     "bbding" "" # WHITE SCISSORS
+0x2709 "\\Letter"                 "marvosym" "" # ENVELOPE
+0x270d "\\HandPencilLeft"         "bbding" "" # WRITING HAND
+0x270e "\\PencilRightDown"        "bbding" "" # LOWER RIGHT PENCIL
+0x270f "\\PencilRight"            "bbding" "" # PENCIL
+0x2710 "\\PencilRightUp"          "bbding" "" # UPPER RIGHT PENCIL
+0x2711 "\\NibRight"               "bbding" "" # WHITE NIB
+0x2712 "\\NibSolidRight"          "bbding" "" # BLACK NIB
+0x2713 "\\Checkmark"              "bbding" "" # CHECK MARK
+0x2714 "\\CheckmarkBold"          "bbding" "" # HEAVY CHECK MARK
+0x2715 "\\XSolid"                 "bbding" "" # MULTIPLICATION X
+0x2716 "\\XSolidBold"             "bbding" "" # HEAVY MULTIPLICATION X
+0x2717 "\\XSolidBrush"            "bbding" "" # BALLOT X
+0x2719 "\\PlusOutline"            "bbding" "" # OUTLINED GREEK CROSS
+0x271a "\\Plus"                   "bbding" "" # HEAVY GREEK CROSS
+0x271b "\\PlusThinCenterOpen"     "bbding" "" # OPEN CENTRE CROSS
+0x271c "\\PlusCenterOpen"         "bbding" "" # HEAVY OPEN CENTRE CROSS
+0x271d "\\Cross"                  "bbding" "" # LATIN CROSS
+0x271e "\\CrossOpenShadow"        "bbding" "" # SHADOWED WHITE LATIN CROSS
+0x271f "\\CrossOutline"           "bbding" "" # OUTLINED LATIN CROSS
+0x2720 "\\CrossMaltese"           "bbding" "" # MALTESE CROSS
+0x2721 "\\DavidStar"              "bbding" "" # STAR OF DAVID
+0x2722 "\\FourAsterisk"           "bbding" "" # too lazy to add the following unicode names
+0x2723 "\\JackStar"               "bbding" "" # 
+0x2724 "\\JackStarBold"           "bbding" "" # 
+#0x2725 ""                         "" "" # 
+0x2726 "\\FourStar"               "bbding" "" # 
+0x2727 "\\FourStarOpen"           "bbding" "" # 
+#0x2728 ""                         "" "" # 
+#0x2729 ""                         "" "" # 
+0x272a "\\FiveStarOpenCircled"    "bbding" "" # 
+0x272b "\\FiveStarCenterOpen"     "bbding" "" # 
+0x272c "\\FiveStarOpenDotted"     "bbding" "" # 
+0x272d "\\FiveStarOutline"        "bbding" "" # 
+0x272e "\\FiveStarOutlineHeavy"   "bbding" "" # 
+0x272f "\\FiveStarConvex"         "bbding" "" # 
+0x2730 "\\FiveStarShadow"         "bbding" "" # 
+0x2731 "\\AsteriskBold"           "bbding" "" # 
+0x2732 "\\AsteriskCenterOpen"     "bbding" "" # 
+#0x2733 ""                         "" "" # 
+0x2734 "\\EightStarTaper"         "bbding" "" # 
+0x2735 "\\EightStarConvex"        "bbding" "" # 
+0x2736 "\\SixStar"                "bbding" "" # 
+0x2737 "\\EightStar"              "bbding" "" # 
+0x2738 "\\EightStarBold"          "bbding" "" # 
+0x2739 "\\TwelweStar"             "bbding" "" # 
+0x273a "\\SixteenStarLight"       "bbding" "" # 
+0x273b "\\SixFlowerPetalRemoved"  "bbding" "" # 
+0x273c "\\SixFlowerOpenCenter"    "bbding" "" #
+0x273d "\\Asterisk"               "bbding" "" # 
+0x273e "\\SixFlowerAlternate"     "bbding" "" # 
+0x273f "\\FiveFlowerPetal"        "bbding" "" # 
+0x2740 "\\FiveFlowerOpen"         "bbding" "" # 
+0x2741 "\\EightFlowerPetal"       "bbding" "" # 
+#0x2742 ""                         "" "" #  
+0x2743 "\\SixFlowerAltPetal"      "bbding" "" # 
+0x2744 "\\SnowflakeChevron"       "bbding" "" # 
+0x2745 "\\Snowflake"              "bbding" "" # 
+0x2746 "\\SnowflakeChevronBold"   "bbding" "" # 
+0x2747 "\\Sparkle"                "bbding" "" # 
+0x2748 "\\SparkleBold"            "bbding" "" # 
+0x2749 "\\AsteriskRoundedEnds"    "bbding" "" # 
+0x274a "\\EightFlowerPetalRemoved" "bbding" "" # 
+0x274b "\\EightAsterisk"          "bbding" "" # 
+0x2776 "\\ding{182}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED DIGIT ONE
+0x2777 "\\ding{183}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED DIGIT TWO
+0x2778 "\\ding{184}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED DIGIT THREE
+0x2779 "\\ding{185}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED DIGIT FOUR
+0x277a "\\ding{186}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED DIGIT FIVE
+0x277b "\\ding{187}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED DIGIT SIX
+0x277c "\\ding{188}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED DIGIT SEVEN
+0x277d "\\ding{189}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED DIGIT EIGHT
+0x277e "\\ding{190}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED DIGIT NINE
+0x277f "\\ding{191}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED NUMBER TEN
+0x2780 "\\ding{192}"              "pifont" "" # DINGBAT CIRCLED SANS-SERIF DIGIT ONE
+0x2781 "\\ding{193}"              "pifont" "" # DINGBAT CIRCLED SANS-SERIF DIGIT TWO
+0x2782 "\\ding{194}"              "pifont" "" # DINGBAT CIRCLED SANS-SERIF DIGIT THREE
+0x2783 "\\ding{195}"              "pifont" "" # DINGBAT CIRCLED SANS-SERIF DIGIT FOUR
+0x2784 "\\ding{196}"              "pifont" "" # DINGBAT CIRCLED SANS-SERIF DIGIT FIVE
+0x2785 "\\ding{197}"              "pifont" "" # DINGBAT CIRCLED SANS-SERIF DIGIT SIX
+0x2786 "\\ding{198}"              "pifont" "" # DINGBAT CIRCLED SANS-SERIF DIGIT SEVEN
+0x2787 "\\ding{199}"              "pifont" "" # DINGBAT CIRCLED SANS-SERIF DIGIT EIGHT
+0x2788 "\\ding{200}"              "pifont" "" # DINGBAT CIRCLED SANS-SERIF DIGIT NINE
+0x2789 "\\ding{201}"              "pifont" "" # DINGBAT CIRCLED SANS-SERIF NUMBER TEN
+0x278a "\\ding{202}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT ONE
+0x278b "\\ding{203}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT TWO
+0x278c "\\ding{204}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT THREE
+0x278d "\\ding{205}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT FOUR
+0x278e "\\ding{206}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT FIVE
+0x278f "\\ding{207}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT SIX
+0x2790 "\\ding{208}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT SEVEN
+0x2791 "\\ding{209}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT EIGHT
+0x2792 "\\ding{210}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT NINE
+0x2793 "\\ding{211}"              "pifont" "" # DINGBAT NEGATIVE CIRCLED SANS-SERIF NUMBER TEN
+# miscellaneous mathematical symbols-A
+0x27e8 "\\textlangle"             "textcomp" "" # MATHEMATICAL LEFT ANGLE BRACKET
+0x27e9 "\\textrangle"             "textcomp" "" # MATHEMATICAL RIGHT ANGLE BRACKET
+