2002-08-01 15:26:32 +00:00
|
|
|
# This file is part of lyx2lyx
|
|
|
|
# Copyright (C) 2002 Dekel Tsur <dekel@lyx.org>
|
|
|
|
#
|
|
|
|
# This program is free software; you can redistribute it and/or
|
|
|
|
# modify it under the terms of the GNU General Public License
|
|
|
|
# as published by the Free Software Foundation; either version 2
|
|
|
|
# of the License, or (at your option) any later version.
|
|
|
|
#
|
|
|
|
# This program is distributed in the hope that it will be useful,
|
|
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
# GNU General Public License for more details.
|
|
|
|
#
|
|
|
|
# You should have received a copy of the GNU General Public License
|
|
|
|
# along with this program; if not, write to the Free Software
|
|
|
|
# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
|
|
|
|
|
|
|
|
|
2002-08-02 19:25:14 +00:00
|
|
|
import sys,string,re
|
2002-08-01 15:26:32 +00:00
|
|
|
from parser_tools import *
|
|
|
|
|
|
|
|
def _float_inset(kind, wide):
    """Return the header lines of a non-collapsed Float inset.

    kind is the word written after "begin_inset Float" (for example
    "figure"); wide is the literal text written on the "wide" line.
    A fresh list is returned on every call.
    """
    return ["\\begin_inset Float " + kind,
            "placement htbp",
            "wide " + wide,
            "collapsed false"]


# Maps each old \begin_float type name to the header lines of the inset
# that replaces it.
floats = {
    "footnote": ["\\begin_inset Foot", "collapsed true"],
    "margin": ["\\begin_inset Marginal", "collapsed true"],
    "fig": _float_inset("figure", "false"),
    "tab": _float_inset("table", "false"),
    "alg": _float_inset("algorithm", "false"),
    "wide-fig": _float_inset("figure", "true"),
    "wide-tab": _float_inset("table", "true"),
}
|
|
|
|
|
2002-08-03 14:29:12 +00:00
|
|
|
# Font-attribute commands that remove_oldfloat looks for in the paragraph
# text preceding a float, and resets after the converted inset.
font_tokens = [
    "\\family",
    "\\series",
    "\\shape",
    "\\size",
    "\\emph",
    "\\bar",
    "\\noun",
    "\\color",
    "\\lang",
]
|
|
|
|
|
|
|
|
#
|
|
|
|
# Change \begin_float .. \end_float into \begin_inset Float .. \end_inset
|
|
|
|
#
|
|
|
|
|
2002-08-02 19:25:14 +00:00
|
|
|
def remove_oldfloat(lines, language):
    r"""Rewrite every \begin_float .. \end_float block as an inset, in place.

    lines    -- list of body lines; it is modified in place.
    language -- document language; written as "\lang <language> " after a
                converted float when \lang occurs between the start of the
                enclosing paragraph and the float.

    The second word of the \begin_float line selects the replacement header
    from ``floats``.  An unknown type is reported on stderr and converted
    as "fig".  Returns None.
    """
    i = 0
    while 1:
        i = find_token(lines, "\\begin_float", i)
        if i == -1:
            break
        j = find_token(lines, "\\end_float", i+1)
        if j == -1:
            # Without a closing \end_float the slice assignment below would
            # insert text without removing the \begin_float line, so the same
            # float would be found again on every iteration.  Report it and
            # leave this float untouched.
            sys.stderr.write("Error! Unterminated float\n")
            i = i+1
            continue

        floattype = lines[i].split()[1]
        if floattype not in floats:
            sys.stderr.write("Error! Unknown float type "+floattype+"\n")
            floattype = "fig"

        # skip \end_deeper tokens
        i2 = i+1
        while check_token(lines[i2], "\\end_deeper"):
            i2 = i2+1
        if i2 > i+1:
            # Re-emit the skipped \end_deeper lines in front of the first
            # \layout that follows the float.
            j2 = find_token(lines, "\\layout", j+1)
            lines[j2:j2] = ["\\end_deeper "]*(i2-(i+1))

        new = floats[floattype]+[""]
        new = new+lines[i2:j]+["\\end_inset ", ""]

        # After a float, all font attributes are reset.
        # We need to output '\foo default' for every attribute foo
        # whose value is not default before the float.
        # The check here is not accurate, but it doesn't matter
        # as extra '\foo default' commands are ignored.
        # In fact, it might be safer to output '\foo default' for all
        # font attributes.
        k = get_paragraph(lines, i)
        flag = 0
        for token in font_tokens:
            if find_token(lines, token, k, i) != -1:
                if not flag:
                    # This is not necessary, but we want the output to be
                    # as similar as possible to the lyx format
                    flag = 1
                    new.append("")
                if token == "\\lang":
                    new.append(token+" "+language+" ")
                else:
                    new.append(token+" default ")
        lines[i:j+1] = new

        i = i+1
|
|
|
|
|
|
|
|
def remove_oldminipage(lines):
    r"""Turn paragraphs flagged "\pextra_type 2" into Minipage insets, in place.

    lines -- list of body lines; it is modified in place.

    For each line found with "\pextra_type 2" the fourth word is used as the
    minipage position and the sixth as its width ("col%" is appended when
    the fifth word is \pextra_widthp).  The paragraph containing that line,
    and the following paragraphs that also carry a \pextra_type line, are
    wrapped in one "\begin_inset Minipage" .. "\end_inset" block.  A
    following paragraph with "\pextra_start_minipage 1" ends the current
    block and is converted as a separate minipage.  Returns None.
    """
    i = 0
    # Set when the previous minipage ended because the next paragraph starts
    # a new one; that next minipage then gets no "\layout Standard" line.
    flag = 0
    while 1:
        i = find_token(lines, "\\pextra_type 2", i)
        if i == -1:
            break
        hfill = 0
        line = lines[i].split()
        if line[4] == "\\pextra_hfill":
            hfill = 1
            line[4:6] = []
        if line[4] == "\\pextra_start_minipage":
            # We just ignore this
            line[4:6] = []

        position = line[3]
        width = line[5]
        if line[4] == "\\pextra_widthp":
            width = line[5]+"col%"

        start = ["\\begin_inset Minipage",
                 "position " + position,
                 "inner_position 0",
                 'height "0pt"',
                 'width "%s"' % width,
                 "collapsed false"
                 ]
        if flag:
            flag = 0
            if hfill:
                start = ["", "\\hfill", ""]+start
        else:
            start = ["\\layout Standard"] + start

        # The minipage contents start at the \layout line of the paragraph
        # that holds the \pextra_type line; that line itself is dropped.
        j = find_token_backwards(lines, "\\layout", i-1)
        j0 = j
        mid = lines[j:i]

        j = find_tokens(lines, ["\\layout", "\\end_float"], i+1)
        # j can be -1, but this is still ok
        mid = mid+lines[i+1:j]

        while 1:
            # collect more paragraphs to the minipage
            if j == -1 or not check_token(lines[j], "\\layout"):
                break
            i = find_tokens(lines, ["\\layout", "\\pextra_type"], j+1)
            if i == -1 or not check_token(lines[i], "\\pextra_type"):
                break
            line = lines[i].split()
            if line[4] == "\\pextra_hfill":
                line[4:6] = []
            if line[4] == "\\pextra_start_minipage" and line[5] == "1":
                flag = 1
                break
            j = find_token_backwards(lines, "\\layout", i-1)
            mid = mid+lines[j:i]
            j = find_tokens(lines, ["\\layout", "\\end_float"], i+1)
            mid = mid+lines[i+1:j]

        end = ["\\end_inset "]

        lines[j0:j] = start+mid+end
        i = i+1
|
|
|
|
|
2002-08-02 19:25:14 +00:00
|
|
|
def is_empty(lines):
    """Return true when no element of lines satisfies is_nonempty_line.

    lines -- a sequence of text lines.

    The filter result is materialised with list() before the comparison:
    where filter() returns an iterator, comparing that iterator with []
    is always false.
    """
    return list(filter(is_nonempty_line, lines)) == []
|
2002-08-02 19:25:14 +00:00
|
|
|
|
|
|
|
# Matches a line that starts with one of the listed font commands.
font_rexp = re.compile(r"\\(family|series|shape|size|emph|numeric|bar|noun)")

# Matches a line that starts an inset or contains \SpecialChar anywhere.
ert_rexp = re.compile(r"\\begin_inset|.*\\SpecialChar")

# Splits a line into the text before \SpecialChar (group 1) and the
# \SpecialChar command with the rest of the line (group 2).
spchar_rexp = re.compile(r"(.*)(\\SpecialChar.*)")

# Lines that open a collapsed ERT inset holding one Standard paragraph.
ert_begin = [
    "\\begin_inset ERT",
    "status Collapsed",
    "",
    "\\layout Standard",
]
|
2002-08-02 19:25:14 +00:00
|
|
|
|
|
|
|
def remove_oldert(lines):
    r"""Convert old-style ERT text into ERT insets, in place.

    lines -- list of body lines; it is modified in place.

    Old ERT starts at a "\latex latex" line or a "\layout LaTeX" line and
    runs up to the next "\latex default", "\layout", "\end_float" or
    "\the_end" line; insets in between are stepped over.  Within that range:

    * plain text is wrapped in ``ert_begin`` .. "\end_inset ";
    * nested insets and \SpecialChar commands are emitted outside the ERT
      insets;
    * font commands (``font_rexp``) are collected and emitted after all the
      converted text;
    * remaining "\latex" lines are dropped.

    Returns None.
    """
    i = 0
    while 1:
        i = find_tokens(lines, ["\\latex latex", "\\layout LaTeX"], i)
        if i == -1:
            break

        # Locate the end of the ERT range, stepping over whole insets.
        j = i+1
        while 1:
            j = find_tokens(lines, ["\\latex default", "\\begin_inset", "\\layout", "\\end_float", "\\the_end"],
                            j)
            if check_token(lines[j], "\\begin_inset"):
                j = find_end_of_inset(lines, j)
            else:
                break

        if check_token(lines[j], "\\layout"):
            # Keep \begin_deeper lines that precede the next paragraph
            # outside the converted range.
            while j-1 >= 0 and check_token(lines[j-1], "\\begin_deeper"):
                j = j-1

        # We need to remove insets, special chars & font commands from ERT text
        new = []
        new2 = []
        if check_token(lines[i], "\\layout LaTeX"):
            new = ["\\layout Standard", "", ""]
            # We have a problem with classes in which Standard is not the default layout!

        k = i+1
        while 1:
            # Find the next inset or \SpecialChar line within the range.
            k2 = find_re(lines, ert_rexp, k, j)
            inset = specialchar = 0
            if k2 == -1:
                k2 = j
            elif check_token(lines[k2], "\\begin_inset"):
                inset = 1
            else:
                specialchar = 1
                # Keep the text before \SpecialChar on this line as ERT text
                # and remember the command itself.
                mo = spchar_rexp.match(lines[k2])
                lines[k2] = mo.group(1)
                specialchar_str = mo.group(2)
                k2 = k2+1

            tmp = []
            for line in lines[k:k2]:
                if font_rexp.match(line):
                    if new2 == []:
                        # This is not necessary, but we want the output to be
                        # as similar as possible to the lyx format
                        new2 = [""]
                    new2.append(line)
                elif not check_token(line, "\\latex"):
                    tmp.append(line)

            if is_empty(tmp):
                # tmp has no non-empty line according to is_empty, but it may
                # still hold strings other than "".  Built as a list so the
                # comparison with [] is meaningful (a filter iterator never
                # equals []).
                if [x for x in tmp if x != ""] != []:
                    if new == []:
                        # This is not necessary, but we want the output to be
                        # as similar as possible to the lyx format
                        lines[i-1] = lines[i-1]+" "
                    else:
                        new = new+[" "]
            else:
                new = new+ert_begin+tmp+["\\end_inset ", ""]

            if inset:
                k3 = find_end_of_inset(lines, k2)
                new = new+[""]+lines[k2:k3+1]+[""] # Put an empty line after \end_inset
                k = k3+1
                # Skip the empty line after \end_inset
                if not is_nonempty_line(lines[k]):
                    k = k+1
                    new.append("")
            elif specialchar:
                if new == []:
                    # This is not necessary, but we want the output to be
                    # as similar as possible to the lyx format
                    lines[i-1] = lines[i-1]+specialchar_str
                    new = [""]
                else:
                    new = new+[specialchar_str, ""]
                k = k2
            else:
                break

        new = new+new2
        if not check_token(lines[j], "\\latex default"):
            # The terminating line is not part of the ERT; keep it.
            new = new+[""]+[lines[j]]
        lines[i:j+1] = new
        i = i+1
|
|
|
|
|
2002-08-12 21:48:47 +00:00
|
|
|
def remove_oldertinset(lines):
    r"""Replace every "\begin_inset ERT" inset by its contents, in place.

    lines -- list of body lines; it is modified in place.

    The kept contents run from the first \layout line after the inset start
    up to, but not including, the line index returned by find_end_of_inset.
    When that \layout line is identical to the line index returned by
    get_paragraph for the inset, it is dropped as well.  Returns None.
    """
    pos = 0
    while True:
        pos = find_token(lines, "\\begin_inset ERT", pos)
        if pos == -1:
            return
        inset_end = find_end_of_inset(lines, pos)
        body_start = find_token(lines, "\\layout", pos + 1)
        par_start = get_paragraph(lines, pos)
        if lines[body_start] == lines[par_start]:
            # same layout
            body_start += 1
        lines[pos:inset_end + 1] = lines[body_start:inset_end]
        pos += 1
|
|
|
|
|
2002-08-02 20:34:20 +00:00
|
|
|
def is_ert_paragraph(lines, i):
    r"""Tell whether the paragraph at line i holds nothing but an ERT inset.

    lines -- list of body lines.
    i     -- index of the paragraph's first line.

    Returns 0 when the first non-empty line after i does not start an ERT
    inset; otherwise returns the result of check_token for "\layout" on the
    first non-empty line after the end of that inset.
    """
    start = find_nonempty_line(lines, i + 1)
    if check_token(lines[start], "\\begin_inset ERT"):
        inset_end = find_end_of_inset(lines, start)
        following = find_nonempty_line(lines, inset_end + 1)
        return check_token(lines[following], "\\layout")
    return 0
|
|
|
|
|
|
|
|
def combine_ert(lines):
    r"""Merge runs of consecutive ERT-only paragraphs into one inset, in place.

    lines -- list of body lines; it is modified in place.

    Starting from the paragraph that holds each "\begin_inset ERT", the
    paragraphs accepted by is_ert_paragraph are walked and the lines from
    each inset's inner \layout up to its \end_inset are gathered.  When two
    or more paragraphs were gathered, the span from the first inset's inner
    \layout up to the last \end_inset visited is replaced by the gathered
    lines.  Returns None.
    """
    pos = 0
    while True:
        pos = find_token(lines, "\\begin_inset ERT", pos)
        if pos == -1:
            return
        par = find_token_backwards(lines, "\\layout", pos - 1)
        gathered = []
        n_pars = 0
        while is_ert_paragraph(lines, par):
            n_pars += 1
            inner = find_token(lines, "\\layout", par + 1)
            inset_end = find_token(lines, "\\end_inset", inner + 1)
            gathered.extend(lines[inner:inset_end])
            par = find_token(lines, "\\layout", inset_end + 1)
            if par == -1:
                break

        if n_pars > 1:
            first_inner = find_token(lines, "\\layout", pos + 1)
            lines[first_inner:inset_end] = gathered

        pos += 1
|
|
|
|
|
2002-08-02 19:25:14 +00:00
|
|
|
# Unit suffixes used by get_length: the integer in the second word of a
# length line is used as an index into this list.
oldunits = ["pt", "cm", "in", "text%", "col%"]
|
|
|
|
|
|
|
|
def get_length(lines, name, start, end):
    """Return the length stored on the line found for name, with its unit.

    lines      -- list of lines to search.
    name       -- token passed to find_token.
    start, end -- search bounds passed to find_token.

    Returns "" when find_token reports -1.  Otherwise the line is split on
    whitespace and the result is the third word followed by the entry of
    ``oldunits`` indexed by the integer in the second word.
    """
    i = find_token(lines, name, start, end)
    if i == -1:
        return ""
    x = lines[i].split()
    # NOTE(review): a unit index outside oldunits raises IndexError here.
    return x[2]+oldunits[int(x[1])]
|
|
|
|
|
|
|
|
def append(x, token, value):
    """Append a tab-indented "token value" line to x unless value is "".

    x     -- list that receives the new line; modified in place.
    token -- parameter name.
    value -- parameter value; nothing is appended when it equals "".
    """
    if value == "":
        return
    x.append("".join(("\t", token, " ", value)))
|
|
|
|
|
|
|
|
def remove_figinset(lines):
    r"""Replace every "\begin_inset Figure" inset by a Graphics inset, in place.

    lines -- list of body lines; it is modified in place.

    The fourth and fifth words of the inset's first line become lyxwidth and
    lyxheight (in pt).  file, width, height, angle, flags, subcaption and
    subfigure are read from the inset body and written as the matching
    Graphics parameters; parameters whose value is "" are omitted.
    Returns None.
    """
    i = 0
    while 1:
        i = find_token(lines, "\\begin_inset Figure", i)
        if i == -1:
            break
        j = find_end_of_inset(lines, i)

        header = lines[i].split()
        if len(header) > 4:
            lyxwidth = header[3]+"pt"
            lyxheight = header[4]+"pt"
        else:
            # Header without both size fields: leave them out rather than
            # fail with IndexError (append() skips empty values).
            lyxwidth = lyxheight = ""

        filename = get_value(lines, "file", i+1, j)

        width = get_length(lines, "width", i+1, j)
        # what does width=5 mean ?
        height = get_length(lines, "height", i+1, j)
        rotateAngle = get_value(lines, "angle", i+1, j)
        if width == "" and height == "":
            size_type = "0"
        else:
            size_type = "1"

        flags = get_value(lines, "flags", i+1, j)
        if flags == "":
            # get_value appears to return "" for a missing entry (the other
            # call sites compare against ""); int("") would raise, so treat
            # missing flags as 0, which selects "color" below.
            x = 0
        else:
            x = int(flags)%4
        if x == 1:
            display = "monochrome"
        elif x == 2:
            display = "gray"
        else:
            display = "color"

        subcaptionText = get_value(lines, "subcaption", i+1, j)
        if subcaptionText != "":
            subcaptionText = '"'+subcaptionText+'"'
        k = find_token(lines, "subfigure", i+1, j)
        if k == -1:
            subcaption = 0
        else:
            subcaption = 1

        new = ["\\begin_inset Graphics FormatVersion 1"]
        append(new, "filename", filename)
        append(new, "display", display)
        if subcaption:
            new.append("\tsubcaption")
        append(new, "subcaptionText", subcaptionText)
        append(new, "size_type", size_type)
        append(new, "width", width)
        append(new, "height", height)
        if rotateAngle != "":
            new.append("\trotate")
            append(new, "rotateAngle", rotateAngle)
        new.append("\trotateOrigin center")
        new.append("\tlyxsize_type 1")
        append(new, "lyxwidth", lyxwidth)
        append(new, "lyxheight", lyxheight)
        new = new + ["\\end_inset"]
        # The replacement no longer starts with "\begin_inset Figure", so the
        # next search from the same index moves on to the following inset.
        lines[i:j+1] = new
|
|
|
|
|
|
|
|
def change_preamble(lines):
    r"""Insert the natbib settings after the \use_amsmath line, in place.

    lines -- list of header lines; it is modified in place.

    Adds "\use_natbib 0" and "\use_numerical_citations 0" directly after the
    line found for "\use_amsmath".  Nothing is changed when find_token
    reports -1.  Returns None.
    """
    i = find_token(lines, "\\use_amsmath", 0)
    if i == -1:
        return
    # Both backslashes are escaped: an unescaped "\u" starts a Unicode escape
    # in Python 3 string literals and is rejected when truncated.
    lines[i+1:i+1] = ["\\use_natbib 0",
                      "\\use_numerical_citations 0"]
|
|
|
|
|
|
|
|
def convert(header, body):
    r"""Run all conversion steps of this module on a document, in place.

    header -- list of header lines; the \language value is read from it and
              it is updated by change_preamble.
    body   -- list of body lines; updated by each body conversion in turn.

    "english" is used when the \language value read from the header is "".
    Returns None.
    """
    language = get_value(header, "\\language", 0)
    if language == "":
        language = "english"

    change_preamble(header)

    # Body conversions, applied in this fixed order.
    for step in (remove_oldertinset, remove_oldert, combine_ert,
                 remove_oldminipage):
        step(body)
    remove_oldfloat(body, language)
    remove_figinset(body)
|
2002-08-01 15:26:32 +00:00
|
|
|
|
|
|
|
# Executing this module directly performs no work.
if __name__ == "__main__":
    pass
|