2002-08-04 23:11:50 +00:00
|
|
|
/**
|
|
|
|
* \file ispell.C
|
|
|
|
* Copyright 2002 the LyX Team
|
|
|
|
* Read the file COPYING
|
2001-07-13 11:50:39 +00:00
|
|
|
*
|
2002-08-04 23:11:50 +00:00
|
|
|
* \author unknown
|
|
|
|
* \author John Levon <levon@movementarian.org>
|
2001-07-13 11:50:39 +00:00
|
|
|
*/
|
|
|
|
|
|
|
|
#include <config.h>
|
|
|
|
|
|
|
|
#ifdef __GNUG__
|
|
|
|
#pragma implementation
|
|
|
|
#endif
|
|
|
|
|
2002-02-28 14:06:24 +00:00
|
|
|
#include <sys/types.h>
|
|
|
|
#include <sys/wait.h>
|
2001-07-13 11:50:39 +00:00
|
|
|
#include <unistd.h>
|
|
|
|
#include <fcntl.h>
|
2002-06-10 21:04:06 +00:00
|
|
|
#include <cstdio>
|
2001-07-13 11:50:39 +00:00
|
|
|
|
2002-08-04 23:11:50 +00:00
|
|
|
// FIXME: do we need any of this horrible gook ?
|
2001-07-16 10:03:38 +00:00
|
|
|
#if TIME_WITH_SYS_TIME
|
|
|
|
# include <sys/time.h>
|
|
|
|
# include <ctime>
|
|
|
|
#else
|
|
|
|
# if HAVE_SYS_TIME_H
|
|
|
|
# include <sys/time.h>
|
|
|
|
# else
|
|
|
|
# include <ctime>
|
|
|
|
# endif
|
|
|
|
#endif
|
|
|
|
|
2001-07-13 11:50:39 +00:00
|
|
|
#ifdef HAVE_SYS_SELECT_H
|
|
|
|
# ifdef HAVE_STRINGS_H
|
|
|
|
// <strings.h> is needed at least on AIX because FD_ZERO uses bzero().
|
|
|
|
// BUT we cannot include both string.h and strings.h on Irix 6.5 :(
|
|
|
|
# ifdef _AIX
|
|
|
|
# include <strings.h>
|
|
|
|
# endif
|
|
|
|
# endif
|
|
|
|
#include <sys/select.h>
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#include "LString.h"
|
|
|
|
#include "support/lstrings.h"
|
2001-07-16 10:03:38 +00:00
|
|
|
#include "lyxrc.h"
|
2001-11-26 18:03:23 +00:00
|
|
|
#include "language.h"
|
2001-07-16 10:03:38 +00:00
|
|
|
#include "debug.h"
|
|
|
|
#include "encoding.h"
|
2002-08-04 23:11:50 +00:00
|
|
|
#include "ispell.h"
|
2001-07-16 10:03:38 +00:00
|
|
|
|
2002-06-10 07:57:39 +00:00
|
|
|
#ifndef CXX_GLOBAL_CSTD
|
|
|
|
using std::strcpy;
|
|
|
|
using std::strlen;
|
|
|
|
using std::strpbrk;
|
|
|
|
using std::strstr;
|
|
|
|
#endif
|
|
|
|
|
2001-07-16 10:03:38 +00:00
|
|
|
using std::endl;
|
|
|
|
|
|
|
|
namespace {
|
2002-03-21 17:27:08 +00:00
|
|
|
/// pid for the `ispell' process.
|
|
|
|
pid_t isp_pid = -1;
|
2001-07-16 10:03:38 +00:00
|
|
|
}
|
|
|
|
|
2001-07-13 11:50:39 +00:00
|
|
|
|
|
|
|
ISpell::ISpell(BufferParams const & params, string const & lang)
|
2002-08-04 23:11:50 +00:00
|
|
|
: str(0)
|
2001-07-13 11:50:39 +00:00
|
|
|
{
|
|
|
|
static char o_buf[BUFSIZ]; // jc: it could be smaller
|
2001-10-12 14:05:47 +00:00
|
|
|
int pipein[2];
|
|
|
|
int pipeout[2];
|
2001-07-13 11:50:39 +00:00
|
|
|
char * argv[14];
|
|
|
|
int argc;
|
|
|
|
|
|
|
|
isp_pid = -1;
|
|
|
|
|
|
|
|
if (pipe(pipein) == -1 || pipe(pipeout) == -1) {
|
|
|
|
lyxerr << "LyX: Can't create pipe for spellchecker!" << endl;
|
|
|
|
goto END;
|
|
|
|
}
|
|
|
|
|
|
|
|
if ((out = fdopen(pipein[1], "w")) == 0) {
|
|
|
|
lyxerr << "LyX: Can't create stream for pipe for spellchecker!"
|
|
|
|
<< endl;
|
|
|
|
goto END;
|
|
|
|
}
|
|
|
|
|
|
|
|
if ((in = fdopen(pipeout[0], "r")) == 0) {
|
|
|
|
lyxerr <<"LyX: Can't create stream for pipe for spellchecker!"
|
|
|
|
<< endl;
|
|
|
|
goto END;
|
|
|
|
}
|
|
|
|
|
|
|
|
setvbuf(out, o_buf, _IOLBF, BUFSIZ);
|
|
|
|
|
|
|
|
isp_fd = pipeout[0];
|
|
|
|
|
|
|
|
isp_pid = fork();
|
|
|
|
|
|
|
|
if (isp_pid == -1) {
|
|
|
|
lyxerr << "LyX: Can't create child process for spellchecker!"
|
|
|
|
<< endl;
|
|
|
|
goto END;
|
|
|
|
}
|
2002-03-21 17:27:08 +00:00
|
|
|
|
|
|
|
if (isp_pid == 0) {
|
2001-07-13 11:50:39 +00:00
|
|
|
/* child process */
|
|
|
|
dup2(pipein[0], STDIN_FILENO);
|
|
|
|
dup2(pipeout[1], STDOUT_FILENO);
|
|
|
|
::close(pipein[0]);
|
|
|
|
::close(pipein[1]);
|
|
|
|
::close(pipeout[0]);
|
|
|
|
::close(pipeout[1]);
|
|
|
|
|
|
|
|
argc = 0;
|
|
|
|
char * tmp = new char[lyxrc.isp_command.length() + 1];
|
|
|
|
lyxrc.isp_command.copy(tmp, lyxrc.isp_command.length());
|
|
|
|
tmp[lyxrc.isp_command.length()] = '\0';
|
|
|
|
argv[argc++] = tmp;
|
|
|
|
tmp = new char[3];
|
|
|
|
string("-a").copy(tmp, 2); tmp[2] = '\0'; // pipe mode
|
|
|
|
argv[argc++] = tmp;
|
|
|
|
|
|
|
|
if (lang != "default") {
|
|
|
|
tmp = new char[3];
|
|
|
|
string("-d").copy(tmp, 2); tmp[2] = '\0'; // Dictionary file
|
|
|
|
argv[argc++] = tmp;
|
|
|
|
tmp = new char[lang.length() + 1];
|
|
|
|
lang.copy(tmp, lang.length()); tmp[lang.length()] = '\0';
|
|
|
|
argv[argc++] = tmp;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (lyxrc.isp_accept_compound) {
|
|
|
|
// Consider run-together words as legal compounds
|
|
|
|
tmp = new char[3];
|
|
|
|
string("-C").copy(tmp, 2); tmp[2] = '\0';
|
|
|
|
argv[argc++] = tmp;
|
|
|
|
} else {
|
|
|
|
// Report run-together words with
|
|
|
|
// missing blanks as errors
|
2002-03-21 17:27:08 +00:00
|
|
|
tmp = new char[3];
|
2001-07-13 11:50:39 +00:00
|
|
|
string("-B").copy(tmp, 2); tmp[2] = '\0';
|
2002-03-21 17:27:08 +00:00
|
|
|
argv[argc++] = tmp;
|
2001-07-13 11:50:39 +00:00
|
|
|
}
|
|
|
|
if (lyxrc.isp_use_esc_chars) {
|
|
|
|
// Specify additional characters that
|
|
|
|
// can be part of a word
|
|
|
|
tmp = new char[3];
|
|
|
|
string("-w").copy(tmp, 2); tmp[2] = '\0';
|
2002-03-21 17:27:08 +00:00
|
|
|
argv[argc++] = tmp;
|
2001-07-13 11:50:39 +00:00
|
|
|
// Put the escape chars in ""s
|
|
|
|
string tms = "\"" + lyxrc.isp_esc_chars + "\"";
|
|
|
|
tmp = new char[tms.length() + 1];
|
|
|
|
tms.copy(tmp, tms.length()); tmp[tms.length()] = '\0';
|
|
|
|
argv[argc++] = tmp;
|
|
|
|
}
|
|
|
|
if (lyxrc.isp_use_pers_dict) {
|
|
|
|
// Specify an alternate personal dictionary
|
|
|
|
tmp = new char[3];
|
|
|
|
string("-p").copy(tmp, 2);
|
|
|
|
tmp[2]= '\0';
|
|
|
|
argv[argc++] = tmp;
|
|
|
|
tmp = new char[lyxrc.isp_pers_dict.length() + 1];
|
|
|
|
lyxrc.isp_pers_dict.copy(tmp, lyxrc.isp_pers_dict.length());
|
|
|
|
tmp[lyxrc.isp_pers_dict.length()] = '\0';
|
|
|
|
argv[argc++] = tmp;
|
|
|
|
}
|
|
|
|
if (lyxrc.isp_use_input_encoding &&
|
|
|
|
params.inputenc != "default") {
|
|
|
|
string enc = (params.inputenc == "auto")
|
|
|
|
? params.language->encoding()->LatexName()
|
|
|
|
: params.inputenc;
|
|
|
|
string::size_type n = enc.length();
|
|
|
|
tmp = new char[3];
|
2001-10-12 14:05:47 +00:00
|
|
|
string("-T").copy(tmp, 2);
|
|
|
|
tmp[2] = '\0';
|
2001-07-13 11:50:39 +00:00
|
|
|
argv[argc++] = tmp; // Input encoding
|
|
|
|
tmp = new char[n + 1];
|
|
|
|
enc.copy(tmp, n);
|
|
|
|
tmp[n] = '\0';
|
|
|
|
argv[argc++] = tmp;
|
|
|
|
}
|
|
|
|
|
|
|
|
argv[argc++] = 0;
|
|
|
|
|
|
|
|
execvp(argv[0], const_cast<char * const *>(argv));
|
|
|
|
|
|
|
|
// free the memory used by string::copy in the
|
|
|
|
// setup of argv
|
2001-10-12 14:05:47 +00:00
|
|
|
for (int i = 0; i < argc - 1; ++i)
|
2001-07-13 11:50:39 +00:00
|
|
|
delete[] argv[i];
|
2002-03-21 17:27:08 +00:00
|
|
|
|
2001-07-13 11:50:39 +00:00
|
|
|
lyxerr << "LyX: Failed to start ispell!" << endl;
|
|
|
|
_exit(0);
|
|
|
|
}
|
|
|
|
{
|
|
|
|
/* Parent process: Read ispells identification message */
|
|
|
|
// Hmm...what are we using this id msg for? Nothing? (Lgb)
|
|
|
|
// Actually I used it to tell if it's truly Ispell or if it's
|
|
|
|
// aspell -- (kevinatk@home.com)
|
2002-08-04 23:11:50 +00:00
|
|
|
// But no code actually used the results for anything useful
|
|
|
|
// so I removed it again. Perhaps we can remove this code too.
|
|
|
|
// - jbl
|
2001-07-13 11:50:39 +00:00
|
|
|
char buf[2048];
|
|
|
|
fd_set infds;
|
|
|
|
struct timeval tv;
|
|
|
|
int retval = 0;
|
|
|
|
FD_ZERO(&infds);
|
|
|
|
FD_SET(pipeout[0], &infds);
|
|
|
|
tv.tv_sec = 15; // fifteen second timeout. Probably too much,
|
|
|
|
// but it can't really hurt.
|
|
|
|
tv.tv_usec = 0;
|
|
|
|
|
|
|
|
// Configure provides us with macros which are supposed to do
|
|
|
|
// the right typecast.
|
2002-03-21 17:27:08 +00:00
|
|
|
retval = select(SELECT_TYPE_ARG1 (pipeout[0]+1),
|
|
|
|
SELECT_TYPE_ARG234 (&infds),
|
|
|
|
0,
|
|
|
|
0,
|
2001-07-13 11:50:39 +00:00
|
|
|
SELECT_TYPE_ARG5 (&tv));
|
|
|
|
|
|
|
|
if (retval > 0) {
|
|
|
|
// Ok, do the reading. We don't have to FD_ISSET since
|
|
|
|
// there is only one fd in infds.
|
|
|
|
fgets(buf, 2048, in);
|
2002-03-21 17:27:08 +00:00
|
|
|
|
2001-07-13 11:50:39 +00:00
|
|
|
fputs("!\n", out); // Set terse mode (silently accept correct words)
|
|
|
|
|
|
|
|
} else if (retval == 0) {
|
|
|
|
// timeout. Give nice message to user.
|
|
|
|
lyxerr << "Ispell read timed out, what now?" << endl;
|
|
|
|
// This probably works but could need some thought
|
|
|
|
isp_pid = -1;
|
|
|
|
::close(pipeout[0]);
|
|
|
|
::close(pipeout[1]);
|
|
|
|
::close(pipein[0]);
|
|
|
|
::close(pipein[1]);
|
|
|
|
isp_fd = -1;
|
|
|
|
} else {
|
|
|
|
// Select returned error
|
|
|
|
lyxerr << "Select on ispell returned error, what now?" << endl;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
END:
|
|
|
|
if (isp_pid == -1) {
|
2002-03-21 17:27:08 +00:00
|
|
|
error_ =
|
2001-07-13 11:50:39 +00:00
|
|
|
"\n\n"
|
2001-11-28 16:09:25 +00:00
|
|
|
"The spellcheck-process has died for some reason.\n"
|
|
|
|
"*One* possible reason could be that you do not have\n"
|
|
|
|
"a dictionary file for the language of this document\n"
|
|
|
|
"installed.\n"
|
|
|
|
"Check your spellchecker or set another dictionary\n"
|
|
|
|
"in the Spellchecker Options menu.\n\n";
|
2001-07-13 11:50:39 +00:00
|
|
|
} else {
|
|
|
|
error_ = 0;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2002-08-04 23:11:50 +00:00
|
|
|
ISpell::~ISpell()
|
|
|
|
{
|
|
|
|
delete[] str;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2002-02-28 14:06:24 +00:00
|
|
|
/* FIXME: this is a minimalist solution until the above
|
|
|
|
* code is able to work with forkedcall.h. We only need
|
|
|
|
* to reap the zombies here.
|
|
|
|
*/
|
|
|
|
void reapSpellchecker(void)
|
|
|
|
{
|
2002-03-21 17:27:08 +00:00
|
|
|
if (isp_pid == -1)
|
2002-02-28 14:06:24 +00:00
|
|
|
return;
|
|
|
|
|
|
|
|
waitpid(isp_pid, 0, WNOHANG);
|
|
|
|
}
|
|
|
|
|
2002-03-21 17:27:08 +00:00
|
|
|
|
2002-08-04 23:11:50 +00:00
|
|
|
string const ISpell::nextMiss()
|
|
|
|
{
|
|
|
|
if (str == 0 || *(e+1) == '\0')
|
|
|
|
return "";
|
|
|
|
char * b = e + 2;
|
|
|
|
e = strpbrk(b, ",\n");
|
|
|
|
*e = '\0';
|
|
|
|
if (b)
|
|
|
|
return b;
|
|
|
|
return "";
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2001-07-13 11:50:39 +00:00
|
|
|
bool ISpell::alive()
|
|
|
|
{
|
|
|
|
return isp_pid != -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2002-03-21 17:27:08 +00:00
|
|
|
void ISpell::cleanUp()
|
2001-07-13 11:50:39 +00:00
|
|
|
{
|
|
|
|
::fclose(out);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2002-08-06 22:38:44 +00:00
|
|
|
enum ISpell::Result ISpell::check(WordLangTuple const & word)
|
2001-07-13 11:50:39 +00:00
|
|
|
{
|
2002-08-04 23:11:50 +00:00
|
|
|
// FIXME Please rewrite to use string.
|
2001-07-13 11:50:39 +00:00
|
|
|
|
2002-08-04 23:11:50 +00:00
|
|
|
Result res;
|
|
|
|
|
2002-08-06 22:38:44 +00:00
|
|
|
::fputs(word.word().c_str(), out);
|
2001-07-13 11:50:39 +00:00
|
|
|
::fputc('\n', out);
|
2002-03-21 17:27:08 +00:00
|
|
|
|
2001-07-13 11:50:39 +00:00
|
|
|
char buf[1024];
|
2002-03-21 17:27:08 +00:00
|
|
|
::fgets(buf, 1024, in);
|
|
|
|
|
2001-10-12 14:05:47 +00:00
|
|
|
// I think we have to check if ispell is still alive here because
|
2002-03-21 17:27:08 +00:00
|
|
|
// the signal-handler could have disabled blocking on the fd
|
2002-08-04 23:11:50 +00:00
|
|
|
if (!alive())
|
|
|
|
return UNKNOWN;
|
2001-07-13 11:50:39 +00:00
|
|
|
|
|
|
|
switch (*buf) {
|
2002-08-04 23:11:50 +00:00
|
|
|
case '*':
|
|
|
|
res = OK;
|
2001-07-13 11:50:39 +00:00
|
|
|
break;
|
2002-08-04 23:11:50 +00:00
|
|
|
case '+':
|
|
|
|
res = ROOT;
|
2001-07-13 11:50:39 +00:00
|
|
|
break;
|
2002-08-04 23:11:50 +00:00
|
|
|
case '-':
|
|
|
|
res = COMPOUNDWORD;
|
2001-07-13 11:50:39 +00:00
|
|
|
break;
|
2002-08-04 23:11:50 +00:00
|
|
|
case '\n':
|
|
|
|
res = IGNORE;
|
2001-07-13 11:50:39 +00:00
|
|
|
break;
|
|
|
|
case '#': // Not found, no near misses and guesses
|
2002-08-04 23:11:50 +00:00
|
|
|
res = UNKNOWN;
|
2001-07-13 11:50:39 +00:00
|
|
|
break;
|
|
|
|
case '?': // Not found, and no near misses, but guesses (guesses are ignored)
|
|
|
|
case '&': // Not found, but we have near misses
|
|
|
|
{
|
2002-08-04 23:11:50 +00:00
|
|
|
res = MISSED;
|
2001-07-13 11:50:39 +00:00
|
|
|
char * p = strpbrk(buf, ":");
|
|
|
|
str = new char[strlen(p) + 1];
|
|
|
|
e = str;
|
|
|
|
strcpy(str, p);
|
|
|
|
break;
|
|
|
|
}
|
2002-08-04 23:11:50 +00:00
|
|
|
default: // This shouldn't happen, but you know Murphy
|
|
|
|
res = UNKNOWN;
|
2001-07-13 11:50:39 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
*buf = 0;
|
2002-08-04 23:11:50 +00:00
|
|
|
if (res != IGNORE) {
|
|
|
|
/* wait for ispell to finish */
|
|
|
|
while (*buf!= '\n')
|
|
|
|
fgets(buf, 255, in);
|
2001-07-13 11:50:39 +00:00
|
|
|
}
|
2002-08-04 23:11:50 +00:00
|
|
|
return res;
|
2001-07-13 11:50:39 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
void ISpell::close()
|
|
|
|
{
|
2002-03-21 17:27:08 +00:00
|
|
|
// Note: If you decide to optimize this out when it is not
|
|
|
|
// needed please note that when Aspell is used this command
|
2001-10-12 14:05:47 +00:00
|
|
|
// is also needed to save the replacement dictionary.
|
|
|
|
// -- Kevin Atkinson (kevinatk@home.com)
|
2001-07-13 11:50:39 +00:00
|
|
|
|
|
|
|
fputs("#\n", out); // Save personal dictionary
|
|
|
|
|
|
|
|
fflush(out);
|
|
|
|
fclose(out);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2002-08-06 22:38:44 +00:00
|
|
|
void ISpell::insert(WordLangTuple const & word)
|
2001-07-13 11:50:39 +00:00
|
|
|
{
|
|
|
|
::fputc('*', out); // Insert word in personal dictionary
|
2002-08-06 22:38:44 +00:00
|
|
|
::fputs(word.word().c_str(), out);
|
2001-07-13 11:50:39 +00:00
|
|
|
::fputc('\n', out);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2002-08-06 22:38:44 +00:00
|
|
|
void ISpell::accept(WordLangTuple const & word)
|
2001-07-13 11:50:39 +00:00
|
|
|
{
|
|
|
|
::fputc('@', out); // Accept in this session
|
2002-08-06 22:38:44 +00:00
|
|
|
::fputs(word.word().c_str(), out);
|
2001-07-13 11:50:39 +00:00
|
|
|
::fputc('\n', out);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2002-08-04 23:11:50 +00:00
|
|
|
string const ISpell::error()
|
2001-07-13 11:50:39 +00:00
|
|
|
{
|
2002-08-04 23:11:50 +00:00
|
|
|
if (error_)
|
|
|
|
return error_;
|
|
|
|
return "";
|
2001-07-13 11:50:39 +00:00
|
|
|
}
|