mirror of
https://git.lyx.org/repos/lyx.git
synced 2025-01-04 00:36:17 +00:00
543 lines
16 KiB
C++
543 lines
16 KiB
C++
// -*- C++ -*-
|
|
/**
|
|
* \file Paragraph.h
|
|
* This file is part of LyX, the document processor.
|
|
* Licence details can be found in the file COPYING.
|
|
*
|
|
* \author Asger Alstrup
|
|
* \author Lars Gullik Bjønnes
|
|
* \author John Levon
|
|
* \author André Pönitz
|
|
* \author Jürgen Vigna
|
|
*
|
|
* Full author contact details are available in file CREDITS.
|
|
*/
|
|
|
|
#ifndef PARAGRAPH_H
|
|
#define PARAGRAPH_H
|
|
|
|
#include "LayoutEnums.h"
|
|
#include "SpellChecker.h"
|
|
|
|
#include "support/strfwd.h"
|
|
#include "support/types.h"
|
|
|
|
#include <set>
|
|
#include <vector>
|
|
|
|
namespace lyx {
|
|
|
|
class AuthorList;
|
|
class Buffer;
|
|
class BufferParams;
|
|
class Change;
|
|
class DocIterator;
|
|
class docstring_list;
|
|
class DocumentClass;
|
|
class Inset;
|
|
class LaTeXFeatures;
|
|
class InsetList;
|
|
class Language;
|
|
class Layout;
|
|
class Font;
|
|
class OutputParams;
|
|
class ParagraphParameters;
|
|
class TocBackend;
|
|
class WordLangTuple;
|
|
class XMLStream;
|
|
class otexstream;
|
|
|
|
/// Inset identifier (above 0x10ffff, for ucs-4)
|
|
char_type const META_INSET = 0x200001;
|
|
|
|
class FontSpan {
|
|
public:
|
|
/// Invalid font span containing no character
|
|
FontSpan() : first(0), last(-1) {}
|
|
/// Span including first and last
|
|
FontSpan(pos_type f, pos_type l) : first(f), last(l) {}
|
|
|
|
public:
|
|
/// Range including first and last.
|
|
pos_type first, last;
|
|
|
|
inline bool operator<(FontSpan const & s) const
|
|
{
|
|
return first < s.first;
|
|
}
|
|
|
|
inline bool operator==(FontSpan const & s) const
|
|
{
|
|
return first == s.first && last == s.last;
|
|
}
|
|
|
|
inline bool contains(pos_type p) const
|
|
{
|
|
return first <= p && p <= last;
|
|
}
|
|
|
|
inline size_t size() const
|
|
{
|
|
return empty() ? 0 : last - first;
|
|
}
|
|
|
|
|
|
inline FontSpan intersect(FontSpan const & f) const
|
|
{
|
|
FontSpan result = FontSpan();
|
|
if (contains(f.first))
|
|
result.first = f.first;
|
|
else if (f.contains(first))
|
|
result.first = first;
|
|
else
|
|
return result;
|
|
if (contains(f.last))
|
|
result.last = f.last;
|
|
else if (f.contains(last))
|
|
result.last = last;
|
|
return result;
|
|
}
|
|
|
|
inline bool empty() const
|
|
{
|
|
return first > last;
|
|
}
|
|
};
|
|
|
|
///
|
|
enum TextCase {
|
|
///
|
|
text_lowercase = 0,
|
|
///
|
|
text_capitalization = 1,
|
|
///
|
|
text_uppercase = 2
|
|
};
|
|
|
|
|
|
///
|
|
enum AsStringParameter
|
|
{
|
|
AS_STR_NONE = 0, ///< No option, only printable characters.
|
|
AS_STR_LABEL = 1, ///< Prefix with paragraph label.
|
|
AS_STR_INSETS = 2, ///< Go into insets.
|
|
AS_STR_NEWLINES = 4, ///< Get also newline characters.
|
|
AS_STR_SKIPDELETE = 8, ///< Skip deleted text in change tracking.
|
|
AS_STR_PLAINTEXT = 16, ///< Don't export formatting when descending into insets.
|
|
AS_STR_MATHED = 32 ///< Use a format suitable for mathed (eg. for InsetRef).
|
|
};
|
|
|
|
|
|
/// A Paragraph holds all text, attributes and insets in a text paragraph
|
|
class Paragraph
|
|
{
|
|
public:
|
|
///
|
|
Paragraph();
|
|
/// Copy constructor.
|
|
Paragraph(Paragraph const &);
|
|
/// Partial copy constructor.
|
|
/// Copy the Paragraph contents from \p beg to \p end (without end).
|
|
Paragraph(Paragraph const & par, pos_type beg, pos_type end);
|
|
///
|
|
Paragraph & operator=(Paragraph const &);
|
|
///
|
|
~Paragraph();
|
|
///
|
|
int id() const;
|
|
///
|
|
void setId(int id);
|
|
|
|
///
|
|
void addChangesToToc(DocIterator const & cdit, Buffer const & buf,
|
|
bool output_active, TocBackend & backend) const;
|
|
///
|
|
Language const * getParLanguage(BufferParams const &) const;
|
|
///
|
|
bool isRTL(BufferParams const &) const;
|
|
///
|
|
void changeLanguage(BufferParams const & bparams,
|
|
Language const * from, Language const * to);
|
|
///
|
|
bool isMultiLingual(BufferParams const &) const;
|
|
///
|
|
void getLanguages(std::set<Language const *> &) const;
|
|
|
|
/// Convert the paragraph to a string.
|
|
/// \param AsStringParameter options. This can contain any combination of
|
|
/// asStringParameter values. Valid examples:
|
|
/// asString(AS_STR_LABEL)
|
|
/// asString(AS_STR_LABEL | AS_STR_INSETS)
|
|
/// asString(AS_STR_INSETS)
|
|
docstring asString(int options = AS_STR_NONE) const;
|
|
|
|
/// Convert the paragraph to a string.
|
|
/// \note If options includes AS_STR_PLAINTEXT, then runparams must be != 0
|
|
docstring asString(pos_type beg, pos_type end,
|
|
int options = AS_STR_NONE,
|
|
const OutputParams *runparams = 0) const;
|
|
///
|
|
void forOutliner(docstring &, size_t maxlen, bool shorten = true,
|
|
bool label = true) const;
|
|
|
|
///
|
|
void write(std::ostream &, BufferParams const &,
|
|
depth_type & depth) const;
|
|
///
|
|
void validate(LaTeXFeatures &) const;
|
|
|
|
/// \param force means: output even if layout.inpreamble is true.
|
|
void latex(BufferParams const &, Font const & outerfont, otexstream &,
|
|
OutputParams const &, int start_pos = 0, int end_pos = -1,
|
|
bool force = false) const;
|
|
|
|
/// Can we drop the standard paragraph wrapper?
|
|
bool emptyTag() const;
|
|
|
|
/// Get the id of the paragraph, useful for DocBook
|
|
std::string getID(Buffer const & buf, OutputParams const & runparams) const;
|
|
|
|
/// Output the first word of a paragraph, return the position where it left.
|
|
pos_type firstWordDocBook(XMLStream & xs, OutputParams const & runparams) const;
|
|
|
|
/// Output the first word of a paragraph, return the position where it left.
|
|
pos_type firstWordLyXHTML(XMLStream & xs, OutputParams const & runparams) const;
|
|
|
|
/// Outputs to stream the DocBook representation, one element per paragraph.
|
|
std::tuple<std::vector<docstring>, std::vector<docstring>, std::vector<docstring>>
|
|
simpleDocBookOnePar(Buffer const & buf,
|
|
OutputParams const & runparams,
|
|
Font const & outerfont,
|
|
pos_type initial = 0,
|
|
bool is_last_par = false,
|
|
bool ignore_fonts = false) const;
|
|
|
|
/// \return any material that has had to be deferred until after the
|
|
/// paragraph has closed.
|
|
docstring simpleLyXHTMLOnePar(Buffer const & buf,
|
|
XMLStream & xs,
|
|
OutputParams const & runparams,
|
|
Font const & outerfont,
|
|
bool start_paragraph = true,
|
|
bool close_paragraph = true,
|
|
pos_type initial = 0) const;
|
|
|
|
///
|
|
bool hasSameLayout(Paragraph const & par) const;
|
|
|
|
///
|
|
void makeSameLayout(Paragraph const & par);
|
|
|
|
///
|
|
void setInsetOwner(Inset const * inset);
|
|
///
|
|
Inset const & inInset() const;
|
|
///
|
|
bool allowParagraphCustomization() const;
|
|
///
|
|
bool usePlainLayout() const;
|
|
///
|
|
bool isPassThru() const;
|
|
///
|
|
bool parbreakIsNewline() const;
|
|
///
|
|
bool isPartOfTextSequence() const;
|
|
///
|
|
pos_type size() const;
|
|
///
|
|
bool empty() const;
|
|
|
|
///
|
|
Layout const & layout() const;
|
|
/// Do not pass a temporary to this!
|
|
void setLayout(Layout const & layout);
|
|
///
|
|
void setPlainOrDefaultLayout(DocumentClass const & tc);
|
|
///
|
|
void setDefaultLayout(DocumentClass const & tc);
|
|
///
|
|
void setPlainLayout(DocumentClass const & tc);
|
|
|
|
/// This is the item depth, only used by enumerate and itemize
|
|
signed char itemdepth;
|
|
|
|
/// look up change at given pos
|
|
Change const & lookupChange(pos_type pos) const;
|
|
|
|
/// is there a change within the given range (does not
|
|
/// check contained paragraphs)
|
|
bool isChanged(pos_type start, pos_type end) const;
|
|
/// Are there insets containing changes in the range?
|
|
bool hasChangedInsets(pos_type start, pos_type end) const;
|
|
/// is there an unchanged char at the given pos ?
|
|
bool isChanged(pos_type pos) const;
|
|
/// is there a change in the paragraph ?
|
|
bool isChanged() const;
|
|
|
|
/// is there an insertion at the given pos ?
|
|
bool isInserted(pos_type pos) const;
|
|
/// is there a deletion at the given pos ?
|
|
bool isDeleted(pos_type pos) const;
|
|
/// is the whole paragraph deleted ?
|
|
bool isDeleted(pos_type start, pos_type end) const;
|
|
|
|
/// will the paragraph be physically merged with the next
|
|
/// one if the imaginary end-of-par character is logically deleted?
|
|
bool isMergedOnEndOfParDeletion(bool trackChanges) const;
|
|
/// Return Change form of paragraph break
|
|
Change parEndChange() const;
|
|
|
|
/// set change for the entire par
|
|
void setChange(Change const & change);
|
|
|
|
/// set change at given pos
|
|
void setChange(pos_type pos, Change const & change);
|
|
|
|
/// accept changes within the given range
|
|
void acceptChanges(pos_type start, pos_type end);
|
|
|
|
/// reject changes within the given range
|
|
void rejectChanges(pos_type start, pos_type end);
|
|
|
|
/// Paragraphs can contain "manual labels", for example, Description
|
|
/// environment. The text for this user-editable label is stored in
|
|
/// the paragraph alongside the text of the rest of the paragraph
|
|
/// (the body). This function returns the starting position of the
|
|
/// body of the text in the paragraph.
|
|
pos_type beginOfBody() const;
|
|
/// recompute this value
|
|
void setBeginOfBody();
|
|
|
|
///
|
|
docstring expandLabel(Layout const &, BufferParams const &) const;
|
|
///
|
|
docstring const & labelString() const;
|
|
/// the next two functions are for the manual labels
|
|
docstring const getLabelWidthString() const;
|
|
/// Set label width string.
|
|
void setLabelWidthString(docstring const & s);
|
|
/// Actual paragraph alignment used
|
|
LyXAlignment getAlign(BufferParams const &) const;
|
|
/// Default paragraph alignment as determined by layout
|
|
LyXAlignment getDefaultAlign(BufferParams const &) const;
|
|
/// The nesting depth of a paragraph
|
|
depth_type getDepth() const;
|
|
/// The maximal possible depth of a paragraph after this one
|
|
depth_type getMaxDepthAfter() const;
|
|
///
|
|
void applyLayout(Layout const & new_layout);
|
|
|
|
/// (logically) erase the char at pos; return true if it was actually erased
|
|
bool eraseChar(pos_type pos, bool trackChanges);
|
|
/// (logically) erase the given range; return the number of chars actually erased
|
|
int eraseChars(pos_type start, pos_type end, bool trackChanges);
|
|
|
|
///
|
|
void resetFonts(Font const & font);
|
|
|
|
/** Get uninstantiated font setting. Returns the difference
|
|
between the characters font and the layoutfont.
|
|
This is what is stored in the fonttable
|
|
*/
|
|
Font const &
|
|
getFontSettings(BufferParams const &, pos_type pos) const;
|
|
///
|
|
Font const & getFirstFontSettings(BufferParams const &) const;
|
|
|
|
/** Get fully instantiated font, i.e., one that does not have any
|
|
attributes with values FONT_INHERIT, FONT_IGNORE or FONT_TOGGLE.
|
|
*/
|
|
Font const getFont(BufferParams const &, pos_type pos,
|
|
Font const & outerfont) const;
|
|
Font const getLayoutFont(BufferParams const &,
|
|
Font const & outerfont) const;
|
|
Font const getLabelFont(BufferParams const &,
|
|
Font const & outerfont) const;
|
|
/**
|
|
* The font returned by the above functions is the same in a
|
|
* span of characters. This method will return the first and
|
|
* the last positions in the paragraph for which that font is
|
|
* the same. This can be used to avoid unnecessary calls to getFont.
|
|
*/
|
|
FontSpan fontSpan(pos_type pos) const;
|
|
///
|
|
char_type getChar(pos_type pos) const;
|
|
/// Get the char, but mirror all bracket characters if it is right-to-left
|
|
char_type getUChar(BufferParams const &, OutputParams const &,
|
|
pos_type pos) const;
|
|
/// pos <= size() (there is a dummy font change at the end of each par)
|
|
void setFont(pos_type pos, Font const & font);
|
|
///
|
|
void insert(pos_type pos, docstring const & str,
|
|
Font const & font, Change const & change);
|
|
|
|
///
|
|
void appendString(docstring const & s, Font const & font,
|
|
Change const & change);
|
|
///
|
|
void appendChar(char_type c, Font const & font, Change const & change);
|
|
///
|
|
void insertChar(pos_type pos, char_type c, bool trackChanges);
|
|
///
|
|
void insertChar(pos_type pos, char_type c,
|
|
Font const &, bool trackChanges);
|
|
///
|
|
void insertChar(pos_type pos, char_type c,
|
|
Font const &, Change const & change);
|
|
/// Insert \p inset at position \p pos with \p change traking status and
|
|
/// \p font.
|
|
/// \return true if successful.
|
|
bool insertInset(pos_type pos, Inset * inset,
|
|
Font const & font, Change const & change);
|
|
///
|
|
Inset * getInset(pos_type pos);
|
|
///
|
|
Inset const * getInset(pos_type pos) const;
|
|
|
|
/// Release inset at given position.
|
|
/// \warning does not honour change tracking!
|
|
/// Therefore, it should only be used for breaking and merging
|
|
/// paragraphs
|
|
Inset * releaseInset(pos_type pos);
|
|
|
|
///
|
|
InsetList const & insetList() const;
|
|
///
|
|
void setInsetBuffers(Buffer &);
|
|
///
|
|
void resetBuffer();
|
|
|
|
///
|
|
bool isHfill(pos_type pos) const;
|
|
|
|
/// hinted by profiler
|
|
bool isInset(pos_type pos) const;
|
|
///
|
|
bool isNewline(pos_type pos) const;
|
|
///
|
|
bool isEnvSeparator(pos_type pos) const;
|
|
/// return true if the char is a word separator
|
|
bool isSeparator(pos_type pos) const;
|
|
///
|
|
bool isLineSeparator(pos_type pos) const;
|
|
/// True if the character/inset at this point is a word separator.
|
|
/// Note that digits in particular are not considered as word separator.
|
|
bool isWordSeparator(pos_type pos, bool const ignore_deleted = false) const;
|
|
/// True if the element at this point is a character that is not a letter.
|
|
bool isChar(pos_type pos) const;
|
|
/// True if the element at this point is a space
|
|
bool isSpace(pos_type pos) const;
|
|
/// True if the element at this point is a hard hyphen or a apostrophe
|
|
/// If it is enclosed by spaces return false
|
|
bool isHardHyphenOrApostrophe(pos_type pos) const;
|
|
/// Return true if this paragraph has verbatim content that needs to be
|
|
/// protected by \cprotect
|
|
bool needsCProtection(bool const fragile = false) const;
|
|
|
|
/// returns true if at least one line break or line separator has been deleted
|
|
/// at the beginning of the paragraph (either physically or logically)
|
|
bool stripLeadingSpaces(bool trackChanges);
|
|
|
|
/// return true if we allow multiple spaces
|
|
bool isFreeSpacing() const;
|
|
|
|
/// return true if we allow this par to stay empty
|
|
bool allowEmpty() const;
|
|
///
|
|
ParagraphParameters & params();
|
|
///
|
|
ParagraphParameters const & params() const;
|
|
|
|
/// Check whether a call to fixBiblio is needed.
|
|
bool brokenBiblio() const;
|
|
/// Check if we are in a Biblio environment and insert or
|
|
/// delete InsetBibitems as necessary.
|
|
/// \retval int 1, if we had to add an inset, in which case
|
|
/// the cursor will need to move cursor forward; -pos, if we deleted
|
|
/// an inset, in which case pos is the position from which the inset
|
|
/// was deleted, and the cursor will need to be moved back one if it
|
|
/// was previously past that position. Return 0 otherwise.
|
|
int fixBiblio(Buffer const & buffer);
|
|
|
|
/// For each author, set 'used' to true if there is a change
|
|
/// by this author in the paragraph.
|
|
void checkAuthors(AuthorList const & authorList);
|
|
|
|
///
|
|
void changeCase(BufferParams const & bparams, pos_type pos,
|
|
pos_type & right, TextCase action);
|
|
|
|
/// find \param str string inside Paragraph.
|
|
/// \return non-zero if the specified string is at the specified
|
|
/// position; returned value is the actual match length in positions
|
|
/// \param del specifies whether deleted strings in ct mode will be considered
|
|
int find(
|
|
docstring const & str, ///< string to search
|
|
bool cs, ///<
|
|
bool mw, ///<
|
|
pos_type pos, ///< start from here.
|
|
bool del = true) const;
|
|
|
|
void locateWord(pos_type & from, pos_type & to,
|
|
word_location const loc, bool const ignore_deleted = false) const;
|
|
///
|
|
void updateWords();
|
|
|
|
/// Spellcheck word at position \p from and fill in found misspelled word
|
|
/// and \p suggestions if \p do_suggestion is true.
|
|
/// \return result from spell checker, SpellChecker::UNKNOWN_WORD when misspelled.
|
|
SpellChecker::Result spellCheck(pos_type & from, pos_type & to, WordLangTuple & wl,
|
|
docstring_list & suggestions, bool do_suggestion = true,
|
|
bool check_learned = false) const;
|
|
|
|
/// Spell checker status at position \p pos.
|
|
/// If \p check_boundary is true the status of position immediately
|
|
/// before \p pos is tested too if it is at word boundary.
|
|
/// \return true if one of the tested positions is misspelled.
|
|
bool isMisspelled(pos_type pos, bool check_boundary = false) const;
|
|
|
|
/// \return the spell range (misspelled area) around position.
|
|
/// Range is empty if word at position is correctly spelled.
|
|
FontSpan const & getSpellRange(pos_type pos) const;
|
|
|
|
/// spell check of whole paragraph
|
|
/// remember results until call of requestSpellCheck()
|
|
void spellCheck() const;
|
|
|
|
/// query state of spell checker results
|
|
bool needsSpellCheck() const;
|
|
/// mark position of text manipulation to inform the spell checker
|
|
/// default value -1 marks the whole paragraph to be checked (again)
|
|
void requestSpellCheck(pos_type pos = -1);
|
|
|
|
/// an automatically generated identifying label for this paragraph.
|
|
/// presently used only in the XHTML output routines.
|
|
std::string magicLabel() const;
|
|
|
|
/// anonymizes the paragraph contents (but not the paragraphs
|
|
/// contained inside it. Does not handle undo.
|
|
void anonymize();
|
|
|
|
private:
|
|
/// Expand the counters for the labelstring of \c layout
|
|
docstring expandParagraphLabel(Layout const &, BufferParams const &,
|
|
bool process_appendix) const;
|
|
///
|
|
void deregisterWords();
|
|
///
|
|
void collectWords();
|
|
///
|
|
void registerWords();
|
|
|
|
/// Pimpl away stuff
|
|
class Private;
|
|
///
|
|
friend class Paragraph::Private;
|
|
///
|
|
Private * d;
|
|
};
|
|
|
|
} // namespace lyx
|
|
|
|
#endif // PARAGRAPH_H
|