The SWORD Project  1.9.0.svnversion
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Pages
TEIXHTML Class Reference

#include <teixhtml.h>

+ Inheritance diagram for TEIXHTML:
+ Collaboration diagram for TEIXHTML:

Classes

class  MyUserData
 

Public Member Functions

virtual const char * getHeader () const
 
virtual char processText (SWBuf &text, const SWKey *key=0, const SWModule *module=0)
 
void setRenderNoteNumbers (bool val=true)
 
 TEIXHTML ()
 

Protected Member Functions

void addAllowedEscapeString (const char *findString)
 
void addEscapeStringSubstitute (const char *findString, const char *replaceString)
 
void addTokenSubstitute (const char *findString, const char *replaceString)
 
void appendEscapeString (SWBuf &buf, const char *escString)
 
virtual BasicFilterUserData * createUserData (const SWModule *module, const SWKey *key)
 
virtual bool handleEscapeString (SWBuf &buf, const char *escString, BasicFilterUserData *userData)
 
virtual bool handleNumericEscapeString (SWBuf &buf, const char *escString)
 
virtual bool handleToken (SWBuf &buf, const char *token, BasicFilterUserData *userData)
 
bool passAllowedEscapeString (SWBuf &buf, const char *escString)
 
virtual bool processStage (char, SWBuf &, char *&, BasicFilterUserData *)
 
void removeAllowedEscapeString (const char *findString)
 
void removeEscapeStringSubstitute (const char *findString)
 
void removeTokenSubstitute (const char *findString)
 
void setEscapeEnd (const char *escEnd)
 
void setEscapeStart (const char *escStart)
 
void setEscapeStringCaseSensitive (bool val)
 
void setPassThruNumericEscapeString (bool val)
 
void setPassThruUnknownEscapeString (bool val)
 
void setPassThruUnknownToken (bool val)
 
virtual void setStageProcessing (char stages)
 
void setTokenCaseSensitive (bool val)
 
void setTokenEnd (const char *tokenEnd)
 
void setTokenStart (const char *tokenStart)
 
bool substituteEscapeString (SWBuf &buf, const char *escString)
 
bool substituteToken (SWBuf &buf, const char *token)
 

Static Protected Attributes

static const char FINALIZE = 8
 
static const char INITIALIZE = 1
 
static const char POSTCHAR = 4
 
static const char PRECHAR = 2
 

Private Attributes

bool renderNoteNumbers
 

Detailed Description

This filter converts TEI text to XHTML text.

Definition at line 33 of file teixhtml.h.

Constructor & Destructor Documentation

TEIXHTML::TEIXHTML ( )

Definition at line 74 of file teixhtml.cpp.

74  {
75  setTokenStart("<");
76  setTokenEnd(">");
77 
78  setEscapeStart("&");
79  setEscapeEnd(";");
80 
82 
83  addAllowedEscapeString("quot");
84  addAllowedEscapeString("apos");
88 
90 
91  renderNoteNumbers = false;
92 }
void setTokenEnd(const char *tokenEnd)
void addAllowedEscapeString(const char *findString)
bool renderNoteNumbers
Definition: teixhtml.h:36
void setTokenCaseSensitive(bool val)
void setEscapeStart(const char *escStart)
void setTokenStart(const char *tokenStart)
void setEscapeStringCaseSensitive(bool val)
void setEscapeEnd(const char *escEnd)

Member Function Documentation

void SWBasicFilter::addAllowedEscapeString ( const char *  findString)
protectedinherited

Registers an escape control sequence that is allowed to pass through unchanged.

Definition at line 156 of file swbasicfilter.cpp.

156  {
157  char *buf = 0;
158 
159  if (!escStringCaseSensitive) {
160  stdstr(&buf, findString);
161  toupperstr(buf);
162  p->escPassSet.insert(StringSet::value_type(buf));
163  delete [] buf;
164  }
165  else p->escPassSet.insert(StringSet::value_type(findString));
166 }
SWORD_NAMESPACE_START char * stdstr(char **ipstr, const char *istr, unsigned int memPadFactor=1)
Definition: utilstr.h:44
bool escStringCaseSensitive
Definition: swbasicfilter.h:74
char * toupperstr(char *t, unsigned int max=0)
Definition: stringmgr.h:107
Private * p
Definition: swbasicfilter.h:82
void SWBasicFilter::addEscapeStringSubstitute ( const char *  findString,
const char *  replaceString 
)
protectedinherited

Registers an escape control sequence together with the string that is substituted for it.

Definition at line 176 of file swbasicfilter.cpp.

176  {
177  char *buf = 0;
178 
179  if (!escStringCaseSensitive) {
180  stdstr(&buf, findString);
181  toupperstr(buf);
182  p->escSubMap.insert(DualStringMap::value_type(buf, replaceString));
183  delete [] buf;
184  }
185  else p->escSubMap.insert(DualStringMap::value_type(findString, replaceString));
186 }
SWORD_NAMESPACE_START char * stdstr(char **ipstr, const char *istr, unsigned int memPadFactor=1)
Definition: utilstr.h:44
bool escStringCaseSensitive
Definition: swbasicfilter.h:74
char * toupperstr(char *t, unsigned int max=0)
Definition: stringmgr.h:107
Private * p
Definition: swbasicfilter.h:82
void SWBasicFilter::addTokenSubstitute ( const char *  findString,
const char *  replaceString 
)
protectedinherited

Registers a simple token substitution. Usually called from the constructor of a subclass.

Definition at line 136 of file swbasicfilter.cpp.

136  {
137  char *buf = 0;
138 
139  if (!tokenCaseSensitive) {
140  stdstr(&buf, findString);
141  toupperstr(buf);
142  p->tokenSubMap[buf] = replaceString;
143  delete [] buf;
144  }
145  else p->tokenSubMap[findString] = replaceString;
146 }
SWORD_NAMESPACE_START char * stdstr(char **ipstr, const char *istr, unsigned int memPadFactor=1)
Definition: utilstr.h:44
bool tokenCaseSensitive
Definition: swbasicfilter.h:75
DualStringMap tokenSubMap
char * toupperstr(char *t, unsigned int max=0)
Definition: stringmgr.h:107
Private * p
Definition: swbasicfilter.h:82
void SWBasicFilter::appendEscapeString ( SWBuf & buf,
const char * escString
)
protectedinherited

Appends escString to buf as an entity, wrapped in the configured escape start and escape end sequences.

Definition at line 216 of file swbasicfilter.cpp.

216  {
217  buf += escStart;
218  buf += escString;
219  buf += escEnd;
220 }
virtual BasicFilterUserData * TEIXHTML::createUserData ( const SWModule * module,
const SWKey * key
)
inlineprotectedvirtual

Reimplemented from SWBasicFilter.

Definition at line 48 of file teixhtml.h.

48  {
49  return new MyUserData(module, key);
50  }
SWORD_NAMESPACE_START const char * TEIXHTML::getHeader ( ) const
virtual

This method can supply a header associated with the processing done with this filter. A typical example is a suggested CSS style block for classed containers.

Reimplemented from SWFilter.

Definition at line 35 of file teixhtml.cpp.

35  {
36  // <pos>, <gen>, <case>, <gram>, <number>, <mood>, <pron>, <def> <tr> <orth> <etym> <usg>
37  const static char *header = "\n\
38  .entryFree, .form, .etym, .def, .usg, .quote {display:block;}\n\
39  .pron, .pos, .oVar, .ref, {display:inline}\n\
40  [type=headword] {font-weight:bold; font-variant:small-caps; text-decoration:underline;}\n\
41  [type=derivative] {font-weight:bold; font-variant:small-caps;}\n\
42  [rend=italic] {font-style:italic;}\n\
43  [rend=bold] {font-weight:bold;}\n\
44  [rend=small-caps] {font-variant:small-caps}\n\
45  .pos:before {content: \"Pos.: \"; font-weight:bold;}\n\
46  .pron:before {content:\" \\\\ \";}\n\
47  .pron:after {content:\" \\\\ \";}\n\
48  .etym:before {content:\"Etym.:\"; display:block; font-weight:bold;}\n\
49  .usg:before {content:\"Usg.:\"; display:block; font-weight:bold;}\n\
50  .def:before {content:\"Def.:\" display:block; font-weight:bold;}\n\
51  .quote {background-color:#cfcfdf; padding:0.3em; margin:0.5em; border-width:1px; border-style:solid;}\n\
52  .cit:before {content:\"quote:\" ; display:block; margin-top:0.5em; font-size:small;}\n\
53  .cit {align:center;}\n\
54  .persName:before {content:\" (\"; font-size:small;}\n\
55  .persName:after {content:\") \"; font-size:small;}\n\
56  .persName {font-size:small;}\n\
57  .number {font-style:bold;}\n\
58  .def {font-style:bold;}\n\
59  ";
60  return header;
61 }
bool SWBasicFilter::handleEscapeString ( SWBuf & buf,
const char * escString,
BasicFilterUserData * userData
)
protectedvirtualinherited

This function is called for every escape sequence encountered in the input text.

Parameters
buf: the output buffer
escString: the escape sequence (e.g. "amp" for &amp;)
userData: user storage space for data transient to one full buffer parse
Returns
false if the escape sequence was not handled; in that case the caller passes it through unchanged only when pass-through of unknown escape sequences is enabled.
Subclasses should return true if they handled the escape sequence, or false if they did not.

Definition at line 286 of file swbasicfilter.cpp.

286  {
287  return substituteEscapeString(buf, escString);
288 }
bool substituteEscapeString(SWBuf &buf, const char *escString)
bool SWBasicFilter::handleNumericEscapeString ( SWBuf & buf,
const char * escString
)
protectedvirtualinherited

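This function is called for all numeric escape sequences. If pass-through of numeric escape sequences is enabled, the sequence is appended to buf unchanged and true is returned; otherwise false is returned.

Parameters
buf: the output buffer
escString: the escape sequence (e.g. "#235" for &#235;)
Returns
subclasses should return true if they handled the escape sequence, or false if they did not.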

Definition at line 244 of file swbasicfilter.cpp.

244  {
245  if (passThruNumericEsc) {
246  appendEscapeString(buf, escString);
247  return true;
248  }
249  return false;
250 }
bool passThruNumericEsc
Definition: swbasicfilter.h:78
void appendEscapeString(SWBuf &buf, const char *escString)
bool TEIXHTML::handleToken ( SWBuf & buf,
const char * token,
BasicFilterUserData * userData
)
protectedvirtual

This function is called for every token encountered in the input text.

Parameters
buf: the output buffer
token: the token (e.g. "p align='left'")
userData: user storage space for data transient to one full buffer parse
Returns
subclasses should return true if they handled the token, or false if they did not.

Reimplemented from SWBasicFilter.

Definition at line 94 of file teixhtml.cpp.

94  {
95  // manually process if it wasn't a simple substitution
96  if (!substituteToken(buf, token)) {
97  MyUserData *u = (MyUserData *)userData;
98  XMLTag tag(token);
99 
100  if (!strcmp(tag.getName(), "p")) {
101  if ((!tag.isEndTag()) && (!tag.isEmpty())) { // non-empty start tag
102  buf += "<!P><br />";
103  }
104  else if (tag.isEndTag()) { // end tag
105  buf += "<!/P><br />";
106  //userData->supressAdjacentWhitespace = true;
107  }
108  else { // empty paragraph break marker
109  buf += "<!P><br />";
110  //userData->supressAdjacentWhitespace = true;
111  }
112  }
113 
114  // <hi>
115  else if (!strcmp(tag.getName(), "hi")) {
116  if ((!tag.isEndTag()) && (!tag.isEmpty())) {
117  SWBuf rend = tag.getAttribute("rend");
118 
119  u->lastHi = rend;
120  if (rend == "italic" || rend == "ital")
121  buf += "<i>";
122  else if (rend == "bold")
123  buf += "<b>";
124  else if (rend == "super" || rend == "sup")
125  buf += "<sup>";
126  else if (rend == "sub")
127  buf += "<sub>";
128  else if (rend == "overline")
129  buf += "<span style=\"text-decoration:overline\">";
130 
131  }
132  else if (tag.isEndTag()) {
133  SWBuf rend = u->lastHi;
134  if (rend == "italic" || rend == "ital")
135  buf += "</i>";
136  else if (rend == "bold")
137  buf += "</b>";
138  else if (rend == "super" || rend == "sup")
139  buf += "</sup>";
140  else if (rend == "sub")
141  buf += "</sub>";
142  else if (rend == "overline")
143  buf += "</span>";
144  }
145  }
146 
147  // <entryFree>
148  else if (!strcmp(tag.getName(), "entryFree")) {
149  if ((!tag.isEndTag()) && (!tag.isEmpty())) {
150  SWBuf n = tag.getAttribute("n");
151  if (n != "") {
152  buf += "<span class=\"entryFree\">";
153  buf += n;
154  buf += "</span>";
155  }
156  }
157  }
158 
159  // <sense>
160  else if (!strcmp(tag.getName(), "sense")) {
161  if ((!tag.isEndTag()) && (!tag.isEmpty())) {
162  SWBuf n = tag.getAttribute("n");
163  buf += "<br/><span class=\"sense";
164  if (n != "") {
165  buf += "\" n=\"";
166  buf += n;
167 
168 
169  }
170  buf += "\">";
171  }
172  else if (tag.isEndTag()) {
173  buf += "</span> ";
174  }
175  }
176 
177  // <div>
178  else if (!strcmp(tag.getName(), "div")) {
179 
180  if ((!tag.isEndTag()) && (!tag.isEmpty())) {
181  buf += "<!P>";
182  }
183  else if (tag.isEndTag()) {
184  }
185  }
186 
187  // <lb.../>
188  else if (!strcmp(tag.getName(), "lb")) {
189  buf += "<br />";
190  }
191 
192  // <pos>, <gen>, <case>, <gram>, <number>, <mood>, <pron>, <def> <tr> <orth> <etym> <usg>
193  else if (!strcmp(tag.getName(), "pos") ||
194  !strcmp(tag.getName(), "gen") ||
195  !strcmp(tag.getName(), "case") ||
196  !strcmp(tag.getName(), "gram") ||
197  !strcmp(tag.getName(), "number") ||
198  !strcmp(tag.getName(), "pron") ||
199  !strcmp(tag.getName(), "def") ||
200  !strcmp(tag.getName(), "tr") ||
201  !strcmp(tag.getName(), "orth") ||
202  !strcmp(tag.getName(), "etym") ||
203  !strcmp(tag.getName(), "usg") ||
204  !strcmp(tag.getName(), "quote")||
205  !strcmp(tag.getName(), "cit")||
206  !strcmp(tag.getName(), "persName")||
207  !strcmp(tag.getName(), "oVar"))
208  {
209  if ((!tag.isEndTag()) && (!tag.isEmpty())) {
210  buf += "<span class=\"";
211  buf += tag.getName();
212  if (tag.getAttribute("type")) {
213  buf += "\" type =\"";
214  buf += tag.getAttribute("type");
215  }
216  if (tag.getAttribute("rend")) {
217  buf += "\" rend =\"";
218  buf += tag.getAttribute("rend");
219  }
220  buf += "\">";
221  }
222  else if (tag.isEndTag()) {
223  buf += "</span>";
224  }
225  }
226 
227  else if (!strcmp(tag.getName(), "ref")) {
228  if (!tag.isEndTag()) {
229  u->suspendTextPassThru = true;
230  SWBuf target;
231  SWBuf work;
232  SWBuf ref;
233 
234  int was_osisref = false;
235  if(tag.getAttribute("osisRef"))
236  {
237  target += tag.getAttribute("osisRef");
238  was_osisref=true;
239  }
240  else if(tag.getAttribute("target"))
241  target += tag.getAttribute("target");
242 
243  if(target.size())
244  {
245  const char* the_ref = strchr(target, ':');
246 
247  if(!the_ref) {
248  // No work
249  ref = target;
250  }
251  else {
252  // Compensate for starting :
253  ref = the_ref + 1;
254 
255  int size = target.size() - ref.size() - 1;
256  work.setSize(size);
257  strncpy(work.getRawData(), target, size);
258  }
259 
260  if(was_osisref)
261  {
262  buf.appendFormatted("<a href=\"passagestudy.jsp?action=showRef&type=scripRef&value=%s&module=%s\">",
263  (ref) ? URL::encode(ref.c_str()).c_str() : "",
264  (work.size()) ? URL::encode(work.c_str()).c_str() : "");
265  }
266  else
267  {
268  // Dictionary link, or something
269  buf.appendFormatted("<a href=\"sword://%s/%s\">",
270  (work.size()) ? URL::encode(work.c_str()).c_str() : u->version.c_str(),
271  (ref) ? URL::encode(ref.c_str()).c_str() : ""
272  );
273  }
274  }
275  else
276  {
277  //std::cout << "TARGET WASN'T\n";
278  }
279 
280  }
281  else {
282  buf += u->lastTextNode.c_str();
283  buf += "</a>";
284 
285  u->suspendTextPassThru = false;
286  }
287  }
288 
289  // <note> tag
290  else if (!strcmp(tag.getName(), "note")) {
291  if (!tag.isEndTag()) {
292  if (!tag.isEmpty()) {
293  u->suspendTextPassThru = true;
294  }
295  }
296  // how does any of this work??? If isEndTag is true, </note>, there will be no attributes.
297  if (tag.isEndTag()) {
298  SWBuf footnoteNumber = tag.getAttribute("swordFootnote");
299  SWBuf noteName = tag.getAttribute("n");
300 
301  buf.appendFormatted("<a href=\"passagestudy.jsp?action=showNote&type=n&value=%s&module=%s&passage=%s\"><small><sup class=\"n\">*n%s</sup></small></a>",
302  URL::encode(footnoteNumber.c_str()).c_str(),
303  URL::encode(u->version.c_str()).c_str(),
304  URL::encode(u->key->getText()).c_str(),
305  (renderNoteNumbers ? URL::encode(noteName.c_str()).c_str() : ""));
306 
307  u->suspendTextPassThru = false;
308  }
309  }
310  // <graphic> image tag
311  else if (!strcmp(tag.getName(), "graphic")) {
312  const char *url = tag.getAttribute("url");
313  if (url) { // assert we have a url attribute
314  SWBuf filepath;
315  if (userData->module) {
316  filepath = userData->module->getConfigEntry("AbsoluteDataPath");
317  if ((filepath.size()) && (filepath[filepath.size()-1] != '/') && (url[0] != '/'))
318  filepath += '/';
319  }
320  filepath += url;
321  buf.appendFormatted("<a href=\"passagestudy.jsp?action=showImage&value=%s&module=%s\"><img src=\"file:%s\" border=\"0\" /></a>",
322  URL::encode(filepath.c_str()).c_str(),
323  URL::encode(u->version.c_str()).c_str(),
324  filepath.c_str());
325  u->suspendTextPassThru = false;
326  }
327  }
328  // <table> <row> <cell>
329  else if (!strcmp(tag.getName(), "table")) {
330  if ((!tag.isEndTag()) && (!tag.isEmpty())) {
331  buf += "<table><tbody>\n";
332  }
333  else if (tag.isEndTag()) {
334  buf += "</tbody></table>\n";
335  u->supressAdjacentWhitespace = true;
336  }
337  }
338  else if (!strcmp(tag.getName(), "row")) {
339  if ((!tag.isEndTag()) && (!tag.isEmpty())) {
340  buf += "\t<tr>";
341  }
342  else if (tag.isEndTag()) {
343  buf += "</tr>\n";
344  }
345  }
346  else if (!strcmp(tag.getName(), "cell")) {
347  if ((!tag.isEndTag()) && (!tag.isEmpty())) {
348  buf += "<td>";
349  }
350  else if (tag.isEndTag()) {
351  buf += "</td>";
352  }
353  }
354  // <list> <item>
355  else if (!strcmp(tag.getName(), "list")) {
356  if ((!tag.isEndTag()) && (!tag.isEmpty())) {
357 
358  SWBuf rend = tag.getAttribute("rend");
359 
360  u->lastHi = rend;
361  if (rend == "numbered") {
362  buf += "<ol>\n";
363  }
364  else if (rend == "lettered") {
365  buf += "<ol type=\"A\">\n";
366  }
367  else if (rend == "bulleted") {
368  buf += "<ul>\n";
369  }
370  else {
371  buf += "<ul class=\"list ";
372  buf += rend.c_str();
373  buf += "\">";
374  }
375  }
376  else if (tag.isEndTag()) {
377  SWBuf rend = u->lastHi;
378  if (rend == "numbered") {
379  buf += "</ol>\n>";
380  }
381  else if (rend == "lettered") {
382  buf += "</ol>\n";
383  }
384  else if (rend == "bulleted") {
385  buf += "</ul>\n";
386  }
387  else {
388  buf += "</ul>\n";
389  }
390  u->supressAdjacentWhitespace = true;
391  }
392  }
393  else if (!strcmp(tag.getName(), "item")) {
394  if ((!tag.isEndTag()) && (!tag.isEmpty())) {
395  buf += "<li>";
396  }
397  else if (tag.isEndTag()) {
398  buf += "</li>\n";
399  }
400  }
401  else {
402  return false; // we still didn't handle token
403  }
404 
405 
406  }
407  return true;
408 }
SWBuf & appendFormatted(const char *format,...)
Definition: swbuf.cpp:81
Definition: swbuf.h:47
virtual const char * getConfigEntry(const char *key) const
Definition: swmodule.cpp:1159
const SWModule * module
Definition: swbasicfilter.h:42
Definition: utilxml.h:38
bool renderNoteNumbers
Definition: teixhtml.h:36
bool substituteToken(SWBuf &buf, const char *token)
char * getRawData()
Definition: swbuf.h:379
const char * c_str() const
Definition: swbuf.h:158
unsigned long size() const
Definition: swbuf.h:185
int size
Definition: regex.c:5043
static const SWBuf encode(const char *urlText)
Definition: url.cpp:231
void setSize(unsigned long len)
Definition: swbuf.h:255
bool SWBasicFilter::passAllowedEscapeString ( SWBuf & buf,
const char * escString
)
protectedinherited

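Passes through allowed escape strings: if escString was registered as allowed, it is appended to buf as an entity and true is returned; otherwise false is returned.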

Definition at line 223 of file swbasicfilter.cpp.

223  {
224  StringSet::iterator it;
225 
226  if (!escStringCaseSensitive) {
227  char *tmp = 0;
228  stdstr(&tmp, escString);
229  toupperstr(tmp);
230  it = p->escPassSet.find(tmp);
231  delete [] tmp;
232  } else
233  it = p->escPassSet.find(escString);
234 
235  if (it != p->escPassSet.end()) {
236  appendEscapeString(buf, escString);
237  return true;
238  }
239 
240  return false;
241 }
SWORD_NAMESPACE_START char * stdstr(char **ipstr, const char *istr, unsigned int memPadFactor=1)
Definition: utilstr.h:44
bool escStringCaseSensitive
Definition: swbasicfilter.h:74
char * toupperstr(char *t, unsigned int max=0)
Definition: stringmgr.h:107
Private * p
Definition: swbasicfilter.h:82
void appendEscapeString(SWBuf &buf, const char *escString)
virtual bool SWBasicFilter::processStage ( char ,
SWBuf & ,
char *& ,
BasicFilterUserData *
)
inlineprotectedvirtualinherited

Reimplemented in OSISPlain.

Definition at line 185 of file swbasicfilter.h.

185 { return false; }
char SWBasicFilter::processText ( SWBuf & text,
const SWKey * key = 0,
const SWModule * module = 0
)
virtualinherited

This method processes and appropriately modifies the text given to it for a particular filter task.

Parameters
text: the text to be filtered/converted
key: the current key that was used
module: the current module
Returns
0

Implements SWFilter.

Reimplemented in ThMLRTF, OSISOSIS, and OSISRTF.

Definition at line 315 of file swbasicfilter.cpp.

315  {
316  char *from;
317  char token[4096];
318  int tokpos = 0;
319  bool intoken = false;
320  bool inEsc = false;
321  int escStartPos = 0, escEndPos = 0;
322  int tokenStartPos = 0, tokenEndPos = 0;
323  SWBuf lastTextNode;
324  BasicFilterUserData *userData = createUserData(module, key);
325 
326  SWBuf orig = text;
327  from = orig.getRawData();
328  text = "";
329 
330  if (processStages & INITIALIZE) {
331  if (processStage(INITIALIZE, text, from, userData)) { // processStage handled it all
332  delete userData;
333  return 0;
334  }
335  }
336 
337  for (;*from; from++) {
338 
339  if (processStages & PRECHAR) {
340  if (processStage(PRECHAR, text, from, userData)) // processStage handled this char
341  continue;
342  }
343 
344  if (*from == tokenStart[tokenStartPos]) {
345  if (tokenStartPos == (tokenStartLen - 1)) {
346  intoken = true;
347  tokpos = 0;
348  token[0] = 0;
349  token[1] = 0;
350  token[2] = 0;
351  inEsc = false;
352  }
353  else tokenStartPos++;
354  continue;
355  }
356 
357  if (*from == escStart[escStartPos]) {
358  if (escStartPos == (escStartLen - 1)) {
359  intoken = true;
360  tokpos = 0;
361  token[0] = 0;
362  token[1] = 0;
363  token[2] = 0;
364  inEsc = true;
365  }
366  else escStartPos++;
367  continue;
368  }
369 
370  if (inEsc) {
371  if (*from == escEnd[escEndPos]) {
372  if (escEndPos == (escEndLen - 1)) {
373  intoken = inEsc = false;
374  userData->lastTextNode = lastTextNode;
375 
376  if (!userData->suspendTextPassThru) { //if text through is disabled no tokens should pass, too
377  if ((!handleEscapeString(text, token, userData)) && (passThruUnknownEsc)) {
378  appendEscapeString(text, token);
379  }
380  }
381  escEndPos = escStartPos = tokenEndPos = tokenStartPos = 0;
382  lastTextNode = "";
383  continue;
384  }
385  }
386  }
387 
388  if (!inEsc) {
389  if (*from == tokenEnd[tokenEndPos]) {
390  if (tokenEndPos == (tokenEndLen - 1)) {
391  intoken = false;
392  userData->lastTextNode = lastTextNode;
393  if ((!handleToken(text, token, userData)) && (passThruUnknownToken)) {
394  text += tokenStart;
395  text += token;
396  text += tokenEnd;
397  }
398  escEndPos = escStartPos = tokenEndPos = tokenStartPos = 0;
399  lastTextNode = "";
400  if (!userData->suspendTextPassThru) {
401  userData->lastSuspendSegment.size(0);
402  }
403  continue;
404  }
405  }
406  }
407 
408  if (intoken) {
409  if (tokpos < 4090) {
410  token[tokpos++] = *from;
411  token[tokpos+2] = 0;
412  }
413  }
414  else {
415  if ((!userData->supressAdjacentWhitespace) || (*from != ' ')) {
416  if (!userData->suspendTextPassThru) {
417  text.append(*from);
418  }
419  else userData->lastSuspendSegment.append(*from);
420  lastTextNode.append(*from);
421  }
422  userData->supressAdjacentWhitespace = false;
423  }
424 
425  if (processStages & POSTCHAR)
426  processStage(POSTCHAR, text, from, userData);
427 
428  }
429 
430  if (processStages & FINALIZE)
431  processStage(FINALIZE, text, from, userData);
432 
433  delete userData;
434  return 0;
435 }
static const char PRECHAR
Definition: swbasicfilter.h:97
Definition: swbuf.h:47
static const char POSTCHAR
Definition: swbasicfilter.h:98
char * tokenStart
Definition: swbasicfilter.h:64
virtual bool handleToken(SWBuf &buf, const char *token, BasicFilterUserData *userData)
bool passThruUnknownEsc
Definition: swbasicfilter.h:77
virtual bool handleEscapeString(SWBuf &buf, const char *escString, BasicFilterUserData *userData)
bool passThruUnknownToken
Definition: swbasicfilter.h:76
static const char FINALIZE
Definition: swbasicfilter.h:99
char * getRawData()
Definition: swbuf.h:379
SWBuf & append(const char *str, long max=-1)
Definition: swbuf.h:274
virtual bool processStage(char, SWBuf &, char *&, BasicFilterUserData *)
virtual BasicFilterUserData * createUserData(const SWModule *module, const SWKey *key)
Definition: swbasicfilter.h:91
unsigned long size() const
Definition: swbuf.h:185
static const char INITIALIZE
Definition: swbasicfilter.h:96
void appendEscapeString(SWBuf &buf, const char *escString)
void SWBasicFilter::removeAllowedEscapeString ( const char *  findString)
protectedinherited

Unregisters an esc control sequence that can pass unchanged

Definition at line 169 of file swbasicfilter.cpp.

169  {
170  if (p->escPassSet.find(findString) != p->escPassSet.end()) {
171  p->escPassSet.erase( p->escPassSet.find(findString) );
172  }
173 }
Private * p
Definition: swbasicfilter.h:82
void SWBasicFilter::removeEscapeStringSubstitute ( const char *  findString)
protectedinherited

Unregisters an esc control sequence

Definition at line 189 of file swbasicfilter.cpp.

189  {
190  if (p->escSubMap.find(findString) != p->escSubMap.end()) {
191  p->escSubMap.erase( p->escSubMap.find(findString) );
192  }
193 }
Private * p
Definition: swbasicfilter.h:82
void SWBasicFilter::removeTokenSubstitute ( const char *  findString)
protectedinherited

Unregisters a simple token substitute

Definition at line 149 of file swbasicfilter.cpp.

149  {
150  if (p->tokenSubMap.find(findString) != p->tokenSubMap.end()) {
151  p->tokenSubMap.erase( p->tokenSubMap.find(findString) );
152  }
153 }
DualStringMap tokenSubMap
Private * p
Definition: swbasicfilter.h:82
void SWBasicFilter::setEscapeEnd ( const char *  escEnd)
protectedinherited

Sets the end of escape sequence (by default ";").

Definition at line 297 of file swbasicfilter.cpp.

297  {
298  stdstr(&(this->escEnd), escEnd);
299  escEndLen = strlen(escEnd);
300 }
SWORD_NAMESPACE_START char * stdstr(char **ipstr, const char *istr, unsigned int memPadFactor=1)
Definition: utilstr.h:44
void SWBasicFilter::setEscapeStart ( const char *  escStart)
protectedinherited

Sets the beginning of escape sequence (by default "&").

Definition at line 291 of file swbasicfilter.cpp.

291  {
292  stdstr(&(this->escStart), escStart);
293  escStartLen = strlen(escStart);
294 }
SWORD_NAMESPACE_START char * stdstr(char **ipstr, const char *istr, unsigned int memPadFactor=1)
Definition: utilstr.h:44
void SWBasicFilter::setEscapeStringCaseSensitive ( bool  val)
protectedinherited

Are escape strings case sensitive or not? Call this function before addEscapeStringSubstitute().

Definition at line 131 of file swbasicfilter.cpp.

131  {
133 }
bool escStringCaseSensitive
Definition: swbasicfilter.h:74
void SWBasicFilter::setPassThruNumericEscapeString ( bool  val)
protectedinherited

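Sets whether to pass thru a numeric escape sequence unchanged or allow it to be handled otherwise. Default is false. Note: the implementation listed below assigns passThruUnknownEsc rather than passThruNumericEsc (the flag that handleNumericEscapeString() tests), so as listed this call changes the unknown-escape pass-through setting instead.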

Definition at line 121 of file swbasicfilter.cpp.

121  {
122  passThruUnknownEsc = val;
123 }
bool passThruUnknownEsc
Definition: swbasicfilter.h:77
void SWBasicFilter::setPassThruUnknownEscapeString ( bool  val)
protectedinherited

Sets whether to pass thru an unknown escape sequence unchanged or just remove it. Default is false.

Definition at line 116 of file swbasicfilter.cpp.

116  {
117  passThruUnknownEsc = val;
118 }
bool passThruUnknownEsc
Definition: swbasicfilter.h:77
void SWBasicFilter::setPassThruUnknownToken ( bool  val)
protectedinherited

Sets whether to pass thru an unknown token unchanged or just remove it. Default is false.

Definition at line 111 of file swbasicfilter.cpp.

111  {
112  passThruUnknownToken = val;
113 }
bool passThruUnknownToken
Definition: swbasicfilter.h:76
void TEIXHTML::setRenderNoteNumbers ( bool  val = true)
inline

Definition at line 54 of file teixhtml.h.

54 { renderNoteNumbers = val; }
bool renderNoteNumbers
Definition: teixhtml.h:36
virtual void SWBasicFilter::setStageProcessing ( char  stages)
inlineprotectedvirtualinherited

Definition at line 186 of file swbasicfilter.h.

186 { processStages = stages; } // see STATICs up above
void SWBasicFilter::setTokenCaseSensitive ( bool  val)
protectedinherited

Are tokens case sensitive (like in GBF) or not? Call this function before addTokenSubstitute()

Definition at line 126 of file swbasicfilter.cpp.

126  {
127  tokenCaseSensitive = val;
128 }
bool tokenCaseSensitive
Definition: swbasicfilter.h:75
void SWBasicFilter::setTokenEnd ( const char *  tokenEnd)
protectedinherited

Sets the sequence that ends a token (by default ">").

Definition at line 309 of file swbasicfilter.cpp.

309  {
310  stdstr(&(this->tokenEnd), tokenEnd);
311  tokenEndLen = strlen(tokenEnd);
312 }
SWORD_NAMESPACE_START char * stdstr(char **ipstr, const char *istr, unsigned int memPadFactor=1)
Definition: utilstr.h:44
void SWBasicFilter::setTokenStart ( const char *  tokenStart)
protectedinherited

Sets the sequence that starts a token (by default "<").

Definition at line 303 of file swbasicfilter.cpp.

303  {
304  stdstr(&(this->tokenStart), tokenStart);
305  tokenStartLen = strlen(tokenStart);
306 }
char * tokenStart
Definition: swbasicfilter.h:64
SWORD_NAMESPACE_START char * stdstr(char **ipstr, const char *istr, unsigned int memPadFactor=1)
Definition: utilstr.h:44
bool SWBasicFilter::substituteEscapeString ( SWBuf & buf,
const char * escString
)
protectedinherited

This function performs the substitution of escapeStrings

Definition at line 253 of file swbasicfilter.cpp.

253  {
254  DualStringMap::iterator it;
255 
256  if (*escString == '#') {
257  return handleNumericEscapeString(buf, escString);
258  }
259 
260  if (passAllowedEscapeString(buf, escString)) {
261  return true;
262  }
263 
264  if (!escStringCaseSensitive) {
265  char *tmp = 0;
266  stdstr(&tmp, escString);
267  toupperstr(tmp);
268  it = p->escSubMap.find(tmp);
269  delete [] tmp;
270  } else
271  it = p->escSubMap.find(escString);
272 
273  if (it != p->escSubMap.end()) {
274  buf += it->second.c_str();
275  return true;
276  }
277  return false;
278 }
virtual bool handleNumericEscapeString(SWBuf &buf, const char *escString)
SWORD_NAMESPACE_START char * stdstr(char **ipstr, const char *istr, unsigned int memPadFactor=1)
Definition: utilstr.h:44
const char * c_str() const
Definition: swbuf.h:158
bool escStringCaseSensitive
Definition: swbasicfilter.h:74
bool passAllowedEscapeString(SWBuf &buf, const char *escString)
char * toupperstr(char *t, unsigned int max=0)
Definition: stringmgr.h:107
Private * p
Definition: swbasicfilter.h:82
bool SWBasicFilter::substituteToken ( SWBuf & buf,
const char * token
)
protectedinherited

This function performs the substitution of tokens

Definition at line 196 of file swbasicfilter.cpp.

196  {
197  DualStringMap::iterator it;
198 
199  if (!tokenCaseSensitive) {
200  char *tmp = 0;
201  stdstr(&tmp, token);
202  toupperstr(tmp);
203  it = p->tokenSubMap.find(tmp);
204  delete [] tmp;
205  } else
206  it = p->tokenSubMap.find(token);
207 
208  if (it != p->tokenSubMap.end()) {
209  buf += it->second.c_str();
210  return true;
211  }
212  return false;
213 }
SWORD_NAMESPACE_START char * stdstr(char **ipstr, const char *istr, unsigned int memPadFactor=1)
Definition: utilstr.h:44
const char * c_str() const
Definition: swbuf.h:158
bool tokenCaseSensitive
Definition: swbasicfilter.h:75
DualStringMap tokenSubMap
char * toupperstr(char *t, unsigned int max=0)
Definition: stringmgr.h:107
Private * p
Definition: swbasicfilter.h:82

Member Data Documentation

const char SWBasicFilter::FINALIZE = 8
staticprotectedinherited

Definition at line 99 of file swbasicfilter.h.

const char SWBasicFilter::INITIALIZE = 1
staticprotectedinherited

Definition at line 96 of file swbasicfilter.h.

const char SWBasicFilter::POSTCHAR = 4
staticprotectedinherited

Definition at line 98 of file swbasicfilter.h.

const char SWBasicFilter::PRECHAR = 2
staticprotectedinherited

Definition at line 97 of file swbasicfilter.h.

bool TEIXHTML::renderNoteNumbers
private

Definition at line 36 of file teixhtml.h.


The documentation for this class was generated from the following files: