void ConvertString(char *string) /****************************************************************************** purpose : converts string in TeX-format to Rtf-format ******************************************************************************/ { char temp[256]; if (string==NULL) return; if (strlen(string)<250) strncpy(temp,string,250); else { strncpy(temp,string,125); strncpy(temp+125,"\n...\n", 5); strncpy(temp+130,string+strlen(string)-125,125); temp[255] = '\0'; } if (PushSource(NULL, string) == 0) { diagnostics(4, "Entering Convert() from StringConvert()\n******\n%s\n*****",temp); while (StillSource()) Convert(); PopSource(); diagnostics(4, "Exiting Convert() from StringConvert()"); } }
int getStringDimension(char *s) { int size = 0; if (s != NULL) { PushSource(NULL, s); size = getDimension(); PopSource(); } diagnostics(5, "getStringDimension fore '%s' is %d twips", s, size); return size; }
void ConvertAllttString(char *s) /****************************************************************************** purpose : converts string in TeX-format to Rtf-format according to the alltt environment, which is like verbatim environment except that \, {, and } have their usual meanings ******************************************************************************/ { char cThis; if (s==NULL) return; diagnostics(4, "Entering Convert() from StringAllttConvert()"); if(PushSource(NULL, s)==0) { while (StillSource()) { cThis = getRawTexChar(); /* it is a verbatim like environment */ switch (cThis) { case '\\': PushLevels(); TranslateCommand(); CleanStack(); break; case '{': PushBrace(); fprintRTF("{"); break; case '}': ret = RecursionLevel - PopBrace(); fprintRTF("}"); break; default: putRtfChar(cThis); break; } } PopSource(); } diagnostics(4, "Exiting Convert() from StringAllttConvert()"); }
void CmdBibliography(int code) { int err; char *s; s = getBraceParam(); /*throw away bibliography name */ free(s); err=PushSource(g_bbl_name, NULL); if (!err) { diagnostics(4, "CmdBibliography ... begin Convert()"); Convert(); diagnostics(4, "CmdBibliography ... done Convert()"); PopSource(); } else diagnostics(WARNING, "Cannot open bibliography file. Create %s using BibTeX", g_bbl_name); }
/****************************************************************************** purpose: return a copy of tag from \label{tag} in the string text ******************************************************************************/ char *ExtractLabelTag(const char *text) { char *s, *label_with_spaces, *label; s = strstr(text, "\\label{"); if (!s) s = strstr(text, "\\label "); if (!s) return NULL; s += strlen("\\label"); PushSource(NULL, s); label_with_spaces = getBraceParam(); PopSource(); label = strdup_nobadchars(label_with_spaces); free(label_with_spaces); diagnostics(4, "LabelTag = <%s>", (label) ? label : "missing"); return label; }
char * ExtractAndRemoveTag(char *tag, char *text) /****************************************************************************** purpose: remove 'tag{contents}' from text and return contents note that tag should typically be "\\caption" ******************************************************************************/ { char *s, *contents, *start, *end; s = text; diagnostics(5, "target tag = <%s>", tag); diagnostics(5, "original text = <%s>", text); while (s) { /* find start of caption */ start = strstr(s,tag); if (!start) return NULL; s = start+strlen(tag); if (*s == ' ' || *s == '{') break; } PushSource(NULL,s); contents = getBraceParam(); PopSource(); if (!contents) return NULL; end = strstr(s,contents)+strlen(contents)+1; /* end just after '}' */ free(contents); contents = my_strndup(start,(size_t) (end-start)); do *start++=*end++; while (*end); /* erase "tag{contents}" */ *start='\0'; diagnostics(5, "final contents = <%s>", contents); diagnostics(5, "final text = <%s>", text); return contents; }
char * ExtractLabelTag(char *text) /****************************************************************************** purpose: return a copy of tag from \label{tag} in the string text ******************************************************************************/ { char *s, *label_with_spaces, *label; s = strstr(text,"\\label{"); if (!s) s = strstr(text,"\\label "); if (!s) return NULL; s += strlen("\\label"); PushSource(NULL,s); label_with_spaces = getBraceParam(); PopSource(); label = strdup_nobadchars(label_with_spaces); free(label_with_spaces); diagnostics(4, "LabelTag = <%s>", (label) ? label : "missing"); return label; }
void preParse(char **body, char **header, char **label) /************************************************************************** purpose: obtain the next section of the latex file This is now a preparsing routine that breaks a file up into sections. Macro expansion happens here as well. \input and \include are also handled here. The reason for this routine is allow \labels to refer to sections. This routine reads text until a new section heading is found. The text is returned in body and the *next* header is returned in header. If no header follows then NULL is returned. **************************************************************************/ { int any_possible_match, found; char cNext, cThis, *s, *text, *next_header, *str, *p; int i; int possible_match[43]; char *command[43] = { "", /* 0 entry is for user definitions */ "", /* 1 entry is for user environments */ "\\begin{verbatim}", "\\begin{figure}", "\\begin{figure*}", "\\begin{equation}", "\\begin{equation*}", "\\begin{eqnarray}", "\\begin{eqnarray*}", "\\begin{table}", "\\begin{table*}", "\\begin{description}", "\\begin{comment}", "\\end{verbatim}", "\\end{figure}", "\\end{figure*}", "\\end{equation}", "\\end{equation*}", "\\end{eqnarray}", "\\end{eqnarray*}", "\\end{table}", "\\end{table*}", "\\end{description}", "\\end{comment}", "\\part", "\\chapter", "\\section", "\\subsection", "\\subsubsection", "\\section*", "\\subsection*", "\\subsubsection*", "\\label", "\\input", "\\include", "\\verb", "\\url", "\\nolinkurl", "\\newcommand", "\\def", "\\renewcommand", "\\endinput", "\\end{document}", }; int ncommands = 43; const int b_verbatim_item = 2; const int b_figure_item = 3; const int b_figure_item2 = 4; const int b_equation_item = 5; const int b_equation_item2 = 6; const int b_eqnarray_item = 7; const int b_eqnarray_item2 = 8; const int b_table_item = 9; const int b_table_item2 = 10; const int b_description_item = 11; const int b_comment_item = 12; const int e_verbatim_item = 13; const int e_figure_item = 14; const int e_figure_item2 = 15; const int e_equation_item = 16; const int e_equation_item2 = 17; const int e_eqnarray_item = 18; const int e_eqnarray_item2 = 19; const int e_table_item = 20; const int e_table_item2 = 21; const int e_description_item = 22; const int e_comment_item = 23; const int label_item = 32; const int input_item = 33; const int include_item = 34; const int verb_item = 35; const int url_item = 36; const int nolinkurl_item = 37; const int new_item = 38; const int def_item = 39; const int renew_item = 40; const int endinput_item = 41; const int e_document_item = 42; int bs_count = 0; /* number of backslashes encountered in a row */ size_t cmd_pos = 0; /* position of start of command relative to end of buffer */ int label_depth = 0; int i_match = 0; text = NULL; next_header = NULL; /* typically becomes \subsection{Cows eat grass} */ *body = NULL; *header = NULL; *label = NULL; PushTrackLineNumber(FALSE); reset_buffer(); while (1) { cThis = getRawTexChar(); while (cThis == '\0' && getParserDepth() > 0) { PopSource(); diagnostics(4,"parser depth is now %d", getParserDepth()); cThis = getRawTexChar(); } if (cThis == '\0') diagnostics(6, "[%ld] xchar=000 '\\0' (backslash count=%d)", section_buffer_end, bs_count); else if (cThis == '\n') diagnostics(6, "[%ld] xchar=012 '\\n' (backslash count=%d)", section_buffer_end, bs_count); else diagnostics(6, "[%ld] xchar=%03d '%c' (backslash count=%d)", section_buffer_end, (int) cThis, cThis, bs_count); cThis = skipBOM(cThis); add_chr_to_buffer(cThis); if (cThis == '\0') break; if (cThis == '%' && even(bs_count)) { int n = 1; /* remove initial % */ do { cNext = getRawTexChar(); add_chr_to_buffer(cNext); n++; } while (cNext != '\n' && cNext != '\0'); move_end_of_buffer(-n); if (0) show_buffer("percent"); continue; } /* cmd_pos > 0 means that we have encountered a '\' and some fraction of a command, e.g., '\sec', therefore the first time that a backslash is found then cmd_pos becomes 1, */ if (cThis == '\\') { bs_count++; if (odd(bs_count)) { /* avoid "\\section" and "\\\\section" */ for (i = 0; i < ncommands; i++) possible_match[i] = TRUE; cmd_pos = 1; continue; } } else bs_count = 0; if (cmd_pos == 0) continue; /* replace "\ " and "\\n" with a space */ if (cmd_pos == 1 && (cThis == '\n' || cThis == ' ') ) { move_end_of_buffer(-1); add_chr_to_buffer(' '); cmd_pos = 0; continue; } /* at this point we are have encountered a command and may have to do something. if it is a user definition, then the user definition is expanded here if it is a user environment, then expansion also happens here it it is something else then we may or may not have to mess with it. */ /* hack to convert '\begin {' --> '\begin{' */ if (cThis==' ' && (matches_buffer_tail("\\begin") || matches_buffer_tail("\\end")) ) { diagnostics(5, "matched '\\begin ' or '\\end '"); do {cThis = getRawTexChar();} while (cThis == ' '); } /* hack to convert '\begin{ ' --> '\begin{' */ if (cThis==' ' && (matches_buffer_tail("\\begin{") || matches_buffer_tail("\\end{")) ) { diagnostics(5, "matched '\\begin{ ' or '\\end{ '"); do {cThis = getRawTexChar();} while (cThis == ' '); } any_possible_match = FALSE; found = FALSE; /* is is possibly a user defined command? */ if (possible_match[0]) { possible_match[0] = maybeDefinition(section_buffer + section_buffer_end - cmd_pos + 1, cmd_pos - 1); if (possible_match[0]) { /* test to make sure \userdef is complete */ any_possible_match = TRUE; cNext = getRawTexChar(); /* wrong when cNext == '%' */ ungetTexChar(cNext); if (!isalpha((int) cNext)) { /* is macro name complete? */ *(section_buffer + section_buffer_end + 1) = '\0'; i = existsDefinition(section_buffer + section_buffer_end - cmd_pos + 1); if (i > -1) { diagnostics(4, "matched <%s> ", section_buffer + section_buffer_end - cmd_pos); if (cNext == ' ') { cNext = getNonSpace(); ungetTexChar(cNext); } move_end_of_buffer(-cmd_pos-1); /* remove \userdef */ str = expandDefinition(i); PushSource(NULL, str); free(str); cmd_pos = 0; bs_count = 0; continue; } } } } /* is it a user defined environment? */ if (possible_match[1]) { char *pp = section_buffer + section_buffer_end - cmd_pos; possible_match[1] = maybeEnvironment(pp, cmd_pos); if (possible_match[1] == TRUE) { any_possible_match = TRUE; cNext = getRawTexChar(); /* wrong when cNext == '%' */ /* \begin{name} or \end{name} will end with '}' */ if (cNext == '}') { char *ss = NULL; *(pp + cmd_pos + 1) = '\0'; if (*(pp + 1) == 'e') { i = existsEnvironment(pp + strlen("\\end{")); ss = expandEnvironment(i, CMD_END); } else { i = existsEnvironment(pp + strlen("\\begin{")); ss = expandEnvironment(i, CMD_BEGIN); } if (ss) { /* found */ diagnostics(5, "matched <%s}>", pp); diagnostics(5, "expanded to <%s>", ss); PushSource(NULL, ss); move_end_of_buffer(-cmd_pos-1); /* remove \begin{userenvironment} */ free(ss); cmd_pos = 0; continue; } } ungetTexChar(cNext); /* put the character back */ } } /* is it one of the commands listed above? */ for (i = 2; i < ncommands; i++) { if (possible_match[i]) { if (cThis == command[i][cmd_pos]) any_possible_match = TRUE; else possible_match[i] = FALSE; diagnostics(6,"cmd_pos = %d, char = %c, possible match %s, size=%d, possible=%d", \ cmd_pos,cThis,command[i],strlen(command[i]),possible_match[i]); } } i_match = -1; for (i = 2; i < ncommands; i++) { /* discover any exact matches */ if (possible_match[i]) { diagnostics(6, "testing for <%s>", command[i]); /* right length? */ if (cmd_pos+1 == strlen(command[i])) { if (i<=e_comment_item || i==e_comment_item) { /* these entries are complete matches */ found = TRUE; } else { /* these entries we need to be a bit more careful and check next character */ cNext = getRawTexChar(); ungetTexChar(cNext); /* this test for the end of commands may still need tweaking */ if (!isalpha(cNext) && cNext != '*') { found = TRUE; } } } } if (found == TRUE) { diagnostics(6,"preparse matched '%s'",command[i]); i_match = i; break; } } if (any_possible_match) cmd_pos++; else cmd_pos = 0; /* no possible matches, reset and wait for next '\\' */ if (!found) continue; if (i_match == endinput_item) { diagnostics(6, "\\endinput"); move_end_of_buffer(-9); /* remove \endinput */ PopSource(); cmd_pos = 0; /* keep looking */ continue; } /* \end{document} reached! Stop processing */ if (i_match == e_document_item) { diagnostics(6, "\\end{document}"); move_end_of_buffer(-strlen(command[e_document_item])); add_chr_to_buffer('\0'); safe_free(*header); *header = strdup(command[e_document_item]); p = section_buffer; while (*p==' ' || *p == '\n') p++; *body = strdup(p); PopTrackLineNumber(); diagnostics(6, "body = %s", section_buffer); diagnostics(6, "next header = '%s'", command[e_document_item]); return; } if (i_match == verb_item) { /* slurp \verb#text# */ char cc; cNext = getRawTexChar(); add_chr_to_buffer(cNext); diagnostics(6, "verb char = %c", cNext); do { cc = getRawTexChar(); add_chr_to_buffer(cc); } while (cc != cNext && cc != '\0'); cmd_pos = 0; /* reset the command position */ continue; } /* cannot ignore this because it may contain unescaped '%' */ if (i_match == url_item || i_match == nolinkurl_item) { char cc; do { cc = getRawTexChar(); add_chr_to_buffer(cc); } while (cc != '\0' && cc != '}'); cmd_pos = 0; /* reset the command position */ continue; } if (i_match == include_item) { CmdInclude(0); move_end_of_buffer(-strlen(command[i])); cmd_pos = 0; /* reset the command position */ continue; } if (i_match == input_item) { CmdInclude(1); move_end_of_buffer(-strlen(command[i])); cmd_pos = 0; /* reset the command position */ continue; } if (i_match == label_item) { char *tag; tag = getBraceParam(); /* append \label{tag} to the buffer */ add_chr_to_buffer('{'); add_str_to_buffer(tag); add_chr_to_buffer('}'); if (!(*label) && strlen(tag) && label_depth == 0) *label = strdup_nobadchars(tag); free(tag); cmd_pos = 0; /* keep looking */ continue; } /* process any new definitions */ if (i_match == def_item || i_match == new_item || i_match == renew_item) { cNext = getRawTexChar(); /* wrong when cNext == '%' */ ungetTexChar(cNext); if (isalpha((int) cNext)) /* is macro name complete? */ continue; move_end_of_buffer(-strlen(command[i])); /* do not include in buffer */ if (i_match == def_item) CmdNewDef(DEF_DEF); else if (i_match == new_item) CmdNewDef(DEF_NEW); else CmdNewDef(DEF_RENEW); cmd_pos = 0; /* keep looking */ continue; } if (i_match == b_figure_item || i_match == b_figure_item2 || i_match == b_equation_item || i_match == b_equation_item2 || i_match == b_eqnarray_item || i_match == b_eqnarray_item2 || i_match == b_table_item || i_match == b_table_item2 || i_match == b_description_item) { label_depth++; /* labels now will not be the section label */ cmd_pos = 0; continue; } if (i_match == e_figure_item || i_match == e_figure_item2 || i_match == e_equation_item || i_match == e_equation_item2 || i_match == e_eqnarray_item || i_match == e_eqnarray_item2 || i_match == e_table_item || i_match == e_table_item2 || i_match == e_description_item) { label_depth--; /* labels may now be the section label */ cmd_pos = 0; continue; } if (i_match == b_verbatim_item) { /* slurp environment ... toxic contents! */ s = getTexUntil(command[e_verbatim_item], TRUE); add_str_to_buffer(s); free(s); add_str_to_buffer(command[e_verbatim_item]); diagnostics(4,"matched \\end{verbatim}"); cmd_pos = 0; /* keep looking */ continue; } if (i_match == b_comment_item) { /* slurp environment ... toxic contents! */ s = getTexUntil(command[e_comment_item], TRUE); add_str_to_buffer(s); free(s); add_str_to_buffer(command[e_comment_item]); cmd_pos = 0; /* keep looking */ continue; } diagnostics(4, "possible end of section"); diagnostics(4, "label_depth = %d", label_depth); if (label_depth > 0) /* still in a \begin{xxx} environment? */ continue; /* actually found command to end the section */ diagnostics(4, "preParse() found command to end section"); s = getBraceParam(); next_header = strdup_together4(command[i], "{", s, "}"); free(s); move_end_of_buffer(-strlen(command[i])); add_chr_to_buffer('\0'); break; } /*eliminate white space at beginning of buffer */ p = section_buffer; while (*p==' ' || *p == '\n') p++; *body = strdup(p); safe_free(*header); *header = next_header; PopTrackLineNumber(); }
static void ConvertNatbib(char *s, int code, char *pre, char *post) { char *n, *year, *abbv, *full, *v; PushSource(NULL,s); n=getBraceParam(); year=getBraceParam(); abbv=getBraceParam(); full=getBraceParam(); PopSource(); diagnostics(5,"natbib [%s] <%s> <%s> <%s> <%s>",pre,n,year,abbv,full); switch (code) { case CITE_CITE: case CITE_T: case CITE_T_STAR: v=abbv; if (CITE_T==code && g_citation_longnamesfirst && !g_current_cite_seen) if (!isEmptyName(full)) v = full; if (CITE_T_STAR==code) if (!isEmptyName(full)) v = full; if (CITE_CITE==code && g_citation_longnamesfirst) if (!isEmptyName(full)) v = full; ConvertString(v); fprintRTF(" ("); ConvertString(year); if (pre){ fprintRTF(", "); ConvertString(pre); } if (post) { fprintRTF(", "); ConvertString(post); } fprintRTF(")"); break; case CITE_P: case CITE_P_STAR: v=abbv; if (CITE_P==code && g_citation_longnamesfirst && !g_current_cite_seen) if (!isEmptyName(full)) v = full; if (CITE_P_STAR==code) if (!isEmptyName(full)) v = full; if (pre && g_current_cite_item==1){ ConvertString(pre); fprintRTF(" "); } if (strcmp(v,g_last_author_cited)!=0) { /*suppress repeated names */ ConvertString(v); strcpy(g_last_author_cited,v); } fprintRTF(", "); ConvertString(year); if (post && *post !='\0') { fprintRTF(", "); ConvertString(post); fprintRTF(" "); } break; case CITE_AUTHOR: case CITE_AUTHOR_STAR: v=abbv; if (CITE_AUTHOR==code && g_citation_longnamesfirst && !g_current_cite_seen) v = full; if (CITE_AUTHOR_STAR==code) v = full; ConvertString(v); break; case CITE_YEAR: case CITE_YEAR_P: if (pre){ ConvertString(pre); fprintRTF(" "); } ConvertString(year); if (post) { fprintRTF(", "); ConvertString(post); } break; } free(n); free(year); free(abbv); free(full); }