docstring cleanAttr(docstring const & str) { docstring newname; docstring::const_iterator it = str.begin(); docstring::const_iterator en = str.end(); for (; it != en; ++it) { char_type const c = *it; newname += isAlnumASCII(c) ? c : char_type('_'); } return newname; }
static docstring const cleanupWhitespace(docstring const & citelist) { docstring::const_iterator it = citelist.begin(); docstring::const_iterator end = citelist.end(); // Paranoia check: make sure that there is no whitespace in here // -- at least not behind commas or at the beginning docstring result; char_type last = ','; for (; it != end; ++it) { if (*it != ' ') last = *it; if (*it != ' ' || last != ',') result += *it; } return result; }
static docstring const printable_list(docstring const & invalid_chars) { docstring s; docstring::const_iterator const begin = invalid_chars.begin(); docstring::const_iterator const end = invalid_chars.end(); docstring::const_iterator it = begin; for (; it != end; ++it) { if (it != begin) s += ", "; if (*it == ' ') s += _("space"); else s += *it; } return s; }
docstring sgml::cleanID(Buffer const & buf, OutputParams const & runparams, docstring const & orig) { // The standard DocBook SGML declaration only allows letters, // digits, '-' and '.' in a name. // Since users might change that declaration one has to cater // for additional allowed characters. // This routine replaces illegal characters by '-' or '.' // and adds a number for uniqueness. // If you know what you are doing, you can set allowed=="" // to disable this mangling. DocumentClass const & tclass = buf.params().documentClass(); docstring const allowed = from_ascii( runparams.flavor == OutputParams::XML ? ".-_:" : tclass.options()); if (allowed.empty()) return orig; docstring::const_iterator it = orig.begin(); docstring::const_iterator end = orig.end(); docstring content; // FIXME THREAD typedef map<docstring, docstring> MangledMap; static MangledMap mangledNames; static int mangleID = 1; MangledMap::const_iterator const known = mangledNames.find(orig); if (known != mangledNames.end()) return known->second; // make sure it starts with a letter if (!isAlphaASCII(*it) && allowed.find(*it) >= allowed.size()) content += "x"; bool mangle = false; for (; it != end; ++it) { char_type c = *it; if (isAlphaASCII(c) || isDigitASCII(c) || c == '-' || c == '.' || allowed.find(c) < allowed.size()) content += c; else if (c == '_' || c == ' ') { mangle = true; content += "-"; } else if (c == ':' || c == ',' || c == ';' || c == '!') { mangle = true; content += "."; } else { mangle = true; } } if (mangle) content += "-" + convert<docstring>(mangleID++); else if (isDigitASCII(content[content.size() - 1])) content += "."; mangledNames[orig] = content; return content; }