...warning about (for now only) functions and variables with external linkage that likely don't need it. The problems with moving entities into unnamed namespacs and breaking ADL (as alluded to in comments in compilerplugins/clang/external.cxx) are illustrated by the fact that while struct S1 { int f() { return 0; } }; int f(S1 s) { return s.f(); } namespace N { struct S2: S1 { int f() { return 1; } }; int f(S2 s) { return s.f(); } } int main() { return f(N::S2()); } returns 1, both moving just the struct S2 into an nunnamed namespace, struct S1 { int f() { return 0; } }; int f(S1 s) { return s.f(); } namespace N { namespace { struct S2: S1 { int f() { return 1; } }; } int f(S2 s) { return s.f(); } } int main() { return f(N::S2()); } as well as moving just the function f overload into an unnamed namespace, struct S1 { int f() { return 0; } }; int f(S1 s) { return s.f(); } namespace N { struct S2: S1 { int f() { return 1; } }; namespace { int f(S2 s) { return s.f(); } } } int main() { return f(N::S2()); } would each change the program to return 0 instead. Change-Id: I4d09f7ac5e8f9bcd6e6bde4712608444b642265c Reviewed-on: https://gerrit.libreoffice.org/60539 Tested-by: Jenkins Reviewed-by: Stephan Bergmann <sbergman@redhat.com>
775 lines
26 KiB
C++
775 lines
26 KiB
C++
/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
|
|
/*
|
|
* This file is part of the LibreOffice project.
|
|
*
|
|
* This Source Code Form is subject to the terms of the Mozilla Public
|
|
* License, v. 2.0. If a copy of the MPL was not distributed with this
|
|
* file, You can obtain one at http://mozilla.org/MPL/2.0/.
|
|
*
|
|
* This file incorporates work covered by the following license notice:
|
|
*
|
|
* Licensed to the Apache Software Foundation (ASF) under one or more
|
|
* contributor license agreements. See the NOTICE file distributed
|
|
* with this work for additional information regarding copyright
|
|
* ownership. The ASF licenses this file to you under the Apache
|
|
* License, Version 2.0 (the "License"); you may not use this file
|
|
* except in compliance with the License. You may obtain a copy of
|
|
* the License at http://www.apache.org/licenses/LICENSE-2.0 .
|
|
*/
|
|
|
|
#include <assert.h>
|
|
#include <stdio.h>
|
|
#include <string.h>
|
|
|
|
// DVO: always use standard headers:
|
|
#include <istream>
|
|
#include <sstream>
|
|
using namespace std;
|
|
|
|
#include "mzstring.h"
|
|
#include "hwpeq.h"
|
|
#include <sal/types.h>
|
|
#include <sal/macros.h>
|
|
|
|
#include <rtl/character.hxx>
|
|
|
|
/* @Man: change the hwp formula to LaTeX */
|
|
#ifdef _WIN32
|
|
# define ENDL "\r\n"
|
|
#else /* !WIN32 */
|
|
# define ENDL "\n"
|
|
#endif
|
|
|
|
#define EQ_CASE 0x01 // case sensitive cmd
|
|
#define EQ_ENV 0x02 // equiv to latex environment
|
|
#define EQ_ATOP 0x04 // must revert order
|
|
|
|
static bool IS_WS(std::istream::int_type ch) {
|
|
return ch != std::istream::traits_type::eof()
|
|
&& rtl::isAsciiWhiteSpace(
|
|
static_cast<unsigned char>(
|
|
std::istream::traits_type::to_char_type(ch)));
|
|
}
|
|
|
|
static bool IS_BINARY(std::istream::int_type ch) {
|
|
return ch != std::istream::traits_type::eof()
|
|
&& strchr("+-<=>", std::istream::traits_type::to_char_type(ch));
|
|
}
|
|
|
|
#ifdef _WIN32
|
|
#define STRICMP stricmp
|
|
#else
|
|
#define STRICMP strcasecmp
|
|
#endif
|
|
|
|
// sub and sup script status
|
|
enum { SCRIPT_NONE, SCRIPT_SUB, SCRIPT_SUP, SCRIPT_ALL};
|
|
|
|
static int eq_word(MzString& outs, istream *strm, int script = SCRIPT_NONE);
|
|
static bool eq_sentence(MzString& outs, istream *strm, const char *end = nullptr);
|
|
|
|
struct hwpeq {
|
|
const char *key; // hwp math keyword
|
|
const char *latex; // corresponding latex keyword
|
|
int nargs; // # of argument
|
|
unsigned char flag; // case sensitive?
|
|
};
|
|
|
|
static const hwpeq eq_tbl[] = {
|
|
{ "!=", "\\equiv ", 0, 0 },
|
|
{ "#", "\\\\", 0, 0 },
|
|
{ "+-", "\\pm ", 0, 0 },
|
|
{ "-+", "\\mp ", 0, 0 },
|
|
{ "<=", "\\leq ", 0, 0 },
|
|
{ "==", "\\equiv ", 0, 0 },
|
|
{ ">=", "\\geq ", 0, 0 },
|
|
{ "Pr", nullptr, 0, 0 },
|
|
{ "^", "^", 1, 0 },
|
|
{ "_", "_", 1, 0 },
|
|
{ "`", "\\;", 0, 0 },
|
|
{ "acute", nullptr, 1, 0 },
|
|
{ "aleph", nullptr, 0, 0 },
|
|
{ "alpha", nullptr, 0, EQ_CASE },
|
|
{ "amalg", nullptr, 0, 0 },
|
|
{ "and", nullptr, 0, 0 },
|
|
{ "angle", nullptr, 0, 0 },
|
|
{ "angstrom", nullptr, 0, 0 },
|
|
{ "approx", nullptr, 0, 0 },
|
|
{ "arc", nullptr, 0, 0 },
|
|
{ "arccos", nullptr, 0, 0 },
|
|
{ "arch", nullptr, 0, 0 },
|
|
{ "arcsin", nullptr, 0, 0 },
|
|
{ "arctan", nullptr, 0, 0 },
|
|
{ "arg", nullptr, 0, 0 },
|
|
{ "assert", "\\vdash", 0, 0 },
|
|
{ "ast", nullptr, 0, 0 },
|
|
{ "asymp", nullptr, 0, 0 },
|
|
{ "atop", nullptr, 1, EQ_ATOP },
|
|
{ "backslash", nullptr, 0, 0 },
|
|
{ "bar", nullptr, 1, 0 },
|
|
{ "because", nullptr, 0, 0 },
|
|
{ "beta", nullptr, 0, EQ_CASE },
|
|
{ "big", nullptr, 0, EQ_CASE },
|
|
{ "bigcap", nullptr, 0, 0 },
|
|
{ "bigcirc", nullptr, 0, 0 },
|
|
{ "bigcup", nullptr, 0, 0 },
|
|
{ "bigg", nullptr, 0, EQ_CASE },
|
|
{ "bigodiv", nullptr, 0, 0 },
|
|
{ "bigodot", nullptr, 0, 0 },
|
|
{ "bigominus", nullptr, 0, 0 },
|
|
{ "bigoplus", nullptr, 0, 0 },
|
|
{ "bigotimes", nullptr, 0, 0 },
|
|
{ "bigsqcap", nullptr, 0, 0 },
|
|
{ "bigsqcup", nullptr, 0, 0 },
|
|
{ "biguplus", nullptr, 0, 0 },
|
|
{ "bigvee", nullptr, 0, 0 },
|
|
{ "bigwedge", nullptr, 0, 0 },
|
|
{ "binom", nullptr, 2, 0 },
|
|
{ "bmatrix", nullptr, 0, EQ_ENV },
|
|
{ "bold", nullptr, 0, 0 },
|
|
{ "bot", nullptr, 0, 0 },
|
|
{ "breve", nullptr, 1, 0 },
|
|
{ "buildrel", nullptr, 0, 0 }, // LATER
|
|
{ "bullet", nullptr, 0, 0 },
|
|
{ "cap", nullptr, 0, 0 },
|
|
{ "cases", nullptr, 0, EQ_ENV },
|
|
{ "ccol", nullptr, 0, 0 }, /* Center vertically */
|
|
{ "cdot", nullptr, 0, 0 },
|
|
{ "cdots", nullptr, 0, 0 },
|
|
{ "check", nullptr, 1, 0 },
|
|
{ "chi", nullptr, 0, EQ_CASE },
|
|
{ "choose", nullptr, 0, EQ_ATOP },
|
|
{ "circ", nullptr, 0, 0 },
|
|
{ "col", nullptr, 0, 0 }, // LATER
|
|
{ "cong", nullptr, 0, 0 },
|
|
{ "coprod", nullptr, 0, 0 },
|
|
{ "cos", nullptr, 0, 0 },
|
|
{ "cosec", nullptr, 0, 0 },
|
|
{ "cosh", nullptr, 0, 0 },
|
|
{ "cot", nullptr, 0, 0 },
|
|
{ "coth", nullptr, 0, 0 },
|
|
{ "cpile", nullptr, 0, 0 }, // LATER
|
|
{ "csc", nullptr, 0, 0 },
|
|
{ "cup", nullptr, 0, 0 },
|
|
{ "dagger", nullptr, 0, 0 },
|
|
{ "dashv", nullptr, 0, 0 },
|
|
{ "ddagger", nullptr, 0, 0 },
|
|
{ "ddot", nullptr, 1, 0 },
|
|
{ "ddots", nullptr, 0, 0 },
|
|
{ "def", nullptr, 0, 0 },
|
|
{ "deg", nullptr, 0, 0 },
|
|
{ "del", nullptr, 0, 0 },
|
|
{ "delta", nullptr, 0, EQ_CASE },
|
|
{ "diamond", nullptr, 0, 0 },
|
|
{ "dim", nullptr, 0, 0 },
|
|
{ "div", nullptr, 0, 0 },
|
|
{ "divide", nullptr, 0, 0 },
|
|
{ "dline", nullptr, 0, 0 },
|
|
{ "dmatrix", nullptr, 0, EQ_ENV },
|
|
{ "dot", nullptr, 1, 0 },
|
|
{ "doteq", nullptr, 0, 0 },
|
|
{ "dotsaxis", nullptr, 0, 0 },
|
|
{ "dotsdiag", nullptr, 0, 0 },
|
|
{ "dotslow", "\\ldots", 0, 0 },
|
|
{ "dotsvert", "\\vdots", 0, 0 },
|
|
{ "downarrow", nullptr, 0, EQ_CASE },
|
|
{ "dsum", "+", 0, 0 },
|
|
{ "dyad", nullptr, 0, 0 }, // LATER
|
|
{ "ell", nullptr, 0, 0 },
|
|
{ "emptyset", nullptr, 0, 0 },
|
|
{ "epsilon", nullptr, 0, EQ_CASE },
|
|
{ "eqalign", nullptr, 0, EQ_ENV },
|
|
{ "equiv", nullptr, 0, 0 },
|
|
{ "eta", nullptr, 0, EQ_CASE },
|
|
{ "exarrow", nullptr, 0, 0 },
|
|
{ "exist", "\\exists", 0, 0 },
|
|
{ "exists", nullptr, 0, 0 },
|
|
{ "exp", nullptr, 0, EQ_CASE },
|
|
{ "for", nullptr, 0, 0 },
|
|
{ "forall", nullptr, 0, 0 },
|
|
{ "from", "_", 1, 0 },
|
|
{ "gamma", nullptr, 0, EQ_CASE },
|
|
{ "gcd", nullptr, 0, 0 },
|
|
{ "ge", "\\geq", 0, 0 },
|
|
{ "geq", nullptr, 0, 0 },
|
|
{ "ggg", nullptr, 0, 0 },
|
|
{ "grad", nullptr, 0, 0 },
|
|
{ "grave", nullptr, 1, 0 },
|
|
{ "hat", "\\widehat", 1, 0 },
|
|
{ "hbar", nullptr, 0, 0 },
|
|
{ "hom", nullptr, 0, 0 },
|
|
{ "hookleft", nullptr, 0, 0 },
|
|
{ "hookright", nullptr, 0, 0 },
|
|
{ "identical", nullptr, 0, 0 }, // LATER
|
|
{ "if", nullptr, 0, 0 },
|
|
{ "imag", nullptr, 0, 0 },
|
|
{ "image", nullptr, 0, 0 },
|
|
{ "imath", nullptr, 0, 0 },
|
|
{ "in", nullptr, 0, 0 },
|
|
{ "inf", "\\infty", 0, 0 },
|
|
{ "infinity", "\\infty", 0, 0 },
|
|
{ "infty", nullptr, 0, 0 },
|
|
{ "int", nullptr, 0, 0 },
|
|
{ "integral", "\\int", 0, 0 },
|
|
{ "inter", "\\bigcap", 0, 0 },
|
|
{ "iota", nullptr, 0, EQ_CASE },
|
|
{ "iso", nullptr, 0, 0 }, // ams
|
|
{ "it", nullptr, 0, 0 },
|
|
{ "jmath", nullptr, 0, 0 },
|
|
{ "kappa", nullptr, 0, EQ_CASE },
|
|
{ "ker", nullptr, 0, 0 },
|
|
{ "lambda", nullptr, 0, EQ_CASE },
|
|
{ "land", nullptr, 0, 0 }, // LATER
|
|
{ "langle", nullptr, 0, 0 },
|
|
{ "larrow", "\\leftarrow", 0, EQ_CASE },
|
|
{ "lbrace", nullptr, 0, 0 },
|
|
{ "lbrack", "[", 0, 0 },
|
|
{ "lceil", nullptr, 0, 0 },
|
|
{ "lcol", nullptr, 0, 0 }, // LATER
|
|
{ "ldots", nullptr, 0, 0 },
|
|
{ "le", nullptr, 0, 0 },
|
|
{ "left", nullptr, 0, 0 },
|
|
{ "leftarrow", nullptr, 0, EQ_CASE },
|
|
{ "leq", nullptr, 0, 0 },
|
|
{ "lfloor", nullptr, 0, 0 },
|
|
{ "lg", nullptr, 0, 0 },
|
|
{ "lim", nullptr, 0, EQ_CASE },
|
|
{ "line", "\\vert", 0, 0 },
|
|
{ "liter", "\\ell", 0, 0 },
|
|
{ "lll", nullptr, 0, 0 }, // ams
|
|
{ "ln", nullptr, 0, 0 },
|
|
{ "log", nullptr, 0, 0 },
|
|
{ "lor", "\\vee", 0, 0 },
|
|
{ "lparen", "(", 0, 0 },
|
|
{ "lpile", nullptr, 0, 0 }, // LATER
|
|
{ "lrarrow", "\\leftrightarrow", 0, EQ_CASE },
|
|
{ "lrharpoons", "\\leftrightharpoons",0, 0 },
|
|
{ "mapsto", nullptr, 0, 0 },
|
|
{ "massert", "\\dashv", 0, 0 },
|
|
{ "matrix", nullptr, 0, EQ_ENV },
|
|
{ "max", nullptr, 0, 0 },
|
|
{ "mho", nullptr, 0, 0 }, // ams
|
|
{ "min", nullptr, 0, 0 },
|
|
{ "minusplus", nullptr, 0, 0 },
|
|
{ "mit", "", 0, 0 }, // font
|
|
{ "mod", "\\bmod", 0, 0 },
|
|
{ "models", nullptr, 0, 0 },
|
|
{ "msangle", nullptr, 0, 0 }, // LATER
|
|
{ "mu", nullptr, 0, EQ_CASE },
|
|
{ "nabla", nullptr, 0, 0 },
|
|
{ "ne", nullptr, 0, 0 },
|
|
{ "nearrow", nullptr, 0, 0 },
|
|
{ "neg", nullptr, 0, 0 },
|
|
{ "neq", nullptr, 0, 0 },
|
|
{ "nequiv", nullptr, 0, 0 },
|
|
{ "ni", nullptr, 0, 0 },
|
|
{ "not", nullptr, 0, 0 },
|
|
{ "notin", nullptr, 0, 0 },
|
|
{ "nu", nullptr, 0, EQ_CASE },
|
|
{ "nwarrow", nullptr, 0, 0 },
|
|
{ "odiv", nullptr, 0, 0 },
|
|
{ "odot", nullptr, 0, 0 },
|
|
{ "oint", nullptr, 0, 0 },
|
|
{ "omega", nullptr, 0, EQ_CASE },
|
|
{ "omicron", nullptr, 0, EQ_CASE },
|
|
{ "ominus", nullptr, 0, 0 },
|
|
{ "oplus", nullptr, 0, 0 },
|
|
{ "or ", nullptr, 0, 0 },
|
|
{ "oslash", nullptr, 0, 0 },
|
|
{ "otimes", nullptr, 0, 0 },
|
|
{ "over", nullptr, 1, EQ_ATOP },
|
|
{ "overline", nullptr, 1, 0 },
|
|
{ "owns", "\\ni", 0, 0 },
|
|
{ "parallel", nullptr, 0, 0 },
|
|
{ "partial", nullptr, 0, 0 },
|
|
{ "phantom", nullptr, 0, 0 },
|
|
{ "phi", nullptr, 0, EQ_CASE },
|
|
{ "pi", nullptr, 0, EQ_CASE },
|
|
{ "pile", nullptr, 0, 0 }, // LATER
|
|
{ "plusminus", "\\pm", 0, 0 },
|
|
{ "pmatrix", nullptr, 0, EQ_ENV },
|
|
{ "prec", nullptr, 0, 0 },
|
|
{ "prep", nullptr, 0, 0 },
|
|
{ "prime", nullptr, 0, 0 },
|
|
{ "prod", nullptr, 0, 0 },
|
|
{ "propto", nullptr, 0, 0 },
|
|
{ "psi", nullptr, 0, EQ_CASE },
|
|
{ "rangle", nullptr, 0, 0 },
|
|
{ "rarrow", "\\rightarrow", 0, EQ_CASE },
|
|
{ "rbrace", "]", 0, 0 },
|
|
{ "rbrace", nullptr, 0, 0 },
|
|
{ "rceil", nullptr, 0, 0 },
|
|
{ "rcol", nullptr, 0, 0 }, // LATER
|
|
{ "real", "\\Re", 0, 0 },
|
|
{ "reimage", nullptr, 0, 0 },
|
|
{ "rel", nullptr, 0, 0 },
|
|
{ "rfloor", nullptr, 0, 0 },
|
|
{ "rho", nullptr, 0, EQ_CASE },
|
|
{ "right", nullptr, 0, 0 },
|
|
{ "rightarrow", nullptr, 0, EQ_CASE },
|
|
{ "rlharpoons", nullptr, 0, 0 },
|
|
{ "rm", nullptr, 0, 0 },
|
|
{ "root", "\\sqrt", 1, 0 },
|
|
{ "rparen", ")", 0, 0 },
|
|
{ "rpile", nullptr, 0, 0 }, // LATER
|
|
{ "rtangle", nullptr, 0, 0 },
|
|
{ "sangle", nullptr, 0, 0 },
|
|
{ "scale", nullptr, 0, 0 },
|
|
{ "searrow", nullptr, 0, 0 },
|
|
{ "sec", nullptr, 0, 0 },
|
|
{ "sigma", nullptr, 0, EQ_CASE },
|
|
{ "sim", nullptr, 0, 0 },
|
|
{ "simeq", nullptr, 0, 0 },
|
|
{ "sin", nullptr, 0, 0 },
|
|
{ "sinh", nullptr, 0, 0 },
|
|
{ "slash", nullptr, 0, 0 },
|
|
{ "smallint", nullptr, 0, 0 },
|
|
{ "smallinter", nullptr, 0, 0 },
|
|
{ "smalloint", nullptr, 0, 0 },
|
|
{ "smallprod", nullptr, 0, 0 },
|
|
{ "smallsum", nullptr, 0, 0 },
|
|
{ "smallunion", nullptr, 0, 0 },
|
|
{ "smcoprod", nullptr, 0, 0 },
|
|
{ "sqcap", nullptr, 0, 0 },
|
|
{ "sqcup", nullptr, 0, 0 },
|
|
{ "sqrt", nullptr, 1, 0 },
|
|
{ "sqsubset", nullptr, 0, 0 },
|
|
{ "sqsubseteq", nullptr, 0, 0 },
|
|
{ "sqsupset", nullptr, 0, 0 },
|
|
{ "sqsupseteq", nullptr, 0, 0 },
|
|
{ "star", nullptr, 0, 0 },
|
|
{ "sub", "_", 0, 0 },
|
|
{ "subset", nullptr, 0, 0 },
|
|
{ "subseteq", nullptr, 0, 0 },
|
|
{ "succ", nullptr, 0, 0 },
|
|
{ "sum", nullptr, 0, 0 },
|
|
{ "sup", "^", 0, 0 },
|
|
{ "superset", nullptr, 0, 0 },
|
|
{ "supset", nullptr, 0, 0 },
|
|
{ "supseteq", nullptr, 0, 0 },
|
|
{ "swarrow", nullptr, 0, 0 },
|
|
{ "tan", nullptr, 0, 0 },
|
|
{ "tanh", nullptr, 0, 0 },
|
|
{ "tau", nullptr, 0, EQ_CASE },
|
|
{ "therefore", nullptr, 0, 0 },
|
|
{ "theta", nullptr, 0, EQ_CASE },
|
|
{ "tilde", "\\widetilde", 1, 0 },
|
|
{ "times", nullptr, 0, 0 },
|
|
{ "to", "^", 1, 0 },
|
|
{ "top", nullptr, 0, 0 },
|
|
{ "triangle", nullptr, 0, 0 },
|
|
{ "triangled", nullptr, 0, 0 },
|
|
{ "trianglel", nullptr, 0, 0 },
|
|
{ "triangler", nullptr, 0, 0 },
|
|
{ "triangleu", nullptr, 0, 0 },
|
|
{ "udarrow", "\\updownarrow",0, EQ_CASE },
|
|
{ "under", "\\underline", 1, 0 },
|
|
{ "underline", "\\underline", 1, 0 },
|
|
{ "union", "\\bigcup", 0, 0 },
|
|
{ "uparrow", nullptr, 0, EQ_CASE },
|
|
{ "uplus", nullptr, 0, 0 },
|
|
{ "upsilon", nullptr, 0, EQ_CASE },
|
|
{ "varepsilon", nullptr, 0, 0 },
|
|
{ "varphi", nullptr, 0, 0 },
|
|
{ "varpi", nullptr, 0, 0 },
|
|
{ "varrho", nullptr, 0, 0 },
|
|
{ "varsigma", nullptr, 0, 0 },
|
|
{ "vartheta", nullptr, 0, 0 },
|
|
{ "varupsilon", nullptr, 0, 0 },
|
|
{ "vdash", nullptr, 0, 0 },
|
|
{ "vdots", nullptr, 0, 0 },
|
|
{ "vec", nullptr, 1, 0 },
|
|
{ "vee", nullptr, 0, 0 },
|
|
{ "vert", nullptr, 0, 0 },
|
|
{ "wedge", nullptr, 0, 0 },
|
|
{ "wp", nullptr, 0, 0 },
|
|
{ "xi", nullptr, 0, EQ_CASE },
|
|
{ "xor", nullptr, 0, 0 },
|
|
{ "zeta", nullptr, 0, EQ_CASE }
|
|
};
|
|
|
|
static const hwpeq *lookup_eqn(char const *str)
|
|
{
|
|
static const int eqCount = SAL_N_ELEMENTS(eq_tbl);
|
|
int l = 0, r = eqCount;
|
|
const hwpeq *result = nullptr;
|
|
|
|
while( l < r ) {
|
|
const int m = (l + r) / 2;
|
|
const int k = strcmp(eq_tbl[m].key, str);
|
|
if( k == 0 ) {
|
|
result = eq_tbl + m;
|
|
break;
|
|
}
|
|
else if( k < 0 )
|
|
l = m + 1;
|
|
else
|
|
r = m;
|
|
}
|
|
return result;
|
|
}
|
|
|
|
/* If only the first character is uppercase or all characters are uppercase, change to lowercase */
|
|
static void make_keyword( char *keyword, const char *token)
|
|
{
|
|
char* ptr;
|
|
bool result = true;
|
|
int len = strlen(token);
|
|
assert(keyword);
|
|
|
|
if( 255 < len )
|
|
{
|
|
len = 255;
|
|
}
|
|
memcpy(keyword, token, len);
|
|
keyword[len] = 0;
|
|
|
|
if( (token[0] & 0x80) || rtl::isAsciiLowerCase(static_cast<unsigned char>(token[0])) || strlen(token) < 2 )
|
|
return;
|
|
|
|
bool capital = rtl::isAsciiUpperCase(
|
|
static_cast<unsigned char>(keyword[1]));
|
|
for( ptr = keyword + 2; *ptr && result; ptr++ )
|
|
{
|
|
if( (*ptr & 0x80) ||
|
|
(!capital && rtl::isAsciiUpperCase(static_cast<unsigned char>(*ptr))) ||
|
|
(capital && rtl::isAsciiLowerCase(static_cast<unsigned char>(*ptr))) )
|
|
{
|
|
result = false;
|
|
}
|
|
}
|
|
|
|
if( result )
|
|
{
|
|
ptr = keyword;
|
|
while( *ptr )
|
|
{
|
|
if( rtl::isAsciiUpperCase(static_cast<unsigned char>(*ptr)) )
|
|
*ptr = sal::static_int_cast<char>(
|
|
rtl::toAsciiLowerCase(static_cast<unsigned char>(*ptr)));
|
|
ptr++;
|
|
}
|
|
}
|
|
}
|
|
|
|
// token reading function
|
|
struct eq_stack {
|
|
MzString white;
|
|
MzString token;
|
|
istream *strm;
|
|
|
|
eq_stack() { strm = nullptr; };
|
|
bool state(istream const *s) {
|
|
if( strm != s) { white = nullptr; token = nullptr; }
|
|
return token.length() != 0;
|
|
}
|
|
};
|
|
|
|
static eq_stack *stk = nullptr;
|
|
|
|
static void push_token(MzString const &white, MzString const &token, istream *strm)
|
|
{
|
|
// one time stack
|
|
assert(stk->token.length() == 0);
|
|
|
|
stk->white = white;
|
|
stk->token = token;
|
|
stk->strm = strm;
|
|
}
|
|
|
|
/*
|
|
* It returns the length of the read tokens.
|
|
*
|
|
* control char, control sequence, binary sequence,
|
|
* alphabet string, single character */
|
|
static int next_token(MzString &white, MzString &token, istream *strm)
|
|
{
|
|
std::istream::int_type ch = 0;
|
|
|
|
if( stk->state(strm) ) {
|
|
white = stk->white;
|
|
token = stk->token;
|
|
stk->token = nullptr;
|
|
stk->white = nullptr;
|
|
return token.length();
|
|
}
|
|
|
|
token = nullptr;
|
|
white = nullptr;
|
|
if( !strm->good() || (ch = strm->get()) == std::istream::traits_type::eof() )
|
|
return 0;
|
|
|
|
// read preceding ws
|
|
if( IS_WS(ch) ) {
|
|
do white << static_cast<char>(ch);
|
|
while( IS_WS(ch = strm->get()) );
|
|
}
|
|
|
|
if( ch == '\\' || ch & 0x80
|
|
|| (ch != std::istream::traits_type::eof() && rtl::isAsciiAlpha(ch)) )
|
|
{
|
|
if( ch == '\\' ) {
|
|
token << static_cast<char>(ch);
|
|
ch = strm->get();
|
|
}
|
|
do {
|
|
token << static_cast<char>(ch);
|
|
ch = strm->get();
|
|
} while( ch != std::istream::traits_type::eof()
|
|
&& (ch & 0x80 || rtl::isAsciiAlpha(ch)) ) ;
|
|
strm->putback(static_cast<char>(ch));
|
|
/* special treatment of sub, sub, over, atop
|
|
The reason for this is that affect next_state().
|
|
*/
|
|
if( !STRICMP("sub", token) || !STRICMP("from", token) ||
|
|
!STRICMP("sup", token) || !STRICMP("to", token) ||
|
|
!STRICMP("over", token) || !STRICMP("atop", token) ||
|
|
!STRICMP("left", token) || !STRICMP("right", token) )
|
|
{
|
|
char buf[256];
|
|
make_keyword(buf, token);
|
|
token = buf;
|
|
}
|
|
if( !token.compare("sub") || !token.compare("from") )
|
|
token = "_";
|
|
if( !token.compare("sup") || !token.compare("to") )
|
|
token = "^";
|
|
}
|
|
else if( IS_BINARY(ch) ) {
|
|
do token << static_cast<char>(ch);
|
|
while( IS_BINARY(ch = strm->get()) );
|
|
strm->putback(static_cast<char>(ch));
|
|
}
|
|
else if( ch != std::istream::traits_type::eof() && rtl::isAsciiDigit(ch) ) {
|
|
do {
|
|
token << static_cast<char>(ch);
|
|
ch = strm->get();
|
|
} while( ch != std::istream::traits_type::eof() && rtl::isAsciiDigit(ch) );
|
|
strm->putback(static_cast<char>(ch));
|
|
}
|
|
else
|
|
token << static_cast<char>(ch);
|
|
|
|
return token.length();
|
|
}
|
|
|
|
static std::istream::int_type read_white_space(MzString& outs, istream *strm)
|
|
{
|
|
std::istream::int_type result;
|
|
|
|
if( stk->state(strm) ) {
|
|
outs << stk->white;
|
|
stk->white = nullptr;
|
|
result = std::istream::traits_type::to_int_type(stk->token[0]);
|
|
}
|
|
else {
|
|
std::istream::int_type ch;
|
|
while( IS_WS(ch = strm->get()) )
|
|
outs << static_cast<char>(ch);
|
|
strm->putback(static_cast<char>(ch));
|
|
result = ch;
|
|
}
|
|
return result;
|
|
}
|
|
|
|
/* If the argument is not required, delimiters are space and brace for each items.
|
|
sqrt {ab} c = sqrt {ab} c
|
|
(,} are for grouping
|
|
^ ,_ are for combination
|
|
|
|
Sorting of formats with arguments, such as sqrt
|
|
sqrt a -> sqrt {a}
|
|
sqrt {a} -> sqrt {a}
|
|
If there is more than one argument, it eliminates backslash between arguments.
|
|
\frac a b -> frac {a} {b}
|
|
Clean the form of over
|
|
a over b -> {a} over {b}
|
|
*/
|
|
|
|
static int eq_word(MzString& outs, istream *strm, int status)
|
|
{
|
|
MzString token, white, state;
|
|
int result;
|
|
char keyword[256];
|
|
const hwpeq *eq;
|
|
|
|
next_token(white, token, strm);
|
|
if (token.length() <= 0)
|
|
return 0;
|
|
result = token[0];
|
|
|
|
if( token.compare("{") == 0 ) {
|
|
state << white << token;
|
|
eq_sentence(state, strm, "}");
|
|
}
|
|
else if( token.compare("left") == 0 ) {
|
|
state << white << token;
|
|
next_token(white, token, strm);
|
|
state << white << token;
|
|
|
|
eq_sentence(state, strm, "right");
|
|
|
|
next_token(white, token, strm);
|
|
state << white << token;
|
|
}
|
|
else {
|
|
/* Normal token */
|
|
int script_status = SCRIPT_NONE;
|
|
while( true ) {
|
|
state << white << token;
|
|
make_keyword(keyword, token);
|
|
if( token[0] == '^' )
|
|
script_status |= SCRIPT_SUP;
|
|
else if( token[0] == '_' )
|
|
script_status |= SCRIPT_SUB;
|
|
else
|
|
script_status = SCRIPT_NONE;
|
|
|
|
if( nullptr != (eq = lookup_eqn(keyword)) ) {
|
|
int nargs = eq->nargs;
|
|
while( nargs-- ) {
|
|
const std::istream::int_type ch = read_white_space(state, strm);
|
|
if( ch != '{' ) state << '{';
|
|
eq_word(state, strm, script_status);
|
|
if( ch != '{' ) state << '}';
|
|
}
|
|
}
|
|
|
|
if( !next_token(white, token, strm) )
|
|
break;
|
|
// end loop and restart with this
|
|
if( (token[0] == '^' && status && !(status & SCRIPT_SUP)) ||
|
|
(token[0] == '_' && status && !(status & SCRIPT_SUB)) ||
|
|
strcmp("over", token) == 0 || strcmp("atop", token) == 0 ||
|
|
strchr("{}#&`", token[0]) ||
|
|
(!strchr("^_", token[0]) && white.length()) )
|
|
{
|
|
push_token(white, token, strm);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
outs << state;
|
|
|
|
return result;
|
|
}
|
|
|
|
static bool eq_sentence(MzString& outs, istream *strm, const char *end)
|
|
{
|
|
MzString state;
|
|
MzString white, token;
|
|
bool multiline = false;
|
|
|
|
read_white_space(outs, strm);
|
|
while( eq_word(state, strm) ) {
|
|
if( !next_token(white, token, strm) ||
|
|
(end && strcmp(token.c_str(), end) == 0) )
|
|
{
|
|
state << white << token;
|
|
break;
|
|
}
|
|
push_token(white, token, strm);
|
|
if( !token.compare("atop") || !token.compare("over") )
|
|
outs << '{' << state << '}';
|
|
else {
|
|
if( !token.compare("#") )
|
|
multiline = true;
|
|
outs << state;
|
|
}
|
|
state = nullptr;
|
|
read_white_space(outs, strm);
|
|
}
|
|
outs << state;
|
|
return multiline;
|
|
}
|
|
|
|
static char eq2ltxconv(MzString& sstr, istream *strm, const char *sentinel)
|
|
{
|
|
MzString white, token;
|
|
char key[256];
|
|
std::istream::int_type ch;
|
|
int result;
|
|
|
|
while( 0 != (result = next_token(white, token, strm)) ) {
|
|
if( sentinel && (result == 1) && strchr(sentinel, token[0]) )
|
|
break;
|
|
make_keyword(key, token);
|
|
const hwpeq *eq = nullptr;
|
|
if( (eq = lookup_eqn(key)) != nullptr ) {
|
|
if( eq->latex )
|
|
strcpy(key, eq->latex);
|
|
else {
|
|
key[0] = '\\';
|
|
strcpy(key + 1, eq->key);
|
|
}
|
|
if( (eq->flag & EQ_CASE)
|
|
&& rtl::isAsciiUpperCase(static_cast<unsigned char>(token[0])) )
|
|
key[1] = sal::static_int_cast<char>(
|
|
rtl::toAsciiUpperCase(static_cast<unsigned char>(key[1])));
|
|
token = key;
|
|
}
|
|
|
|
if( token[0] == '{' ) { // grouping
|
|
sstr << white << token;
|
|
eq2ltxconv(sstr, strm, "}");
|
|
sstr << '}';
|
|
}
|
|
else if( eq && (eq->flag & EQ_ENV) ) {
|
|
next_token(white, token, strm);
|
|
if( token[0] != '{' )
|
|
return 0;
|
|
sstr << "\\begin" << "{" << eq->key << "}" << ENDL ;
|
|
eq2ltxconv(sstr, strm, "}");
|
|
if( sstr[sstr.length() - 1] != '\n' )
|
|
sstr << ENDL ;
|
|
sstr << "\\end" << "{" << eq->key << "}" << ENDL ;
|
|
}
|
|
else if( eq && (eq->flag & EQ_ATOP) ) {
|
|
if( sstr.length() == 0 )
|
|
sstr << '{';
|
|
else {
|
|
int pos = sstr.rfind('}');
|
|
if( 0 < pos)
|
|
sstr.replace(pos, ' ');
|
|
}
|
|
sstr << token;
|
|
while( (ch = strm->get()) != std::istream::traits_type::eof()
|
|
&& IS_WS(ch) )
|
|
sstr << static_cast<char>(ch);
|
|
if( ch != '{' )
|
|
sstr << "{}";
|
|
else {
|
|
eq2ltxconv(sstr, strm, "}");
|
|
sstr << '}';
|
|
}
|
|
}
|
|
else
|
|
sstr << white << token;
|
|
}
|
|
return token[0];
|
|
}
|
|
|
|
void eq2latex(MzString& outs, char const *s)
|
|
{
|
|
assert(s);
|
|
if( stk == nullptr )
|
|
stk = new eq_stack;
|
|
|
|
MzString tstr;
|
|
|
|
istringstream tstrm(s);
|
|
bool eqnarray = eq_sentence(tstr, &tstrm);
|
|
istringstream strm(tstr.c_str());
|
|
|
|
if( eqnarray )
|
|
outs << "\\begin{array}{rllll}" << ENDL;
|
|
eq2ltxconv(outs, &strm, nullptr);
|
|
outs << ENDL;
|
|
if( eqnarray )
|
|
outs << "\\end{array}" << ENDL;
|
|
delete stk;
|
|
stk = nullptr;
|
|
}
|
|
|
|
/* vim:set shiftwidth=4 softtabstop=4 expandtab: */
|