This addresses some cppcheck warnings. Change-Id: I9812658e8a96dd35d686c7ae7a8b829267c5c8bc Reviewed-on: https://gerrit.libreoffice.org/13499 Reviewed-by: Noel Grandin <noelgrandin@gmail.com> Tested-by: Noel Grandin <noelgrandin@gmail.com>
757 lines
24 KiB
C++
757 lines
24 KiB
C++
/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
|
|
/*
|
|
* This file is part of the LibreOffice project.
|
|
*
|
|
* This Source Code Form is subject to the terms of the Mozilla Public
|
|
* License, v. 2.0. If a copy of the MPL was not distributed with this
|
|
* file, You can obtain one at http://mozilla.org/MPL/2.0/.
|
|
*
|
|
* This file incorporates work covered by the following license notice:
|
|
*
|
|
* Licensed to the Apache Software Foundation (ASF) under one or more
|
|
* contributor license agreements. See the NOTICE file distributed
|
|
* with this work for additional information regarding copyright
|
|
* ownership. The ASF licenses this file to you under the Apache
|
|
* License, Version 2.0 (the "License"); you may not use this file
|
|
* except in compliance with the License. You may obtain a copy of
|
|
* the License at http://www.apache.org/licenses/LICENSE-2.0 .
|
|
*/
|
|
|
|
#include <assert.h>
|
|
#include <stdio.h>
|
|
#include <string.h>
|
|
#include <ctype.h>
|
|
|
|
// DVO: always use standard headers:
|
|
#include <istream>
|
|
#include <sstream>
|
|
using namespace std;
|
|
|
|
#include "mzstring.h"
|
|
#include "hwpeq.h"
|
|
#include <sal/types.h>
|
|
#include <sal/macros.h>
|
|
|
|
/* @Man: hwp수식을 LaTeX으로 바꾸기 */
|
|
#ifdef WIN32
|
|
# define ENDL "\r\n"
|
|
#else /* !WIN32 */
|
|
# define ENDL "\n"
|
|
#endif
|
|
|
|
#define WS " \t\r\n\v\f"
|
|
|
|
#define EQ_CASE 0x01 // case sensitive cmd
|
|
#define EQ_ENV 0x02 // equiv to latex environment
|
|
#define EQ_ATOP 0x04 // must revert order
|
|
|
|
#define IS_WS(ch) (strchr(WS, ch))
|
|
#define IS_BINARY(ch) (strchr("+-<=>", ch))
|
|
|
|
#ifdef WIN32
|
|
#define STRICMP stricmp
|
|
#else
|
|
#define STRICMP strcasecmp
|
|
#endif
|
|
|
|
// sub and sup scipt script status
|
|
enum { SCRIPT_NONE, SCRIPT_SUB, SCRIPT_SUP, SCRIPT_ALL};
|
|
|
|
static int eq_word(MzString& outs, istream *strm, int script = SCRIPT_NONE);
|
|
static bool eq_sentence(MzString& outs, istream *strm, const char *end = 0);
|
|
|
|
struct hwpeq {
|
|
const char *key; // hwp math keyword
|
|
const char *latex; // corresponding latex keywork
|
|
int nargs; // # of argument
|
|
unsigned char flag; // case sensitive?
|
|
};
|
|
|
|
static const hwpeq eq_tbl[] = {
|
|
{ "!=", "\\equiv ", 0, 0 },
|
|
{ "#", "\\\\", 0, 0 },
|
|
{ "+-", "\\pm ", 0, 0 },
|
|
{ "-+", "\\mp ", 0, 0 },
|
|
{ "<=", "\\leq ", 0, 0 },
|
|
{ "==", "\\equiv ", 0, 0 },
|
|
{ ">=", "\\geq ", 0, 0 },
|
|
{ "Pr", NULL, 0, 0 },
|
|
{ "^", "^", 1, 0 },
|
|
{ "_", "_", 1, 0 },
|
|
{ "`", "\\;", 0, 0 },
|
|
{ "acute", NULL, 1, 0 },
|
|
{ "aleph", NULL, 0, 0 },
|
|
{ "alpha", NULL, 0, EQ_CASE },
|
|
{ "amalg", NULL, 0, 0 },
|
|
{ "and", NULL, 0, 0 },
|
|
{ "angle", NULL, 0, 0 },
|
|
{ "angstrom", NULL, 0, 0 },
|
|
{ "approx", NULL, 0, 0 },
|
|
{ "arc", NULL, 0, 0 },
|
|
{ "arccos", NULL, 0, 0 },
|
|
{ "arch", NULL, 0, 0 },
|
|
{ "arcsin", NULL, 0, 0 },
|
|
{ "arctan", NULL, 0, 0 },
|
|
{ "arg", NULL, 0, 0 },
|
|
{ "assert", "\\vdash", 0, 0 },
|
|
{ "ast", NULL, 0, 0 },
|
|
{ "asymp", NULL, 0, 0 },
|
|
{ "atop", NULL, 1, EQ_ATOP },
|
|
{ "backslash", NULL, 0, 0 },
|
|
{ "bar", NULL, 1, 0 },
|
|
{ "because", NULL, 0, 0 },
|
|
{ "beta", NULL, 0, EQ_CASE },
|
|
{ "big", NULL, 0, EQ_CASE },
|
|
{ "bigcap", NULL, 0, 0 },
|
|
{ "bigcirc", NULL, 0, 0 },
|
|
{ "bigcup", NULL, 0, 0 },
|
|
{ "bigg", NULL, 0, EQ_CASE },
|
|
{ "bigodiv", NULL, 0, 0 },
|
|
{ "bigodot", NULL, 0, 0 },
|
|
{ "bigominus", NULL, 0, 0 },
|
|
{ "bigoplus", NULL, 0, 0 },
|
|
{ "bigotimes", NULL, 0, 0 },
|
|
{ "bigsqcap", NULL, 0, 0 },
|
|
{ "bigsqcup", NULL, 0, 0 },
|
|
{ "biguplus", NULL, 0, 0 },
|
|
{ "bigvee", NULL, 0, 0 },
|
|
{ "bigwedge", NULL, 0, 0 },
|
|
{ "binom", NULL, 2, 0 },
|
|
{ "bmatrix", NULL, 0, EQ_ENV },
|
|
{ "bold", NULL, 0, 0 },
|
|
{ "bot", NULL, 0, 0 },
|
|
{ "breve", NULL, 1, 0 },
|
|
{ "buildrel", NULL, 0, 0 }, // LATER
|
|
{ "bullet", NULL, 0, 0 },
|
|
{ "cap", NULL, 0, 0 },
|
|
{ "cases", NULL, 0, EQ_ENV },
|
|
{ "ccol", NULL, 0, 0 }, /* 세로로 가운데 */
|
|
{ "cdot", NULL, 0, 0 },
|
|
{ "cdots", NULL, 0, 0 },
|
|
{ "check", NULL, 1, 0 },
|
|
{ "chi", NULL, 0, EQ_CASE },
|
|
{ "choose", NULL, 0, EQ_ATOP },
|
|
{ "circ", NULL, 0, 0 },
|
|
{ "col", NULL, 0, 0 }, // LATER
|
|
{ "cong", NULL, 0, 0 },
|
|
{ "coprod", NULL, 0, 0 },
|
|
{ "cos", NULL, 0, 0 },
|
|
{ "cosec", NULL, 0, 0 },
|
|
{ "cosh", NULL, 0, 0 },
|
|
{ "cot", NULL, 0, 0 },
|
|
{ "coth", NULL, 0, 0 },
|
|
{ "cpile", NULL, 0, 0 }, // LATER
|
|
{ "csc", NULL, 0, 0 },
|
|
{ "cup", NULL, 0, 0 },
|
|
{ "dagger", NULL, 0, 0 },
|
|
{ "dashv", NULL, 0, 0 },
|
|
{ "ddagger", NULL, 0, 0 },
|
|
{ "ddot", NULL, 1, 0 },
|
|
{ "ddots", NULL, 0, 0 },
|
|
{ "def", NULL, 0, 0 },
|
|
{ "deg", NULL, 0, 0 },
|
|
{ "del", NULL, 0, 0 },
|
|
{ "delta", NULL, 0, EQ_CASE },
|
|
{ "diamond", NULL, 0, 0 },
|
|
{ "dim", NULL, 0, 0 },
|
|
{ "div", NULL, 0, 0 },
|
|
{ "divide", NULL, 0, 0 },
|
|
{ "dline", NULL, 0, 0 },
|
|
{ "dmatrix", NULL, 0, EQ_ENV },
|
|
{ "dot", NULL, 1, 0 },
|
|
{ "doteq", NULL, 0, 0 },
|
|
{ "dotsaxis", NULL, 0, 0 },
|
|
{ "dotsdiag", NULL, 0, 0 },
|
|
{ "dotslow", "\\ldots", 0, 0 },
|
|
{ "dotsvert", "\\vdots", 0, 0 },
|
|
{ "downarrow", NULL, 0, EQ_CASE },
|
|
{ "dsum", "+", 0, 0 },
|
|
{ "dyad", NULL, 0, 0 }, // LATER
|
|
{ "ell", NULL, 0, 0 },
|
|
{ "emptyset", NULL, 0, 0 },
|
|
{ "epsilon", NULL, 0, EQ_CASE },
|
|
{ "eqalign", NULL, 0, EQ_ENV },
|
|
{ "equiv", NULL, 0, 0 },
|
|
{ "eta", NULL, 0, EQ_CASE },
|
|
{ "exarrow", NULL, 0, 0 },
|
|
{ "exist", "\\exists", 0, 0 },
|
|
{ "exists", NULL, 0, 0 },
|
|
{ "exp", NULL, 0, EQ_CASE },
|
|
{ "for", NULL, 0, 0 },
|
|
{ "forall", NULL, 0, 0 },
|
|
{ "from", "_", 1, 0 },
|
|
{ "gamma", NULL, 0, EQ_CASE },
|
|
{ "gcd", NULL, 0, 0 },
|
|
{ "ge", "\\geq", 0, 0 },
|
|
{ "geq", NULL, 0, 0 },
|
|
{ "ggg", NULL, 0, 0 },
|
|
{ "grad", NULL, 0, 0 },
|
|
{ "grave", NULL, 1, 0 },
|
|
{ "hat", "\\widehat", 1, 0 },
|
|
{ "hbar", NULL, 0, 0 },
|
|
{ "hom", NULL, 0, 0 },
|
|
{ "hookleft", NULL, 0, 0 },
|
|
{ "hookright", NULL, 0, 0 },
|
|
{ "identical", NULL, 0, 0 }, // LATER
|
|
{ "if", NULL, 0, 0 },
|
|
{ "imag", NULL, 0, 0 },
|
|
{ "image", NULL, 0, 0 },
|
|
{ "imath", NULL, 0, 0 },
|
|
{ "in", NULL, 0, 0 },
|
|
{ "inf", "\\infty", 0, 0 },
|
|
{ "infinity", "\\infty", 0, 0 },
|
|
{ "infty", NULL, 0, 0 },
|
|
{ "int", NULL, 0, 0 },
|
|
{ "integral", "\\int", 0, 0 },
|
|
{ "inter", "\\bigcap", 0, 0 },
|
|
{ "iota", NULL, 0, EQ_CASE },
|
|
{ "iso", NULL, 0, 0 }, // ams
|
|
{ "it", NULL, 0, 0 },
|
|
{ "jmath", NULL, 0, 0 },
|
|
{ "kappa", NULL, 0, EQ_CASE },
|
|
{ "ker", NULL, 0, 0 },
|
|
{ "lambda", NULL, 0, EQ_CASE },
|
|
{ "land", NULL, 0, 0 }, // LATER
|
|
{ "langle", NULL, 0, 0 },
|
|
{ "larrow", "\\leftarrow", 0, EQ_CASE },
|
|
{ "lbrace", NULL, 0, 0 },
|
|
{ "lbrack", "[", 0, 0 },
|
|
{ "lceil", NULL, 0, 0 },
|
|
{ "lcol", NULL, 0, 0 }, // LATER
|
|
{ "ldots", NULL, 0, 0 },
|
|
{ "le", NULL, 0, 0 },
|
|
{ "left", NULL, 0, 0 },
|
|
{ "leftarrow", NULL, 0, EQ_CASE },
|
|
{ "leq", NULL, 0, 0 },
|
|
{ "lfloor", NULL, 0, 0 },
|
|
{ "lg", NULL, 0, 0 },
|
|
{ "lim", NULL, 0, EQ_CASE },
|
|
{ "line", "\\vert", 0, 0 },
|
|
{ "liter", "\\ell", 0, 0 },
|
|
{ "lll", NULL, 0, 0 }, // ams
|
|
{ "ln", NULL, 0, 0 },
|
|
{ "log", NULL, 0, 0 },
|
|
{ "lor", "\\vee", 0, 0 },
|
|
{ "lparen", "(", 0, 0 },
|
|
{ "lpile", NULL, 0, 0 }, // LATER
|
|
{ "lrarrow", "\\leftrightarrow", 0, EQ_CASE },
|
|
{ "lrharpoons", "\\leftrightharpoons",0, 0 },
|
|
{ "mapsto", NULL, 0, 0 },
|
|
{ "massert", "\\dashv", 0, 0 },
|
|
{ "matrix", NULL, 0, EQ_ENV },
|
|
{ "max", NULL, 0, 0 },
|
|
{ "mho", NULL, 0, 0 }, // ams
|
|
{ "min", NULL, 0, 0 },
|
|
{ "minusplus", NULL, 0, 0 },
|
|
{ "mit", "", 0, 0 }, // font
|
|
{ "mod", "\\bmod", 0, 0 },
|
|
{ "models", NULL, 0, 0 },
|
|
{ "msangle", NULL, 0, 0 }, // LATER
|
|
{ "mu", NULL, 0, EQ_CASE },
|
|
{ "nabla", NULL, 0, 0 },
|
|
{ "ne", NULL, 0, 0 },
|
|
{ "nearrow", NULL, 0, 0 },
|
|
{ "neg", NULL, 0, 0 },
|
|
{ "neq", NULL, 0, 0 },
|
|
{ "nequiv", NULL, 0, 0 },
|
|
{ "ni", NULL, 0, 0 },
|
|
{ "not", NULL, 0, 0 },
|
|
{ "notin", NULL, 0, 0 },
|
|
{ "nu", NULL, 0, EQ_CASE },
|
|
{ "nwarrow", NULL, 0, 0 },
|
|
{ "odiv", NULL, 0, 0 },
|
|
{ "odot", NULL, 0, 0 },
|
|
{ "oint", NULL, 0, 0 },
|
|
{ "omega", NULL, 0, EQ_CASE },
|
|
{ "omicron", NULL, 0, EQ_CASE },
|
|
{ "ominus", NULL, 0, 0 },
|
|
{ "oplus", NULL, 0, 0 },
|
|
{ "or ", NULL, 0, 0 },
|
|
{ "oslash", NULL, 0, 0 },
|
|
{ "otimes", NULL, 0, 0 },
|
|
{ "over", NULL, 1, EQ_ATOP },
|
|
{ "overline", NULL, 1, 0 },
|
|
{ "owns", "\\ni", 0, 0 },
|
|
{ "parallel", NULL, 0, 0 },
|
|
{ "partial", NULL, 0, 0 },
|
|
{ "phantom", NULL, 0, 0 },
|
|
{ "phi", NULL, 0, EQ_CASE },
|
|
{ "pi", NULL, 0, EQ_CASE },
|
|
{ "pile", NULL, 0, 0 }, // LATER
|
|
{ "plusminus", "\\pm", 0, 0 },
|
|
{ "pmatrix", NULL, 0, EQ_ENV },
|
|
{ "prec", NULL, 0, 0 },
|
|
{ "prep", NULL, 0, 0 },
|
|
{ "prime", NULL, 0, 0 },
|
|
{ "prod", NULL, 0, 0 },
|
|
{ "propto", NULL, 0, 0 },
|
|
{ "psi", NULL, 0, EQ_CASE },
|
|
{ "rangle", NULL, 0, 0 },
|
|
{ "rarrow", "\\rightarrow", 0, EQ_CASE },
|
|
{ "rbrace", "]", 0, 0 },
|
|
{ "rbrace", NULL, 0, 0 },
|
|
{ "rceil", NULL, 0, 0 },
|
|
{ "rcol", NULL, 0, 0 }, // LATER
|
|
{ "real", "\\Re", 0, 0 },
|
|
{ "reimage", NULL, 0, 0 },
|
|
{ "rel", NULL, 0, 0 },
|
|
{ "rfloor", NULL, 0, 0 },
|
|
{ "rho", NULL, 0, EQ_CASE },
|
|
{ "right", NULL, 0, 0 },
|
|
{ "rightarrow", NULL, 0, EQ_CASE },
|
|
{ "rlharpoons", NULL, 0, 0 },
|
|
{ "rm", NULL, 0, 0 },
|
|
{ "root", "\\sqrt", 1, 0 },
|
|
{ "rparen", ")", 0, 0 },
|
|
{ "rpile", NULL, 0, 0 }, // LATER
|
|
{ "rtangle", NULL, 0, 0 },
|
|
{ "sangle", NULL, 0, 0 },
|
|
{ "scale", NULL, 0, 0 },
|
|
{ "searrow", NULL, 0, 0 },
|
|
{ "sec", NULL, 0, 0 },
|
|
{ "sigma", NULL, 0, EQ_CASE },
|
|
{ "sim", NULL, 0, 0 },
|
|
{ "simeq", NULL, 0, 0 },
|
|
{ "sin", NULL, 0, 0 },
|
|
{ "sinh", NULL, 0, 0 },
|
|
{ "slash", NULL, 0, 0 },
|
|
{ "smallint", NULL, 0, 0 },
|
|
{ "smallinter", NULL, 0, 0 },
|
|
{ "smalloint", NULL, 0, 0 },
|
|
{ "smallprod", NULL, 0, 0 },
|
|
{ "smallsum", NULL, 0, 0 },
|
|
{ "smallunion", NULL, 0, 0 },
|
|
{ "smcoprod", NULL, 0, 0 },
|
|
{ "sqcap", NULL, 0, 0 },
|
|
{ "sqcup", NULL, 0, 0 },
|
|
{ "sqrt", NULL, 1, 0 },
|
|
{ "sqsubset", NULL, 0, 0 },
|
|
{ "sqsubseteq", NULL, 0, 0 },
|
|
{ "sqsupset", NULL, 0, 0 },
|
|
{ "sqsupseteq", NULL, 0, 0 },
|
|
{ "star", NULL, 0, 0 },
|
|
{ "sub", "_", 0, 0 },
|
|
{ "subset", NULL, 0, 0 },
|
|
{ "subseteq", NULL, 0, 0 },
|
|
{ "succ", NULL, 0, 0 },
|
|
{ "sum", NULL, 0, 0 },
|
|
{ "sup", "^", 0, 0 },
|
|
{ "superset", NULL, 0, 0 },
|
|
{ "supset", NULL, 0, 0 },
|
|
{ "supseteq", NULL, 0, 0 },
|
|
{ "swarrow", NULL, 0, 0 },
|
|
{ "tan", NULL, 0, 0 },
|
|
{ "tanh", NULL, 0, 0 },
|
|
{ "tau", NULL, 0, EQ_CASE },
|
|
{ "therefore", NULL, 0, 0 },
|
|
{ "theta", NULL, 0, EQ_CASE },
|
|
{ "tilde", "\\widetilde", 1, 0 },
|
|
{ "times", NULL, 0, 0 },
|
|
{ "to", "^", 1, 0 },
|
|
{ "top", NULL, 0, 0 },
|
|
{ "triangle", NULL, 0, 0 },
|
|
{ "triangled", NULL, 0, 0 },
|
|
{ "trianglel", NULL, 0, 0 },
|
|
{ "triangler", NULL, 0, 0 },
|
|
{ "triangleu", NULL, 0, 0 },
|
|
{ "udarrow", "\\updownarrow",0, EQ_CASE },
|
|
{ "under", "\\underline", 1, 0 },
|
|
{ "underline", "\\underline", 1, 0 },
|
|
{ "union", "\\bigcup", 0, 0 },
|
|
{ "uparrow", NULL, 0, EQ_CASE },
|
|
{ "uplus", NULL, 0, 0 },
|
|
{ "upsilon", NULL, 0, EQ_CASE },
|
|
{ "varepsilon", NULL, 0, 0 },
|
|
{ "varphi", NULL, 0, 0 },
|
|
{ "varpi", NULL, 0, 0 },
|
|
{ "varrho", NULL, 0, 0 },
|
|
{ "varsigma", NULL, 0, 0 },
|
|
{ "vartheta", NULL, 0, 0 },
|
|
{ "varupsilon", NULL, 0, 0 },
|
|
{ "vdash", NULL, 0, 0 },
|
|
{ "vdots", NULL, 0, 0 },
|
|
{ "vec", NULL, 1, 0 },
|
|
{ "vee", NULL, 0, 0 },
|
|
{ "vert", NULL, 0, 0 },
|
|
{ "wedge", NULL, 0, 0 },
|
|
{ "wp", NULL, 0, 0 },
|
|
{ "xi", NULL, 0, EQ_CASE },
|
|
{ "xor", NULL, 0, 0 },
|
|
{ "zeta", NULL, 0, EQ_CASE }
|
|
};
|
|
|
|
static const hwpeq *lookup_eqn(char *str)
|
|
{
|
|
static const int eqCount = SAL_N_ELEMENTS(eq_tbl);
|
|
int l = 0, r = eqCount;
|
|
const hwpeq *result = 0;
|
|
|
|
while( l < r ) {
|
|
const int m = (l + r) / 2;
|
|
const int k = strcmp(eq_tbl[m].key, str);
|
|
if( k == 0 ) {
|
|
result = eq_tbl + m;
|
|
break;
|
|
}
|
|
else if( k < 0 )
|
|
l = m + 1;
|
|
else
|
|
r = m;
|
|
}
|
|
return result;
|
|
}
|
|
|
|
/* 첫자만 대문자이거나 전부 대문자면 소문자로 바꾼다. */
|
|
void make_keyword( char *keyword, const char *token)
|
|
{
|
|
char* ptr;
|
|
bool result = true;
|
|
int len = strlen(token);
|
|
assert(keyword);
|
|
|
|
if( 255 < len )
|
|
{
|
|
len = 255;
|
|
}
|
|
memcpy(keyword, token, len);
|
|
keyword[len] = 0;
|
|
|
|
if( (token[0] & 0x80) || islower(token[0]) || strlen(token) < 2 )
|
|
return;
|
|
|
|
int capital = isupper(keyword[1]);
|
|
for( ptr = keyword + 2; *ptr && result; ptr++ )
|
|
{
|
|
if( (*ptr & 0x80) ||
|
|
(!capital && isupper(*ptr)) ||
|
|
(capital && islower(*ptr)) )
|
|
{
|
|
result = false;
|
|
}
|
|
}
|
|
|
|
if( result )
|
|
{
|
|
ptr = keyword;
|
|
while( *ptr )
|
|
{
|
|
if( isupper(*ptr) )
|
|
*ptr = sal::static_int_cast<char>(tolower(*ptr));
|
|
ptr++;
|
|
}
|
|
}
|
|
return;
|
|
}
|
|
|
|
// token reading function
|
|
struct eq_stack {
|
|
MzString white;
|
|
MzString token;
|
|
istream *strm;
|
|
|
|
eq_stack() { strm = 0; };
|
|
bool state(istream *s) {
|
|
if( strm != s) { white = 0; token = 0; }
|
|
return token.length() != 0;
|
|
}
|
|
};
|
|
|
|
static eq_stack *stk = 0;
|
|
|
|
void push_token(MzString &white, MzString &token, istream *strm)
|
|
{
|
|
// one time stack
|
|
assert(stk->state(strm) == false);
|
|
|
|
stk->white = white;
|
|
stk->token = token;
|
|
stk->strm = strm;
|
|
}
|
|
|
|
/*
|
|
읽은 토큰의 길이를 반환한다.
|
|
*/
|
|
/* control char, control sequence, binary sequence,
|
|
alphabet string, sigle character */
|
|
static int next_token(MzString &white, MzString &token, istream *strm)
|
|
{
|
|
int ch = 0;
|
|
|
|
if( stk->state(strm) ) {
|
|
white = stk->white;
|
|
token = stk->token;
|
|
stk->token = 0;
|
|
stk->white = 0;
|
|
return token.length();
|
|
}
|
|
|
|
token = 0;
|
|
white = 0;
|
|
if( !strm->good() || (ch = strm->get()) == EOF )
|
|
return 0;
|
|
|
|
// read preceding ws
|
|
if( IS_WS(ch) ) {
|
|
do white << (char) ch;
|
|
while( IS_WS(ch = strm->get()) );
|
|
}
|
|
|
|
if( ch == '\\' || ch & 0x80 || isalpha(ch) ) {
|
|
if( ch == '\\' ) {
|
|
token << (char) ch;
|
|
ch = strm->get();
|
|
}
|
|
do {
|
|
token << (char) ch;
|
|
ch = strm->get();
|
|
} while( ch != EOF && (ch & 0x80 || isalpha(ch)) ) ;
|
|
strm->putback(sal::static_int_cast<char>(ch));
|
|
/* sub, sub, over, atop 특수 처리
|
|
그 이유는 next_state()에 영향을 미치기 때문이다.
|
|
*/
|
|
if( !STRICMP("sub", token) || !STRICMP("from", token) ||
|
|
!STRICMP("sup", token) || !STRICMP("to", token) ||
|
|
!STRICMP("over", token) || !STRICMP("atop", token) ||
|
|
!STRICMP("left", token) || !STRICMP("right", token) )
|
|
{
|
|
char buf[256];
|
|
make_keyword(buf, token);
|
|
token = buf;
|
|
}
|
|
if( !token.compare("sub") || !token.compare("from") )
|
|
token = "_";
|
|
if( !token.compare("sup") || !token.compare("to") )
|
|
token = "^";
|
|
}
|
|
else if( IS_BINARY(ch) ) {
|
|
do token << (char) ch;
|
|
while( IS_BINARY(ch = strm->get()) );
|
|
strm->putback(sal::static_int_cast<char>(ch));
|
|
}
|
|
else if( isdigit(ch) ) {
|
|
do token << (char) ch;
|
|
while( isdigit(ch = strm->get()) );
|
|
strm->putback(sal::static_int_cast<char>(ch));
|
|
}
|
|
else
|
|
token << (char) ch;
|
|
|
|
return token.length();
|
|
}
|
|
|
|
static int read_white_space(MzString& outs, istream *strm)
|
|
{
|
|
int result;
|
|
|
|
if( stk->state(strm) ) {
|
|
outs << stk->white;
|
|
stk->white = 0;
|
|
result = stk->token[0];
|
|
}
|
|
else {
|
|
int ch;
|
|
while( IS_WS(ch = strm->get()) )
|
|
outs << (char )ch;
|
|
strm->putback(sal::static_int_cast<char>(ch));
|
|
result = ch;
|
|
}
|
|
return result;
|
|
}
|
|
|
|
/* 인수가 필요하지 않은 경우 각 항목간의 구분은 space와 brace
|
|
sqrt {ab}c = sqrt{ab} c
|
|
(, }는 grouping
|
|
^, _ 는 앞뒤로 결합한다.
|
|
|
|
sqrt 등과 같이 인수가 있는 형식 정리
|
|
sqrt a -> sqrt{a}
|
|
sqrt {a} -> sqrt{a}
|
|
1 이상의 인수가 있는 경우 인수들간의 역백은 없앤다.
|
|
\frac a b -> frac{a}{b}
|
|
over의 형식 정리
|
|
a over b -> {a}over{b}
|
|
*/
|
|
|
|
static int eq_word(MzString& outs, istream *strm, int status)
|
|
{
|
|
MzString token, white, state;
|
|
int result;
|
|
char keyword[256];
|
|
const hwpeq *eq;
|
|
|
|
next_token(white, token, strm);
|
|
if (token.length() <= 0)
|
|
return 0;
|
|
result = token[0];
|
|
|
|
if( token.compare("{") == 0 ) {
|
|
state << white << token;
|
|
eq_sentence(state, strm, "}");
|
|
}
|
|
else if( token.compare("left") == 0 ) {
|
|
state << white << token;
|
|
next_token(white, token, strm);
|
|
state << white << token;
|
|
|
|
eq_sentence(state, strm, "right");
|
|
|
|
next_token(white, token, strm);
|
|
state << white << token;
|
|
}
|
|
else {
|
|
/* 정상적인 token */
|
|
int script_status = SCRIPT_NONE;
|
|
while( true ) {
|
|
state << white << token;
|
|
make_keyword(keyword, token);
|
|
if( token[0] == '^' )
|
|
script_status |= SCRIPT_SUP;
|
|
else if( token[0] == '_' )
|
|
script_status |= SCRIPT_SUB;
|
|
else
|
|
script_status = SCRIPT_NONE;
|
|
|
|
if( 0 != (eq = lookup_eqn(keyword)) ) {
|
|
int nargs = eq->nargs;
|
|
while( nargs-- ) {
|
|
const int ch = read_white_space(state, strm);
|
|
if( ch != '{' ) state << '{';
|
|
eq_word(state, strm, script_status);
|
|
if( ch != '{' ) state << '}';
|
|
}
|
|
}
|
|
|
|
if( !next_token(white, token, strm) )
|
|
break;
|
|
// end loop and restart with this
|
|
if( (token[0] == '^' && status && !(status & SCRIPT_SUP)) ||
|
|
(token[0] == '_' && status && !(status & SCRIPT_SUB)) ||
|
|
strcmp("over", token) == 0 || strcmp("atop", token) == 0 ||
|
|
strchr("{}#&`", token[0]) ||
|
|
(!strchr("^_", token[0]) && white.length()) )
|
|
{
|
|
push_token(white, token, strm);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
outs << state;
|
|
|
|
return result;
|
|
}
|
|
|
|
static bool eq_sentence(MzString& outs, istream *strm, const char *end)
|
|
{
|
|
MzString state;
|
|
MzString white, token;
|
|
bool multiline = false;
|
|
|
|
read_white_space(outs, strm);
|
|
while( eq_word(state, strm) ) {
|
|
if( !next_token(white, token, strm) ||
|
|
(end && strcmp(token.c_str(), end) == 0) )
|
|
{
|
|
state << white << token;
|
|
break;
|
|
}
|
|
push_token(white, token, strm);
|
|
if( !token.compare("atop") || !token.compare("over") )
|
|
outs << '{' << state << '}';
|
|
else {
|
|
if( !token.compare("#") )
|
|
multiline = true;
|
|
outs << state;
|
|
}
|
|
state = 0;
|
|
read_white_space(outs, strm);
|
|
}
|
|
outs << state;
|
|
return multiline;
|
|
}
|
|
|
|
static char eq2ltxconv(MzString& sstr, istream *strm, const char *sentinel)
|
|
{
|
|
MzString white, token;
|
|
char key[256];
|
|
int ch, result;
|
|
const hwpeq *eq = 0;
|
|
|
|
while( 0 != (result = next_token(white, token, strm)) ) {
|
|
if( sentinel && (result == 1) && strchr(sentinel, token[0]) )
|
|
break;
|
|
make_keyword(key, token);
|
|
if( (eq = lookup_eqn(key)) != 0 ) {
|
|
if( eq->latex )
|
|
strcpy(key, eq->latex);
|
|
else {
|
|
key[0] = '\\';
|
|
strcpy(key + 1, eq->key);
|
|
}
|
|
if( (eq->flag & EQ_CASE) && isupper(token[0]) )
|
|
key[1] = sal::static_int_cast<char>(toupper(key[1]));
|
|
token = key;
|
|
}
|
|
|
|
if( token[0] == '{' ) { // grouping
|
|
sstr << white << token;
|
|
eq2ltxconv(sstr, strm, "}");
|
|
sstr << '}';
|
|
}
|
|
else if( eq && (eq->flag & EQ_ENV) ) {
|
|
next_token(white, token, strm);
|
|
if( token[0] != '{' )
|
|
return 0;
|
|
sstr << "\\begin" << "{" << eq->key << "}" << ENDL ;
|
|
eq2ltxconv(sstr, strm, "}");
|
|
if( sstr[sstr.length() - 1] != '\n' )
|
|
sstr << ENDL ;
|
|
sstr << "\\end" << "{" << eq->key << "}" << ENDL ;
|
|
}
|
|
else if( eq && (eq->flag & EQ_ATOP) ) {
|
|
if( sstr.length() == 0 )
|
|
sstr << '{';
|
|
else {
|
|
int pos = sstr.rfind('}');
|
|
if( 0 < pos)
|
|
sstr.replace(pos, ' ');
|
|
}
|
|
sstr << token;
|
|
while( (ch = strm->get()) != EOF && IS_WS(ch) )
|
|
sstr << (char)ch;
|
|
if( ch != '{' )
|
|
sstr << "{}";
|
|
else {
|
|
eq2ltxconv(sstr, strm, "}");
|
|
sstr << '}';
|
|
}
|
|
}
|
|
else
|
|
sstr << white << token;
|
|
}
|
|
return token[0];
|
|
}
|
|
|
|
void eq2latex(MzString& outs, char *s)
|
|
{
|
|
assert(s);
|
|
if( stk == 0 )
|
|
stk = new eq_stack;
|
|
|
|
MzString tstr;
|
|
|
|
istringstream tstrm(s);
|
|
bool eqnarray = eq_sentence(tstr, &tstrm);
|
|
istringstream strm(tstr.c_str());
|
|
|
|
if( eqnarray )
|
|
outs << "\\begin{array}{rllll}" << ENDL;
|
|
eq2ltxconv(outs, &strm, 0);
|
|
outs << ENDL;
|
|
if( eqnarray )
|
|
outs << "\\end{array}" << ENDL;
|
|
delete stk;
|
|
stk = 0;
|
|
}
|
|
|
|
/* vim:set shiftwidth=4 softtabstop=4 expandtab: */
|