/*
 * lexer.ll - part of abakus
 * Copyright (C) 2004, 2005 Michael Pyne <michael.pyne@kdemail.net>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 */
%option noyywrap
%{
#define YY_NO_UNPUT

#include <kdebug.h>

#include "node.h"
#include "function.h"
#include "parser.h"
#include "result.h"

int yyCurTokenPos;
int yyThisTokenLength;

int yyparse(void);
%}

DIGITS [0-9]+
HEX [0-9A-Fa-f]+
%%

 /* Always skip whitespace */
[ \t]* { yyCurTokenPos += yyThisTokenLength; yyThisTokenLength = yyleng; }

 /* Power operator */
"**" { 
    yyCurTokenPos += yyThisTokenLength;
    yyThisTokenLength = 2;
    return POWER;
}

"^" {
    yyCurTokenPos += yyThisTokenLength;
    yyThisTokenLength = 1;
    return POWER;
}

[sS][eE][tT] {
    yyCurTokenPos += yyThisTokenLength;
    yyThisTokenLength = 3;
    return SET;
}

[rR][eE][mM][oO][vV][eE] {
    yyCurTokenPos += yyThisTokenLength;
    yyThisTokenLength = 6;
    return REMOVE;
}

[dD][eE][rR][iI][vV] {
    yyCurTokenPos += yyThisTokenLength;
    yyThisTokenLength = 5;
    return DERIV;
}

 /* Read numbers of the form with at least the decimal point and trailing
 * digits, such as .32, -234.45, .0, etc.  Numbers are only read in the BEGIN
 * state.
 */
{DIGITS}*([\.,]{DIGITS}+)(e[-+]?{DIGITS}+)? {
    yyCurTokenPos += yyThisTokenLength;
    yyThisTokenLength = yyleng;
    return NUM;
}

 /* Read Hex */
0x({HEX}+)? {
    yyCurTokenPos += yyThisTokenLength;
    yyThisTokenLength = yyleng;
    return NUM;
}

 /* Read numbers with at least the integral part, such as +4234, -34e8, etc.
 * Numbers are only read in the BEGIN state.
 */
{DIGITS}+([\.,]{DIGITS}*)?(e[-+]?{DIGITS}+)? {
    yyCurTokenPos += yyThisTokenLength;
    yyThisTokenLength = yyleng;
    return NUM;
}

[nN][aA][nN] {
    yyCurTokenPos += yyThisTokenLength;
    yyThisTokenLength = yyleng;
    return NUM;
}

[iI][nN][fF] {
    yyCurTokenPos += yyThisTokenLength;
    yyThisTokenLength = yyleng;
    return NUM;
}

 /* This detects textual input, and if it isn't pre-declared by the parser (in
 * other words, if it isn't a function), then it is returned as an identifier.
 */
[a-zA-Z_][a-zA-Z_0-9]* {
    yyCurTokenPos += yyThisTokenLength;
    yyThisTokenLength = yyleng;

    if(FunctionManager::instance()->isFunction(yytext))
	return FN;
    else {
	return ID;
    }
}

 /* All other characters are returned as-is to the parser, who can accept or
 * reject it as needed.
 */
. {
    yyCurTokenPos += yyThisTokenLength;
    yyThisTokenLength = 1;
    return *yytext;
}

%%

class Lexer::Private
{
public:
    YY_BUFFER_STATE buffer;
    int lastToken, thisToken;
    int lastPos, thisPos;
    QString lastTokenData, thisTokenData;
};

/* Declared in function.h, implemented here in lexer.l since this is where
 * all the yy_*() functions and types are defined.
 */
Lexer::Lexer(const TQString &expr) :
    m_private(new Private)
{
    const char *exprString = expr.latin1();

    yyCurTokenPos = 0;
    yyThisTokenLength = 0;

    m_private->buffer = yy_scan_string(exprString ? exprString : "");
    m_private->lastToken = -1;
    m_private->lastPos = -1;

    m_private->thisToken = yylex();
    m_private->thisTokenData = QString(yytext);

    if(yyCurTokenPos != 0)
    {
	kdError() << "yyCurTokenPos should be 0!!\n";
    }

    m_private->thisPos = yyCurTokenPos;
}

Lexer::~Lexer()
{
    yy_delete_buffer(m_private->buffer);
    delete m_private;
}

bool Lexer::hasNext() const
{
    return m_private->thisToken > 0;
}

int Lexer::nextType()
{
    m_private->lastTokenData = m_private->thisTokenData;
    m_private->lastPos = m_private->thisPos;
    m_private->lastToken = m_private->thisToken;

    m_private->thisToken = yylex();
    m_private->thisTokenData = QString(yytext);
    m_private->thisPos = yyCurTokenPos;

    return m_private->lastToken;
}

TQString Lexer::tokenValue() const
{
    return m_private->lastTokenData;
}

int Lexer::tokenPos() const
{
    return m_private->lastPos;
}

/* Declared in function.h, implemented here in lexer.l since this is where
 * all the yy_*() functions and types are defined.
 */
Abakus::number_t parseString(const char *str)
{
    YY_BUFFER_STATE buffer = yy_scan_string(str);

    yyCurTokenPos = 0;
    yyThisTokenLength = 0;

    yyparse();
    yy_delete_buffer(buffer);

    if(Result::lastResult()->type() != Result::Value)
	return Abakus::number_t();

    return Result::lastResult()->result()->value();
}