summaryrefslogtreecommitdiffstats
path: root/kregexpeditor/emacsregexpconverter.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'kregexpeditor/emacsregexpconverter.cpp')
-rw-r--r--kregexpeditor/emacsregexpconverter.cpp253
1 files changed, 253 insertions, 0 deletions
diff --git a/kregexpeditor/emacsregexpconverter.cpp b/kregexpeditor/emacsregexpconverter.cpp
new file mode 100644
index 0000000..327d04c
--- /dev/null
+++ b/kregexpeditor/emacsregexpconverter.cpp
@@ -0,0 +1,253 @@
+/*
+ * Copyright (c) 2002-2004 Jesper K. Pedersen <[email protected]>
+ *
+ * This library is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Library General Public
+ * License version 2 as published by the Free Software Foundation.
+ *
+ * This library is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * Library General Public License for more details.
+ *
+ * You should have received a copy of the GNU Library General Public License
+ * along with this library; see the file COPYING.LIB. If not, write to
+ * the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
+ * Boston, MA 02110-1301, USA.
+ **/
+
+#include "emacsregexpconverter.h"
+#include "regexp.h"
+#include "altnregexp.h"
+#include "concregexp.h"
+#include "lookaheadregexp.h"
+#include "textrangeregexp.h"
+#include "textregexp.h"
+#include "compoundregexp.h"
+#include "dotregexp.h"
+#include "positionregexp.h"
+#include "repeatregexp.h"
+
+#include <kmessagebox.h>
+#include <klocale.h>
+bool EmacsRegExpConverter::canParse()
+{
+ return false;
+}
+
+QString EmacsRegExpConverter::toString( AltnRegExp* regexp, bool markSelection )
+{
+ QString res;
+
+ bool first = true;
+ RegExpList list = regexp->children();
+ for ( RegExpListIt it(list); *it; ++it ) {
+ if ( !first ) {
+ res += QString::fromLatin1("\\|");
+ }
+ first = false;
+ res += toStr( *it, markSelection );
+ }
+ return res;
+
+}
+
+QString EmacsRegExpConverter::toString( ConcRegExp* regexp, bool markSelection )
+{
+ QString res;
+
+ RegExpList list = regexp->children();
+ for ( RegExpListIt it(list); *it; ++it ) {
+ QString startPar = QString::fromLocal8Bit("");
+ QString endPar = QString::fromLocal8Bit("");
+ if ( (*it)->precedence() < regexp->precedence() ) {
+ startPar = QString::fromLatin1( "\\(" );
+ endPar = QString::fromLatin1( "\\)" );
+ }
+
+ res += startPar + toStr( *it, markSelection ) + endPar;
+ }
+
+ return res;
+
+}
+
+QString EmacsRegExpConverter::toString( LookAheadRegExp* /*regexp*/, bool /*markSelection*/ )
+{
+ static bool haveWarned = false;
+ if ( ! haveWarned ) {
+ KMessageBox::sorry( 0, i18n("Look ahead regular expressions not supported in Emacs style") );
+ haveWarned = true;
+ }
+
+ return QString::null;
+}
+
+QString EmacsRegExpConverter::toString( TextRangeRegExp* regexp, bool /*markSelection*/ )
+{
+ QString txt;
+
+ bool foundCarrot = false;
+ bool foundDash = false;
+ bool foundParenthesis = false;
+
+ // print the single characters, but keep "^" as the very
+ // last element of the characters.
+ QStringList chars = regexp->chars();
+ for (unsigned int i = 0; i< chars.count(); i++) {
+ if ( *chars.at(i) == QChar(']') ) {
+ foundParenthesis = true;
+ }
+ else if ( *chars.at(i) == QChar('-') ) {
+ foundDash = true;
+ }
+ else if ( *chars.at(i) == QChar('^') ) {
+ foundCarrot = true;
+ }
+ else {
+ txt.append( *chars.at(i) );
+ }
+ }
+
+ // Now insert the ranges.
+ QPtrList<StringPair> ranges = regexp->range();
+ for ( QPtrListIterator<StringPair> it(ranges); *it; ++it ) {
+ txt.append((*it)->first()+ QString::fromLatin1("-")+ (*it)->second());
+ }
+
+ // Ok, its time to build each part of the regexp, here comes the rule:
+ // if a ']' is one of the characters, then it must be the first one in the
+ // list (after then opening '[' and eventually negation '^')
+ // Next if a '-' is one of the characters, then it must come
+ // finally if '^' is one of the characters, then it must not be the first
+ // one!
+
+ QString res = QString::fromLatin1("[");
+
+ if ( regexp->negate() )
+ res.append(QString::fromLatin1("^"));
+
+
+ // a ']' must be the first character in teh range.
+ if ( foundParenthesis ) {
+ res.append(QString::fromLatin1("]"));
+ }
+
+ // a '-' must be the first character ( only coming after a ']')
+ if ( foundDash ) {
+ res.append(QString::fromLatin1("-"));
+ }
+
+ res += txt;
+
+ // Insert equivalents to \s,\S,\d,\D,\w, and \W
+ // non-digit, non-space, and non-word is not supported in Emacs style
+ if ( regexp->digit() )
+ res += QString::fromLocal8Bit("0-9");
+ if ( regexp->space() )
+ res += QString::fromLocal8Bit(" ") + QString( QChar( (char) 9 ) ); // Tab char
+ if ( regexp->wordChar() )
+ res += QString::fromLocal8Bit("a-zA-Z");
+
+ if ( foundCarrot ) {
+ res.append( QChar( '^' ) );
+ }
+
+ res.append(QString::fromLatin1("]"));
+
+ return res;
+}
+
+QString EmacsRegExpConverter::toString( CompoundRegExp* regexp, bool markSelection )
+{
+ return toStr( regexp->child(), markSelection );
+}
+
+QString EmacsRegExpConverter::toString( DotRegExp* /*regexp*/, bool /*markSelection*/ )
+{
+ return QString::fromLatin1( "." );
+}
+
+QString EmacsRegExpConverter::toString( PositionRegExp* regexp, bool /*markSelection*/ )
+{
+ static bool haveWarned = false;
+ switch ( regexp->position()) {
+ case PositionRegExp::BEGLINE:
+ return QString::fromLatin1("^");
+ case PositionRegExp::ENDLINE:
+ return QString::fromLatin1("$");
+ case PositionRegExp::WORDBOUNDARY:
+ case PositionRegExp::NONWORDBOUNDARY:
+ if ( ! haveWarned ) {
+ KMessageBox::sorry( 0, i18n( "Word boundary and non word boundary is not supported in Emacs syntax" ) );
+ haveWarned = true;
+ return QString::fromLatin1("");
+ }
+ }
+ return QString::fromLatin1("");
+}
+
+QString EmacsRegExpConverter::toString( RepeatRegExp* regexp, bool markSelection )
+{
+ RegExp* child = regexp->child();
+ QString cText = toStr( child, markSelection );
+ QString startPar;
+ QString endPar;
+
+ if ( child->precedence() < regexp->precedence() ) {
+ startPar = QString::fromLatin1( "\\(" );
+ endPar = QString::fromLatin1( "\\)" );
+ }
+
+ if (regexp->min() == 0 && regexp->max() == -1) {
+ return startPar + cText +endPar + QString::fromLocal8Bit("*");
+ }
+ else if ( regexp->min() == 0 && regexp->max() == 1 ) {
+ return startPar + cText + endPar + QString::fromLocal8Bit("?");
+ }
+ else if ( regexp->min() == 1 && regexp->max() == -1 ) {
+ return startPar + cText + endPar + QString::fromLocal8Bit("+");
+ }
+ else {
+ QString res = QString::fromLatin1("");
+ for ( int i = 0; i < regexp->min(); ++i ) {
+ res += QString::fromLatin1( "\\(" ) + cText + QString::fromLatin1( "\\)" );
+ }
+ if ( regexp->max() != -1 ) {
+ for ( int i = regexp->min(); i < regexp->max(); ++i ) {
+ res += QString::fromLatin1("\\(") + cText + QString::fromLatin1("\\)?");
+ }
+ }
+ else
+ res += QString::fromLatin1("+");
+
+ return res;
+ }
+}
+
+QString EmacsRegExpConverter::toString( TextRegExp* regexp, bool /*markSelection*/ )
+{
+ QValueList<QChar> list;
+ list << QChar('$')
+ << QChar('^')
+ << QChar('.')
+ << QChar('*')
+ << QChar('+')
+ << QChar('?')
+ << QChar('[')
+ << QChar(']')
+ << QChar('\\');
+
+ QString res = escape( regexp->text(), list, QChar('\\') );
+ return res;
+}
+
+QString EmacsRegExpConverter::name()
+{
+ return QString::fromLatin1( "Emacs" );
+}
+
+int EmacsRegExpConverter::features()
+{
+ return WordStart | WordEnd;
+}