searchengine/util/tsrc/cpixtoolsunittest/src/parseunittest.cpp
author hgs
Mon, 28 Jun 2010 10:34:53 +0530
changeset 8 6547bf8ca13a
parent 0 671dee74050a
permissions -rw-r--r--
201025
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
     1
/*
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
     2
* Copyright (c) 2010 Nokia Corporation and/or its subsidiary(-ies).
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
     3
* All rights reserved.
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
     4
* This component and the accompanying materials are made available
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
     5
* under the terms of "Eclipse Public License v1.0"
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
     6
* which accompanies this distribution, and is available
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
     7
* at the URL "http://www.eclipse.org/legal/epl-v10.html".
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
     8
*
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
     9
* Initial Contributors:
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    10
* Nokia Corporation - initial contribution.
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    11
*
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    12
* Contributors:
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    13
*
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    14
* Description: 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    15
*
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    16
*/
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    17
#include "cpixparsetools.h"
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    18
#include "itk.h"
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    19
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    20
#include <iostream>
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    21
#include <memory>
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    22
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    23
using namespace Cpt::Lex; 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    24
using namespace Cpt::Parser; 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    25
using namespace std; 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    26
8
hgs
parents: 0
diff changeset
    27
const wchar_t* TOKEN_LEFT_BRACKET = L"left bracket";
hgs
parents: 0
diff changeset
    28
const wchar_t* TOKEN_RIGHT_BRACKET = L"right bracket"; 
hgs
parents: 0
diff changeset
    29
const wchar_t* TOKEN_COMMA = L"comma";
hgs
parents: 0
diff changeset
    30
const wchar_t* TOKEN_PIPE = L"pipe";
hgs
parents: 0
diff changeset
    31
const wchar_t* TOKEN_SWITCH = L"switch";
hgs
parents: 0
diff changeset
    32
const wchar_t* TOKEN_CASE = L"case";
hgs
parents: 0
diff changeset
    33
const wchar_t* TOKEN_DEFAULT = L"default";
hgs
parents: 0
diff changeset
    34
const wchar_t* TOKEN_LEFT_BRACE = L"left brace";
hgs
parents: 0
diff changeset
    35
const wchar_t* TOKEN_RIGHT_BRACE = L"right brace";
hgs
parents: 0
diff changeset
    36
const wchar_t* TOKEN_COLON = L"colon";
hgs
parents: 0
diff changeset
    37
const wchar_t* TOKEN_TERMINATOR = L"terminator";
0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    38
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    39
void PrintToken(Cpt::Lex::Token token) {
8
hgs
parents: 0
diff changeset
    40
	wcout<<token.type()<<L"('"<<token.text()<<L"')";  
0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    41
}
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    42
8
hgs
parents: 0
diff changeset
    43
void TestTokenization(Itk::TestMgr  * testMgr,
0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    44
                      const wchar_t * inputStr)
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    45
{
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    46
	WhitespaceTokenizer ws; 
8
hgs
parents: 0
diff changeset
    47
	LineCommentTokenizer line; 
hgs
parents: 0
diff changeset
    48
	SectionCommentTokenizer section; 
0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    49
	IdTokenizer ids; 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    50
        IntLitTokenizer ints;
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    51
        RealLitTokenizer reals;
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    52
	LitTokenizer lits('\''); 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    53
	SymbolTokenizer lb(TOKEN_LEFT_BRACKET, L"("); 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    54
	SymbolTokenizer rb(TOKEN_RIGHT_BRACKET, L")"); 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    55
	SymbolTokenizer cm(TOKEN_COMMA, L","); 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    56
	SymbolTokenizer pp(TOKEN_PIPE, L">");
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    57
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    58
        // NOTE: ints and reals are before lits, so even if lits
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    59
        // itself can recognize strings, ints and reals, the ints and
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    60
        // reals are taking precedence - just for the test cases now
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    61
        // (to check if those types are recognized correctly). So
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    62
        // basically, in test cases, lit will mean string literals,
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    63
        // and int-lit, real-lit will mean integer and real literals,
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    64
        // respectively.
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    65
	Tokenizer* tokenizers[] = {
8
hgs
parents: 0
diff changeset
    66
		&ws, &line, &section, &lb, &rb, &cm, &pp, &ids, &ints, &reals, &lits, 0
0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    67
	};
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    68
	MultiTokenizer tokenizer(tokenizers);
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    69
	
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    70
	Tokens 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    71
            source(tokenizer, 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    72
                   inputStr);
8
hgs
parents: 0
diff changeset
    73
	StdFilter tokens(source); 
0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    74
	
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    75
	while (tokens) PrintToken(tokens++); 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    76
	cout<<endl;
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    77
}
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    78
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    79
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    80
void TestTokenization1(Itk::TestMgr * testMgr)
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    81
{
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    82
    TestTokenization(testMgr,
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    83
                     L"stdtokens>lowercase>stopwords('a', 'an','the')>stem('en')");
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    84
}
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    85
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    86
void TestTokenization2(Itk::TestMgr * testMgr)
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    87
{
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    88
    TestTokenization(testMgr,
8
hgs
parents: 0
diff changeset
    89
                     L"'foo' 0 1 -2 'bar' +234 -34 // side note");
0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    90
}
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    91
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    92
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    93
void TestTokenization3(Itk::TestMgr * testMgr)
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    94
{
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    95
    TestTokenization(testMgr,
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    96
                     L"'hallo' 0.0 .0 .5 -1.0 -.05 45 'bar' +.123 +3.1415");
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    97
}
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    98
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
    99
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   100
void TestTokenization4(Itk::TestMgr * testMgr)
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   101
{
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   102
    TestTokenization(testMgr,
8
hgs
parents: 0
diff changeset
   103
                     L"'\\' ''\\\\' '\\a' '\\\n' // comment\n /*foobar*/");
0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   104
}
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   105
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   106
8
hgs
parents: 0
diff changeset
   107
void TestTokenization5(Itk::TestMgr * testMgr)
0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   108
{
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   109
    WhitespaceTokenizer 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   110
        ws; 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   111
    IdTokenizer 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   112
        ids; 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   113
    SymbolTokenizer 
8
hgs
parents: 0
diff changeset
   114
        for_(L"for", L"for"); 
0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   115
    SymbolTokenizer 
8
hgs
parents: 0
diff changeset
   116
        if_(L"if", L"if"); 
0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   117
    Tokenizer* tokenizers[] = {
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   118
        &ws, &for_, &if_, &ids, 0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   119
    };
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   120
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   121
    MultiTokenizer 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   122
        tokenizer(tokenizers);
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   123
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   124
    Tokens 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   125
        source(tokenizer, 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   126
               L"fo for fore forth ofor oforo i if ifdom ifer fif fifi forfi fifor"); // test escape in literals
8
hgs
parents: 0
diff changeset
   127
    StdFilter 
0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   128
        tokens(source); 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   129
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   130
    while (tokens) PrintToken(tokens++); 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   131
    cout<<endl;
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   132
}
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   133
8
hgs
parents: 0
diff changeset
   134
void TestTokenization6(Itk::TestMgr * testMgr)
hgs
parents: 0
diff changeset
   135
{
hgs
parents: 0
diff changeset
   136
    WhitespaceTokenizer 
hgs
parents: 0
diff changeset
   137
        ws; 
hgs
parents: 0
diff changeset
   138
    LineCommentTokenizer 
hgs
parents: 0
diff changeset
   139
        line; 
hgs
parents: 0
diff changeset
   140
    SectionCommentTokenizer 
hgs
parents: 0
diff changeset
   141
        section; 
hgs
parents: 0
diff changeset
   142
    IdTokenizer 
hgs
parents: 0
diff changeset
   143
        ids; 
hgs
parents: 0
diff changeset
   144
    IntLitTokenizer 
hgs
parents: 0
diff changeset
   145
        intLit; 
hgs
parents: 0
diff changeset
   146
    RealLitTokenizer 
hgs
parents: 0
diff changeset
   147
        realLit; 
hgs
parents: 0
diff changeset
   148
    SymbolTokenizer 
hgs
parents: 0
diff changeset
   149
        div(L"slash", L"/"); 
hgs
parents: 0
diff changeset
   150
    SymbolTokenizer 
hgs
parents: 0
diff changeset
   151
        mul(L"star", L"*");
hgs
parents: 0
diff changeset
   152
    SymbolTokenizer 
hgs
parents: 0
diff changeset
   153
        plus(L"plus", L"+");
hgs
parents: 0
diff changeset
   154
    SymbolTokenizer 
hgs
parents: 0
diff changeset
   155
        minus(L"minus", L"-");
hgs
parents: 0
diff changeset
   156
    SymbolTokenizer 
hgs
parents: 0
diff changeset
   157
        equal(L"equals", L"=");
hgs
parents: 0
diff changeset
   158
    
hgs
parents: 0
diff changeset
   159
    Tokenizer* tokenizers[] = {
hgs
parents: 0
diff changeset
   160
        &ws, &line, &section, &ids, &intLit, &realLit, &div, &mul, &plus, &minus, &equal, 0
hgs
parents: 0
diff changeset
   161
    };
hgs
parents: 0
diff changeset
   162
hgs
parents: 0
diff changeset
   163
    MultiTokenizer 
hgs
parents: 0
diff changeset
   164
        tokenizer(tokenizers);
hgs
parents: 0
diff changeset
   165
    
hgs
parents: 0
diff changeset
   166
    const wchar_t* text = 
hgs
parents: 0
diff changeset
   167
    	L"4 + 6 = 2 * 5\n"
hgs
parents: 0
diff changeset
   168
        L"6 / 2 = 1*3 // true\n"
hgs
parents: 0
diff changeset
   169
		L"3 / x /*important thingie*/ = 2 * y\n"
hgs
parents: 0
diff changeset
   170
		L"6 / x * / * / /* non sense / * / */ // zap"
hgs
parents: 0
diff changeset
   171
		L"//\n"
hgs
parents: 0
diff changeset
   172
		L"//"; 
hgs
parents: 0
diff changeset
   173
hgs
parents: 0
diff changeset
   174
    {
hgs
parents: 0
diff changeset
   175
		cout<<"With whitespaces & comments visible"<<endl;
hgs
parents: 0
diff changeset
   176
		Tokens 
hgs
parents: 0
diff changeset
   177
			tokens(tokenizer, text);
hgs
parents: 0
diff changeset
   178
	
hgs
parents: 0
diff changeset
   179
		while (tokens) PrintToken(tokens++); 
hgs
parents: 0
diff changeset
   180
		cout<<endl;
hgs
parents: 0
diff changeset
   181
    }
hgs
parents: 0
diff changeset
   182
hgs
parents: 0
diff changeset
   183
    {
hgs
parents: 0
diff changeset
   184
		cout<<"With whitespaces & comments filtered"<<endl;
hgs
parents: 0
diff changeset
   185
		Tokens 
hgs
parents: 0
diff changeset
   186
			source(tokenizer, text);
hgs
parents: 0
diff changeset
   187
		
hgs
parents: 0
diff changeset
   188
		StdFilter tokens(source); 
hgs
parents: 0
diff changeset
   189
	
hgs
parents: 0
diff changeset
   190
		while (tokens) PrintToken(tokens++); 
hgs
parents: 0
diff changeset
   191
		cout<<endl;
hgs
parents: 0
diff changeset
   192
    }
hgs
parents: 0
diff changeset
   193
hgs
parents: 0
diff changeset
   194
}
hgs
parents: 0
diff changeset
   195
hgs
parents: 0
diff changeset
   196
void TestTokenizationErrors(Itk::TestMgr* mgr) 
0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   197
{
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   198
	WhitespaceTokenizer ws; 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   199
	IdTokenizer ids; 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   200
	LitTokenizer lits('\''); 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   201
	SymbolTokenizer lb(TOKEN_LEFT_BRACKET, L"("); 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   202
	SymbolTokenizer rb(TOKEN_RIGHT_BRACKET, L")"); 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   203
	SymbolTokenizer cm(TOKEN_COMMA, L","); 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   204
	SymbolTokenizer pp(TOKEN_PIPE, L">");
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   205
	Tokenizer* tokenizers[] = {
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   206
		&ws, &lb, &rb, &cm, &pp, &ids, &lits, 0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   207
	};
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   208
	MultiTokenizer tokenizer(tokenizers);
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   209
	const wchar_t* text;
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   210
	{
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   211
		Tokens tokens(tokenizer, text = L"stdtokens>lowercase>stopwords('a', 'an','the)>stem('en')");
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   212
		try {
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   213
			while (tokens) PrintToken(tokens++); 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   214
		} catch (LexException& exc) {
8
hgs
parents: 0
diff changeset
   215
			exc.setContext(text);
hgs
parents: 0
diff changeset
   216
			wcout<<endl<<L"LexException: "<<exc.wWhat()<<endl; 
0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   217
		} catch (exception& exc) {
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   218
			cout<<endl<<"Exception: "<<exc.what()<<endl; 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   219
		}
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   220
	}
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   221
	{
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   222
		Tokens tokens(tokenizer, text = L"fas-324we?`213ff3*21(+");
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   223
		try {
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   224
			while (tokens) PrintToken(tokens++); 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   225
		} catch (LexException& exc) {
8
hgs
parents: 0
diff changeset
   226
			exc.setContext(text);
hgs
parents: 0
diff changeset
   227
			wcout<<endl<<L"LexException: "<<exc.wWhat()<<endl; 
0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   228
		} catch (exception& exc) {
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   229
			cout<<endl<<"Exception: "<<exc.what()<<endl; 
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   230
		}
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   231
	}
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   232
}
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   233
8
hgs
parents: 0
diff changeset
   234
void TestWhitespaceSplitter(Itk::TestMgr* mgr) 
hgs
parents: 0
diff changeset
   235
{
hgs
parents: 0
diff changeset
   236
	{
hgs
parents: 0
diff changeset
   237
		WhitespaceSplitter tokens(L"foobar foo bar foo\tbar _*4 4bar foo*bar foo\nbar foo\rbar foo\0bar");
hgs
parents: 0
diff changeset
   238
		while (tokens) printf(" \"%S\"", tokens++.text().c_str());
hgs
parents: 0
diff changeset
   239
		printf("\n");
hgs
parents: 0
diff changeset
   240
	}
hgs
parents: 0
diff changeset
   241
	
hgs
parents: 0
diff changeset
   242
	{
hgs
parents: 0
diff changeset
   243
		WhitespaceSplitter tokens(L"foobar");
hgs
parents: 0
diff changeset
   244
		while (tokens) printf(" \"%S\"", tokens++.text().c_str());
hgs
parents: 0
diff changeset
   245
		printf("\n");
hgs
parents: 0
diff changeset
   246
	}
hgs
parents: 0
diff changeset
   247
hgs
parents: 0
diff changeset
   248
	{
hgs
parents: 0
diff changeset
   249
		WhitespaceSplitter tokens(L"   foobar  \r\n");
hgs
parents: 0
diff changeset
   250
		while (tokens) printf(" \"%S\"", tokens++.text().c_str());
hgs
parents: 0
diff changeset
   251
		printf("\n");
hgs
parents: 0
diff changeset
   252
	}
hgs
parents: 0
diff changeset
   253
hgs
parents: 0
diff changeset
   254
	{
hgs
parents: 0
diff changeset
   255
		WhitespaceSplitter tokens(L"   ");
hgs
parents: 0
diff changeset
   256
		while (tokens) printf(" \"%S\"", tokens++.text().c_str());
hgs
parents: 0
diff changeset
   257
		printf("\n");
hgs
parents: 0
diff changeset
   258
	}
hgs
parents: 0
diff changeset
   259
hgs
parents: 0
diff changeset
   260
	{
hgs
parents: 0
diff changeset
   261
		WhitespaceSplitter tokens(L"");
hgs
parents: 0
diff changeset
   262
		while (tokens) printf(" \"%S\"", tokens++.text().c_str());
hgs
parents: 0
diff changeset
   263
		printf("\n");
hgs
parents: 0
diff changeset
   264
	}
hgs
parents: 0
diff changeset
   265
hgs
parents: 0
diff changeset
   266
}
hgs
parents: 0
diff changeset
   267
0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   268
Itk::TesterBase * CreateParsingTests()
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   269
{
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   270
    using namespace Itk;
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   271
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   272
    SuiteTester
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   273
        * parsingTests = new SuiteTester("parsing");
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   274
   
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   275
    parsingTests->add("tokenization1",
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   276
                      TestTokenization1,
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   277
                      "tokenization1");
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   278
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   279
    parsingTests->add("tokenization2",
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   280
                      TestTokenization2,
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   281
                      "tokenization2");
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   282
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   283
    parsingTests->add("tokenization3",
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   284
                      TestTokenization3,
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   285
                      "tokenization3");
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   286
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   287
    parsingTests->add("tokenization4",
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   288
                      TestTokenization4,
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   289
                      "tokenization4");
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   290
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   291
    parsingTests->add("tokenization5",
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   292
                      TestTokenization5,
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   293
                      "tokenization5");
8
hgs
parents: 0
diff changeset
   294
    
hgs
parents: 0
diff changeset
   295
    parsingTests->add("tokenization6",
hgs
parents: 0
diff changeset
   296
                      TestTokenization6,
hgs
parents: 0
diff changeset
   297
                      "tokenization6");
0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   298
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   299
    parsingTests->add("syntaxerrors",
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   300
                      TestTokenizationErrors,
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   301
                      "syntaxerrors");
8
hgs
parents: 0
diff changeset
   302
hgs
parents: 0
diff changeset
   303
    parsingTests->add("whitespace",
hgs
parents: 0
diff changeset
   304
					  TestWhitespaceSplitter,
hgs
parents: 0
diff changeset
   305
                      "whitespace");
hgs
parents: 0
diff changeset
   306
0
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   307
    return parsingTests;
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   308
}
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   309
671dee74050a Revision: 201011
Dremov Kirill (Nokia-D-MSW/Tampere) <kirill.dremov@nokia.com>
parents:
diff changeset
   310