searchengine/cpix/tsrc/cpixunittest/src/localetestinfos.cpp
author hgs
Mon, 28 Jun 2010 10:34:53 +0530
changeset 8 6547bf8ca13a
permissions -rw-r--r--
201025
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
8
hgs
parents:
diff changeset
     1
/*
hgs
parents:
diff changeset
     2
 * localetestinfos.cpp
hgs
parents:
diff changeset
     3
 *
hgs
parents:
diff changeset
     4
 *  Created on: Mar 25, 2010
hgs
parents:
diff changeset
     5
 *      Author: admin
hgs
parents:
diff changeset
     6
 */
hgs
parents:
diff changeset
     7
hgs
parents:
diff changeset
     8
#include "localetestinfos.h"
hgs
parents:
diff changeset
     9
#include "config.h"
hgs
parents:
diff changeset
    10
hgs
parents:
diff changeset
    11
// Locale code string paired with the English test data defined below.
// How the string is consumed is not visible from this file.
const char* EnglishLocale::LOCALE = "en";
hgs
parents:
diff changeset
    12
const char* EnglishLocale::FILES[] = {
hgs
parents:
diff changeset
    13
	STEM_TEST_CORPUS_PATH "\\en\\1.txt",
hgs
parents:
diff changeset
    14
	STEM_TEST_CORPUS_PATH "\\en\\2.txt",
hgs
parents:
diff changeset
    15
	STEM_TEST_CORPUS_PATH "\\en\\3.txt",
hgs
parents:
diff changeset
    16
	STEM_TEST_CORPUS_PATH "\\en\\4.txt",
hgs
parents:
diff changeset
    17
	0
hgs
parents:
diff changeset
    18
};
hgs
parents:
diff changeset
    19
// Wide-character query strings for the English locale; the list is closed
// by a null entry.
const wchar_t* EnglishLocale::QUERIES[] =
{
    L"happy",
    L"happiness",
    L"happening",
    0  // null entry closes the list
};
hgs
parents:
diff changeset
    25
hgs
parents:
diff changeset
    26
hgs
parents:
diff changeset
    27
// Locale code string paired with the French test data defined below.
const char* FrenchLocale::LOCALE = "fr";
hgs
parents:
diff changeset
    28
hgs
parents:
diff changeset
    29
const char* FrenchLocale::FILES[] = {
hgs
parents:
diff changeset
    30
	LOC_TEST_CORPUS_PATH "\\fr\\1.txt",
hgs
parents:
diff changeset
    31
	LOC_TEST_CORPUS_PATH "\\fr\\2.txt",
hgs
parents:
diff changeset
    32
	LOC_TEST_CORPUS_PATH "\\fr\\3.txt",
hgs
parents:
diff changeset
    33
	LOC_TEST_CORPUS_PATH "\\fr\\4.txt",
hgs
parents:
diff changeset
    34
	0
hgs
parents:
diff changeset
    35
};
hgs
parents:
diff changeset
    36
hgs
parents:
diff changeset
    37
// Wide-character query strings for the French locale; a null entry closes
// the list. The accented letter U+00E9 (e with acute) is written as the hex
// escape \xe9; the escape stops at the following 'n', which is not a hex
// digit, so no extra characters are swallowed.
const wchar_t* FrenchLocale::QUERIES[] =
{
    L"d'\xe9nergie",  // d' + U+00E9 + "nergie"
    L"\xe9nergie",    // U+00E9 + "nergie"
    L"elle",
    0  // null entry closes the list
};
hgs
parents:
diff changeset
    43
hgs
parents:
diff changeset
    44
// Locale code string paired with the Hebrew test data defined below.
const char* HebrewLocale::LOCALE = "he";
hgs
parents:
diff changeset
    45
hgs
parents:
diff changeset
    46
const char* HebrewLocale::FILES[] = {
hgs
parents:
diff changeset
    47
	LOC_TEST_CORPUS_PATH "\\he\\1.txt",
hgs
parents:
diff changeset
    48
	LOC_TEST_CORPUS_PATH "\\he\\2.txt",
hgs
parents:
diff changeset
    49
	LOC_TEST_CORPUS_PATH "\\he\\3.txt",
hgs
parents:
diff changeset
    50
	LOC_TEST_CORPUS_PATH "\\he\\4.txt",
hgs
parents:
diff changeset
    51
	0
hgs
parents:
diff changeset
    52
};
hgs
parents:
diff changeset
    53
hgs
parents:
diff changeset
    54
// Wide-character query strings for the Hebrew locale, spelled with \x hex
// escapes so the source stays ASCII-only. Two entries end in a literal '*'
// character. A null entry closes the list.
const wchar_t* HebrewLocale::QUERIES[] =
{
    L"\x05e9\x05e4\x05e2\x05ea",  // L"שפעת"  (shin, pe, ayin, tav)
    L"\x05e4\x05e2\x05ea",        // L"פעת"   (pe, ayin, tav)
    L"\x05e9\x05e4\x05e2*",       // L"שפע*"  (shin, pe, ayin, then '*')
    L"\x05e4\x05e8*",             // L"פר*"   (pe, resh, then '*')
    0  // null entry closes the list
};
hgs
parents:
diff changeset
    61
hgs
parents:
diff changeset
    62
// Locale code string paired with the Thai test data defined below.
const char* ThaiLocale::LOCALE = "th";
hgs
parents:
diff changeset
    63
const char* ThaiLocale::FILES[] = {
hgs
parents:
diff changeset
    64
	LOC_TEST_CORPUS_PATH "\\th\\1.txt",
hgs
parents:
diff changeset
    65
	LOC_TEST_CORPUS_PATH "\\th\\2.txt",
hgs
parents:
diff changeset
    66
	LOC_TEST_CORPUS_PATH "\\th\\3.txt",
hgs
parents:
diff changeset
    67
	LOC_TEST_CORPUS_PATH "\\th\\4.txt",
hgs
parents:
diff changeset
    68
	0
hgs
parents:
diff changeset
    69
};
hgs
parents:
diff changeset
    70
// Wide-character query strings for the Thai locale, spelled with \x hex
// escapes (code points in the U+0E00 Thai block). A null entry closes the
// list.
const wchar_t* ThaiLocale::QUERIES[] =
{
    L"\x0E14\x0E32\x0E27\x0E15\x0E01",  // a Thai word (five code points)
    L"\x0E21\x0E35",                    // another Thai word (two code points)
    0  // null entry closes the list
};
hgs
parents:
diff changeset
    75
hgs
parents:
diff changeset
    76
hgs
parents:
diff changeset
    77
// Locale code string paired with the Chinese test data defined below.
// NOTE(review): the ISO 639-1 code for Chinese is "zh"; "ch" matches the
// "ch_*" corpus directory names used in this file. Confirm which spelling
// the code that reads LOCALE expects before changing it.
const char* ChineseLocale::LOCALE = "ch";
hgs
parents:
diff changeset
    78
const char* ChineseLocale::FILES[] = {
hgs
parents:
diff changeset
    79
	LOC_TEST_CORPUS_PATH "\\ch_hk\\1.txt",
hgs
parents:
diff changeset
    80
	LOC_TEST_CORPUS_PATH "\\ch_hk\\2.txt",
hgs
parents:
diff changeset
    81
	LOC_TEST_CORPUS_PATH "\\ch_hk\\3.txt",
hgs
parents:
diff changeset
    82
	LOC_TEST_CORPUS_PATH "\\ch_hk\\4.txt",
hgs
parents:
diff changeset
    83
	
hgs
parents:
diff changeset
    84
	LOC_TEST_CORPUS_PATH "\\ch_prc\\1.txt",
hgs
parents:
diff changeset
    85
	LOC_TEST_CORPUS_PATH "\\ch_prc\\2.txt",
hgs
parents:
diff changeset
    86
	LOC_TEST_CORPUS_PATH "\\ch_prc\\3.txt",
hgs
parents:
diff changeset
    87
	LOC_TEST_CORPUS_PATH "\\ch_prc\\4.txt",
hgs
parents:
diff changeset
    88
hgs
parents:
diff changeset
    89
	LOC_TEST_CORPUS_PATH "\\ch_simple\\1.txt",
hgs
parents:
diff changeset
    90
	LOC_TEST_CORPUS_PATH "\\ch_simple\\2.txt",
hgs
parents:
diff changeset
    91
	LOC_TEST_CORPUS_PATH "\\ch_simple\\3.txt",
hgs
parents:
diff changeset
    92
	LOC_TEST_CORPUS_PATH "\\ch_simple\\4.txt",
hgs
parents:
diff changeset
    93
hgs
parents:
diff changeset
    94
	LOC_TEST_CORPUS_PATH "\\ch_tw\\1.txt",
hgs
parents:
diff changeset
    95
	LOC_TEST_CORPUS_PATH "\\ch_tw\\2.txt",
hgs
parents:
diff changeset
    96
	LOC_TEST_CORPUS_PATH "\\ch_tw\\3.txt",
hgs
parents:
diff changeset
    97
	LOC_TEST_CORPUS_PATH "\\ch_tw\\4.txt",
hgs
parents:
diff changeset
    98
hgs
parents:
diff changeset
    99
	0
hgs
parents:
diff changeset
   100
};
hgs
parents:
diff changeset
   101
// Wide-character query strings for the Chinese locale, spelled with \x hex
// escapes (CJK ideographs). A null entry closes the list.
const wchar_t* ChineseLocale::QUERIES[] =
{
    L"\x53f0\x6e7e",  // a Chinese word (U+53F0 U+6E7E)
    L"\x4e2d\x56fd",  // another Chinese word (U+4E2D U+56FD)
    0  // null entry closes the list
};
hgs
parents:
diff changeset
   106
hgs
parents:
diff changeset
   107
// Locale code string paired with the Korean test data defined below.
const char* KoreanLocale::LOCALE = "ko";
hgs
parents:
diff changeset
   108
const char* KoreanLocale::FILES[] = {
hgs
parents:
diff changeset
   109
	LOC_TEST_CORPUS_PATH "\\ko\\1.txt",
hgs
parents:
diff changeset
   110
	LOC_TEST_CORPUS_PATH "\\ko\\2.txt",
hgs
parents:
diff changeset
   111
	LOC_TEST_CORPUS_PATH "\\ko\\3.txt",
hgs
parents:
diff changeset
   112
	LOC_TEST_CORPUS_PATH "\\ko\\4.txt",
hgs
parents:
diff changeset
   113
	
hgs
parents:
diff changeset
   114
	0
hgs
parents:
diff changeset
   115
};
hgs
parents:
diff changeset
   116
// Wide-character query strings for the Korean locale, spelled with \x hex
// escapes (Hangul syllables). Every escape here has four hex digits; the
// last one in each literal ends at the closing quote. A null entry closes
// the list.
const wchar_t* KoreanLocale::QUERIES[] =
{
    L"\xc2a4\xd1a0\xb9ac",  // a Korean word (three Hangul syllables)
    L"\xc778\xbb3c",        // another Korean word (two Hangul syllables)
    0  // null entry closes the list
};
hgs
parents:
diff changeset
   121
hgs
parents:
diff changeset
   122
// Locale code string paired with the Japanese test data defined below.
// NOTE(review): the ISO 639-1 code for Japanese is "ja"; "jp" matches the
// "jp" / "jp_old" corpus directory names used in this file. Confirm which
// spelling the code that reads LOCALE expects before changing it.
const char* JapaneseLocale::LOCALE = "jp";
hgs
parents:
diff changeset
   123
const char* JapaneseLocale::FILES[] = {
hgs
parents:
diff changeset
   124
	LOC_TEST_CORPUS_PATH "\\jp\\1.txt",
hgs
parents:
diff changeset
   125
	LOC_TEST_CORPUS_PATH "\\jp\\2.txt",
hgs
parents:
diff changeset
   126
	LOC_TEST_CORPUS_PATH "\\jp\\3.txt",
hgs
parents:
diff changeset
   127
	LOC_TEST_CORPUS_PATH "\\jp\\4.txt",
hgs
parents:
diff changeset
   128
hgs
parents:
diff changeset
   129
	LOC_TEST_CORPUS_PATH "\\jp_old\\1.txt",
hgs
parents:
diff changeset
   130
	LOC_TEST_CORPUS_PATH "\\jp_old\\2.txt",
hgs
parents:
diff changeset
   131
	LOC_TEST_CORPUS_PATH "\\jp_old\\3.txt",
hgs
parents:
diff changeset
   132
	LOC_TEST_CORPUS_PATH "\\jp_old\\4.txt",
hgs
parents:
diff changeset
   133
hgs
parents:
diff changeset
   134
	0
hgs
parents:
diff changeset
   135
};
hgs
parents:
diff changeset
   136
// Wide-character query strings for the Japanese locale, spelled with \x hex
// escapes (kanji). A null entry closes the list.
const wchar_t* JapaneseLocale::QUERIES[] =
{
    L"\x56fd\x969b",  // a Japanese word (U+56FD U+969B)
    L"\x65e5\x672c",  // another Japanese word (U+65E5 U+672C)
    0  // null entry closes the list
};