searchengine/cpix/tsrc/cpixunittest/data/cpixunittest/analysis/whitebox/loc/he_exp_out.txt
author hgs
Fri, 15 Oct 2010 12:09:28 +0530
changeset 24 65456528cac2
permissions -rw-r--r--
201041
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
24
hgs
parents:
diff changeset
     1
Analyzer "natural":
hgs
parents:
diff changeset
     2
File ./cpixunittestcorpus/text/en/1.txt tokenized:
hgs
parents:
diff changeset
     3
 'i' 'am' 'happy'
hgs
parents:
diff changeset
     4
File ./cpixunittestcorpus/text/en/2.txt tokenized:
hgs
parents:
diff changeset
     5
 'oh' 'happiness'
hgs
parents:
diff changeset
     6
File ./cpixunittestcorpus/text/en/3.txt tokenized:
hgs
parents:
diff changeset
     7
 'nothing' 'important' 'in' 'here' 'so' 'don't' 'even' 'look' 'because' 'you' 'shall' 'find' 'nothing' 'whatsoever'
hgs
parents:
diff changeset
     8
File ./cpixunittestcorpus/text/en/4.txt tokenized:
hgs
parents:
diff changeset
     9
 'what' 'is' 'happening' 'here'
hgs
parents:
diff changeset
    10
hgs
parents:
diff changeset
    11
Analyzer "natural":
hgs
parents:
diff changeset
    12
File ./cpixunittestcorpus/text/he/1.txt tokenized:
hgs
parents:
diff changeset
    13
 'שפעת'|'פעת' 'החזירים'|'חזירים' 'תושבת'|'ושבת'|'שבת'|'בת'|'ת' 'נצרת'|'צרת' 'עילית' 'בת'|'ת' '51' 'ללא'|'לא'|'א' 'מחלות'|'חלות' 'רקע' 'מתה'|'תה'|'ה'
hgs
parents:
diff changeset
    14
File ./cpixunittestcorpus/text/he/2.txt tokenized:
hgs
parents:
diff changeset
    15
 'בבית'|'בית'|'ית'|'ת' 'החולים'|'חולים' 'העמק'|'עמק' 'החולה'|'חולה' 'טופלה' 'אתמול'|'תמול'|'מול'|'ול'|'ל' 'בתרופה'|'תרופה'|'רופה' 'הניסיונית'|'ניסיונית'|'יסיונית'|'סיונית'
hgs
parents:
diff changeset
    16
File ./cpixunittestcorpus/text/he/3.txt tokenized:
hgs
parents:
diff changeset
    17
 'פרהמיביר' 'אולם'|'ולם'|'לם'|'ם' 'מצבה'|'צבה' 'הוסיף'|'וסיף'|'סיף' 'להידרדר'|'הידרדר'|'ידרדר'|'דרדר'
hgs
parents:
diff changeset
    18
File ./cpixunittestcorpus/text/he/4.txt tokenized:
hgs
parents:
diff changeset
    19
 'והבוקר'|'הבוקר'|'בוקר'|'וקר'|'קר' 'נקבע'|'קבע' 'מותה'|'ותה'|'תה'|'ה' 'החולה'|'חולה' 'תושבת'|'ושבת'|'שבת'|'בת'|'ת' 'נצרת'|'צרת' 'עילית'
hgs
parents:
diff changeset
    20