searchengine/oss/loc/analysis/inc/private/tinyanalysis.inl
author hgs
Fri, 15 Oct 2010 12:09:28 +0530
changeset 24 65456528cac2
permissions -rw-r--r--
201041
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
24
hgs
parents:
diff changeset
     1
/*
hgs
parents:
diff changeset
     2
* Copyright (c) 2010 Nokia Corporation and/or its subsidiary(-ies).
hgs
parents:
diff changeset
     3
* All rights reserved.
hgs
parents:
diff changeset
     4
* This component and the accompanying materials are made available
hgs
parents:
diff changeset
     5
* under the terms of "Eclipse Public License v1.0"
hgs
parents:
diff changeset
     6
* which accompanies this distribution, and is available
hgs
parents:
diff changeset
     7
* at the URL "http://www.eclipse.org/legal/epl-v10.html".
hgs
parents:
diff changeset
     8
*
hgs
parents:
diff changeset
     9
* Initial Contributors:
hgs
parents:
diff changeset
    10
* Nokia Corporation - initial contribution.
hgs
parents:
diff changeset
    11
*
hgs
parents:
diff changeset
    12
* Contributors:
hgs
parents:
diff changeset
    13
*
hgs
parents:
diff changeset
    14
* Description: 
hgs
parents:
diff changeset
    15
*
hgs
parents:
diff changeset
    16
*/
hgs
parents:
diff changeset
    17
#ifndef TINYANALYSIS_INL_
hgs
parents:
diff changeset
    18
#define TINYANALYSIS_INL_
hgs
parents:
diff changeset
    19
hgs
parents:
diff changeset
    20
#include "CLucene.h"
hgs
parents:
diff changeset
    21
hgs
parents:
diff changeset
    22
/*
hgs
parents:
diff changeset
    23
 * TODO: 
hgs
parents:
diff changeset
    24
 * 
hgs
parents:
diff changeset
    25
 *   Move more functionality in here
hgs
parents:
diff changeset
    26
 *   
hgs
parents:
diff changeset
    27
 */
hgs
parents:
diff changeset
    28
hgs
parents:
diff changeset
    29
namespace analysis {
hgs
parents:
diff changeset
    30
    namespace tiny {
hgs
parents:
diff changeset
    31
        namespace cl {
hgs
parents:
diff changeset
    32
    
hgs
parents:
diff changeset
    33
            template<int SIZE>
hgs
parents:
diff changeset
    34
            wchar_t ReaderBuffer<SIZE>::operator[](int i)
hgs
parents:
diff changeset
    35
            {
hgs
parents:
diff changeset
    36
                if ( i < read_ - SIZE ) throw TooOldIndexException();
hgs
parents:
diff changeset
    37
                // fill
hgs
parents:
diff changeset
    38
                while (i >= read_) {
hgs
parents:
diff changeset
    39
                    int c = reader_.read(); 
hgs
parents:
diff changeset
    40
                    buf_[cut_++] = ( c == -1 ? '\0' : c );
hgs
parents:
diff changeset
    41
                    cut_ %= SIZE;
hgs
parents:
diff changeset
    42
                    if (read_++ >= SIZE) {
hgs
parents:
diff changeset
    43
                        offset_++;
hgs
parents:
diff changeset
    44
                    } 
hgs
parents:
diff changeset
    45
                }
hgs
parents:
diff changeset
    46
                // guaranteed that i < read
hgs
parents:
diff changeset
    47
                return buf_[i % SIZE]; 
hgs
parents:
diff changeset
    48
            }
hgs
parents:
diff changeset
    49
           
hgs
parents:
diff changeset
    50
            template<int SIZE>
hgs
parents:
diff changeset
    51
            ReaderBuffer<SIZE>::ReaderBuffer(lucene::util::Reader& reader)
hgs
parents:
diff changeset
    52
            : reader_(reader), read_(0), cut_(0), offset_(0) {}
hgs
parents:
diff changeset
    53
            
hgs
parents:
diff changeset
    54
            template<int SIZE>
hgs
parents:
diff changeset
    55
            typename ReaderBuffer<SIZE>::iterator ReaderBuffer<SIZE>::at(int i) {
hgs
parents:
diff changeset
    56
                return  iterator(*this, i); 
hgs
parents:
diff changeset
    57
            }
hgs
parents:
diff changeset
    58
            
hgs
parents:
diff changeset
    59
            template<int SIZE>
hgs
parents:
diff changeset
    60
            typename ReaderBuffer<SIZE>::iterator ReaderBuffer<SIZE>::begin() { 
hgs
parents:
diff changeset
    61
                return iterator(*this, 0); 
hgs
parents:
diff changeset
    62
            }
hgs
parents:
diff changeset
    63
            
hgs
parents:
diff changeset
    64
        }
hgs
parents:
diff changeset
    65
        
hgs
parents:
diff changeset
    66
        template <typename Iterator>
hgs
parents:
diff changeset
    67
        void Token<Iterator>::copyTo(lucene::analysis::Token* token) {
hgs
parents:
diff changeset
    68
            token->resetTermTextLen();
hgs
parents:
diff changeset
    69
            token->growBuffer(utf16size()+1);
hgs
parents:
diff changeset
    70
            token->setPositionIncrement(1);
hgs
parents:
diff changeset
    71
            Utf16Writer<wchar_t*> out(token->_termText); 
hgs
parents:
diff changeset
    72
            Iterator i = begin_; 
hgs
parents:
diff changeset
    73
            token->setStartOffset(i);
hgs
parents:
diff changeset
    74
            for (int n = length_; n; n--) {
hgs
parents:
diff changeset
    75
				out<<*i; ++i; 
hgs
parents:
diff changeset
    76
            }
hgs
parents:
diff changeset
    77
            out<<L'\0';
hgs
parents:
diff changeset
    78
            token->setEndOffset(i);
hgs
parents:
diff changeset
    79
        }
hgs
parents:
diff changeset
    80
hgs
parents:
diff changeset
    81
    }
hgs
parents:
diff changeset
    82
}
hgs
parents:
diff changeset
    83
hgs
parents:
diff changeset
    84
#endif /* TINYANALYSIS_INL_ */