tracesrv/tracecompiler/src/com.nokia.tracecompiler/src/com/nokia/tracecompiler/source/SourceStringSearch.java
author hgs
Fri, 08 Oct 2010 14:56:39 +0300
changeset 56 aa2539c91954
parent 41 tracefw/tracecompiler/src/com.nokia.tracecompiler/src/com/nokia/tracecompiler/source/SourceStringSearch.java@838cdffd57ce
permissions -rw-r--r--
201041
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
41
hgs
parents:
diff changeset
     1
/*
hgs
parents:
diff changeset
     2
* Copyright (c) 2008 Nokia Corporation and/or its subsidiary(-ies). 
hgs
parents:
diff changeset
     3
* All rights reserved.
hgs
parents:
diff changeset
     4
* This component and the accompanying materials are made available
hgs
parents:
diff changeset
     5
* under the terms of "Eclipse Public License v1.0"
hgs
parents:
diff changeset
     6
* which accompanies this distribution, and is available
hgs
parents:
diff changeset
     7
* at the URL "http://www.eclipse.org/legal/epl-v10.html".
hgs
parents:
diff changeset
     8
*
hgs
parents:
diff changeset
     9
* Initial Contributors:
hgs
parents:
diff changeset
    10
* Nokia Corporation - initial contribution.
hgs
parents:
diff changeset
    11
*
hgs
parents:
diff changeset
    12
* Contributors:
hgs
parents:
diff changeset
    13
*
hgs
parents:
diff changeset
    14
* Description:
hgs
parents:
diff changeset
    15
*
hgs
parents:
diff changeset
    16
* String search algorithm
hgs
parents:
diff changeset
    17
*
hgs
parents:
diff changeset
    18
*/
hgs
parents:
diff changeset
    19
package com.nokia.tracecompiler.source;
hgs
parents:
diff changeset
    20
hgs
parents:
diff changeset
    21
import java.util.List;
hgs
parents:
diff changeset
    22
hgs
parents:
diff changeset
    23
/**
hgs
parents:
diff changeset
    24
 * String search algorithm
hgs
parents:
diff changeset
    25
 * 
hgs
parents:
diff changeset
    26
 */
hgs
parents:
diff changeset
    27
public class SourceStringSearch extends SourceSearch {
hgs
parents:
diff changeset
    28
hgs
parents:
diff changeset
    29
	/**
hgs
parents:
diff changeset
    30
	 * String to be searched from the source.
hgs
parents:
diff changeset
    31
	 */
hgs
parents:
diff changeset
    32
	private String searchString;
hgs
parents:
diff changeset
    33
hgs
parents:
diff changeset
    34
	/**
hgs
parents:
diff changeset
    35
	 * Number of different characters in source file alphabet. Assumes that
hgs
parents:
diff changeset
    36
	 * 8-bit encoding is used
hgs
parents:
diff changeset
    37
	 */
hgs
parents:
diff changeset
    38
	private final static int CHARACTER_COUNT = 256; // CodForChk_Dis_Magic
hgs
parents:
diff changeset
    39
hgs
parents:
diff changeset
    40
	/**
hgs
parents:
diff changeset
    41
	 * Mask for bad character shifts (0xFF)
hgs
parents:
diff changeset
    42
	 */
hgs
parents:
diff changeset
    43
	private static final int BAD_CHARACTER_MASK = 0xFF; // CodForChk_Dis_Magic
hgs
parents:
diff changeset
    44
hgs
parents:
diff changeset
    45
	/**
hgs
parents:
diff changeset
    46
	 * String search shifts.
hgs
parents:
diff changeset
    47
	 */
hgs
parents:
diff changeset
    48
	private int[] badCharacterShifts = new int[CHARACTER_COUNT];
hgs
parents:
diff changeset
    49
hgs
parents:
diff changeset
    50
	/**
hgs
parents:
diff changeset
    51
	 * User data associated with search
hgs
parents:
diff changeset
    52
	 */
hgs
parents:
diff changeset
    53
	private Object searchData;
hgs
parents:
diff changeset
    54
hgs
parents:
diff changeset
    55
	/**
hgs
parents:
diff changeset
    56
	 * Creates a new string search
hgs
parents:
diff changeset
    57
	 * 
hgs
parents:
diff changeset
    58
	 * @param parser
hgs
parents:
diff changeset
    59
	 *            the parser containing the source to be searched
hgs
parents:
diff changeset
    60
	 * @param searchString
hgs
parents:
diff changeset
    61
	 *            the string to be searched
hgs
parents:
diff changeset
    62
	 * @param startOffset
hgs
parents:
diff changeset
    63
	 *            offset to the start of search
hgs
parents:
diff changeset
    64
	 * @param endOffset
hgs
parents:
diff changeset
    65
	 *            offset to end of search or -1 for rest of the document
hgs
parents:
diff changeset
    66
	 * @param flags
hgs
parents:
diff changeset
    67
	 *            the search flags
hgs
parents:
diff changeset
    68
	 */
hgs
parents:
diff changeset
    69
	public SourceStringSearch(SourceParser parser, String searchString,
hgs
parents:
diff changeset
    70
			int startOffset, int endOffset, int flags) {
hgs
parents:
diff changeset
    71
		super(parser, startOffset, endOffset, flags);
hgs
parents:
diff changeset
    72
		setSearchString(searchString);
hgs
parents:
diff changeset
    73
	}
hgs
parents:
diff changeset
    74
hgs
parents:
diff changeset
    75
	/*
hgs
parents:
diff changeset
    76
	 * (non-Javadoc)
hgs
parents:
diff changeset
    77
	 * 
hgs
parents:
diff changeset
    78
	 * @see com.nokia.tracecompiler.source.SourceSearch#findNext()
hgs
parents:
diff changeset
    79
	 */
hgs
parents:
diff changeset
    80
	@Override
hgs
parents:
diff changeset
    81
	public int findNext() {
hgs
parents:
diff changeset
    82
		try {
hgs
parents:
diff changeset
    83
			SourceDocumentInterface source = parser.getSource();
hgs
parents:
diff changeset
    84
			int stringIndex = searchString.length() - 1;
hgs
parents:
diff changeset
    85
			boolean found = false;
hgs
parents:
diff changeset
    86
			while (!found && searchIndex + stringIndex < searchEnd) {
hgs
parents:
diff changeset
    87
				char dataChar;
hgs
parents:
diff changeset
    88
				char searchChar;
hgs
parents:
diff changeset
    89
				boolean match = false;
hgs
parents:
diff changeset
    90
				do {
hgs
parents:
diff changeset
    91
					dataChar = source.getChar(searchIndex + stringIndex);
hgs
parents:
diff changeset
    92
					searchChar = searchString.charAt(stringIndex);
hgs
parents:
diff changeset
    93
					if ((flags & SourceParser.IGNORE_CASE) != 0) {
hgs
parents:
diff changeset
    94
						searchChar = Character.toLowerCase(searchChar);
hgs
parents:
diff changeset
    95
						dataChar = Character.toLowerCase(dataChar);
hgs
parents:
diff changeset
    96
					}
hgs
parents:
diff changeset
    97
					if (searchChar == '?' || searchChar == dataChar) {
hgs
parents:
diff changeset
    98
						match = true;
hgs
parents:
diff changeset
    99
						stringIndex--;
hgs
parents:
diff changeset
   100
					} else {
hgs
parents:
diff changeset
   101
						match = false;
hgs
parents:
diff changeset
   102
					}
hgs
parents:
diff changeset
   103
				} while (match && stringIndex >= 0);
hgs
parents:
diff changeset
   104
				// If string was not found, resets index and skips according
hgs
parents:
diff changeset
   105
				// to the shift table
hgs
parents:
diff changeset
   106
				if (stringIndex < 0) {
hgs
parents:
diff changeset
   107
					found = true;
hgs
parents:
diff changeset
   108
					// Checks the previous character if match beginning is set
hgs
parents:
diff changeset
   109
					if ((flags & SourceParser.MATCH_WORD_BEGINNING) != 0) {
hgs
parents:
diff changeset
   110
						if ((searchIndex > 0)
hgs
parents:
diff changeset
   111
								&& isPartOfWord(source.getChar(searchIndex - 1))) {
hgs
parents:
diff changeset
   112
							found = false;
hgs
parents:
diff changeset
   113
						}
hgs
parents:
diff changeset
   114
					}
hgs
parents:
diff changeset
   115
					// Checks the character after data if match end is set
hgs
parents:
diff changeset
   116
					if (found && ((flags & SourceParser.MATCH_WORD_END) != 0)) {
hgs
parents:
diff changeset
   117
						if (((searchIndex + searchString.length()) < source
hgs
parents:
diff changeset
   118
								.getLength())
hgs
parents:
diff changeset
   119
								&& isPartOfWord(source.getChar(searchIndex
hgs
parents:
diff changeset
   120
										+ searchString.length()))) {
hgs
parents:
diff changeset
   121
							found = false;
hgs
parents:
diff changeset
   122
						}
hgs
parents:
diff changeset
   123
					}
hgs
parents:
diff changeset
   124
				}
hgs
parents:
diff changeset
   125
				if (!found) {
hgs
parents:
diff changeset
   126
					int diff = searchString.length() - 1 - stringIndex;
hgs
parents:
diff changeset
   127
					stringIndex = searchString.length() - 1;
hgs
parents:
diff changeset
   128
					int skip;
hgs
parents:
diff changeset
   129
hgs
parents:
diff changeset
   130
					if (dataChar > badCharacterShifts.length - 1) {
hgs
parents:
diff changeset
   131
						skip = 1;
hgs
parents:
diff changeset
   132
					} else {
hgs
parents:
diff changeset
   133
						skip = badCharacterShifts[dataChar] - diff;
hgs
parents:
diff changeset
   134
						if (skip <= 0) {
hgs
parents:
diff changeset
   135
							skip = 1;
hgs
parents:
diff changeset
   136
						}
hgs
parents:
diff changeset
   137
					}
hgs
parents:
diff changeset
   138
hgs
parents:
diff changeset
   139
					searchIndex += skip;
hgs
parents:
diff changeset
   140
					skipExcludedArea();
hgs
parents:
diff changeset
   141
				}
hgs
parents:
diff changeset
   142
			}
hgs
parents:
diff changeset
   143
			if (!found) {
hgs
parents:
diff changeset
   144
				searchIndex = -1;
hgs
parents:
diff changeset
   145
			}
hgs
parents:
diff changeset
   146
		} catch (SourceParserException e) {
hgs
parents:
diff changeset
   147
			searchIndex = -1;
hgs
parents:
diff changeset
   148
		}
hgs
parents:
diff changeset
   149
		int ret = searchIndex;
hgs
parents:
diff changeset
   150
		if (searchIndex != -1) {
hgs
parents:
diff changeset
   151
			searchIndex += searchString.length();
hgs
parents:
diff changeset
   152
		}
hgs
parents:
diff changeset
   153
		return ret;
hgs
parents:
diff changeset
   154
	}
hgs
parents:
diff changeset
   155
hgs
parents:
diff changeset
   156
	/**
hgs
parents:
diff changeset
   157
	 * Checks if the character is part of a word
hgs
parents:
diff changeset
   158
	 * 
hgs
parents:
diff changeset
   159
	 * @param c
hgs
parents:
diff changeset
   160
	 *            the character to be checked
hgs
parents:
diff changeset
   161
	 * @return true if part of word
hgs
parents:
diff changeset
   162
	 */
hgs
parents:
diff changeset
   163
	private boolean isPartOfWord(char c) {
hgs
parents:
diff changeset
   164
		return Character.isLetterOrDigit(c) || c == '_';
hgs
parents:
diff changeset
   165
	}
hgs
parents:
diff changeset
   166
hgs
parents:
diff changeset
   167
	/*
hgs
parents:
diff changeset
   168
	 * (non-Javadoc)
hgs
parents:
diff changeset
   169
	 * 
hgs
parents:
diff changeset
   170
	 * @see com.nokia.tracecompiler.source.SourceSearch#findAll(java.util.List)
hgs
parents:
diff changeset
   171
	 */
hgs
parents:
diff changeset
   172
	@Override
hgs
parents:
diff changeset
   173
	public void findAll(List<Integer> list) throws SourceParserException {
hgs
parents:
diff changeset
   174
		resetSearch(0, -1);
hgs
parents:
diff changeset
   175
		int index;
hgs
parents:
diff changeset
   176
		do {
hgs
parents:
diff changeset
   177
			index = findNext();
hgs
parents:
diff changeset
   178
			if (index > 0) {
hgs
parents:
diff changeset
   179
				list.add(new Integer(index));
hgs
parents:
diff changeset
   180
			}
hgs
parents:
diff changeset
   181
		} while (index > 0);
hgs
parents:
diff changeset
   182
	}
hgs
parents:
diff changeset
   183
hgs
parents:
diff changeset
   184
	/**
hgs
parents:
diff changeset
   185
	 * Changes the search string
hgs
parents:
diff changeset
   186
	 * 
hgs
parents:
diff changeset
   187
	 * @param searchString
hgs
parents:
diff changeset
   188
	 *            the string to be searched
hgs
parents:
diff changeset
   189
	 */
hgs
parents:
diff changeset
   190
	public void setSearchString(String searchString) {
hgs
parents:
diff changeset
   191
		this.searchString = searchString;
hgs
parents:
diff changeset
   192
		int length = searchString.length();
hgs
parents:
diff changeset
   193
		// Elements not found in the string get the maximum shift distance
hgs
parents:
diff changeset
   194
		for (int i = 0; i < badCharacterShifts.length; i++) {
hgs
parents:
diff changeset
   195
			badCharacterShifts[i] = searchString.length();
hgs
parents:
diff changeset
   196
		}
hgs
parents:
diff changeset
   197
		// Characters of the search string are mapped into the
hgs
parents:
diff changeset
   198
		// shift distances array. If a character is found multiple
hgs
parents:
diff changeset
   199
		// times, the smallest shitft distance is stored
hgs
parents:
diff changeset
   200
		for (int i = 0; i < searchString.length() - 1; i++) {
hgs
parents:
diff changeset
   201
			if ((flags & SourceParser.IGNORE_CASE) != 0) {
hgs
parents:
diff changeset
   202
				badCharacterShifts[Character
hgs
parents:
diff changeset
   203
						.toLowerCase(searchString.charAt(i))
hgs
parents:
diff changeset
   204
						& BAD_CHARACTER_MASK] = length - i - 1;
hgs
parents:
diff changeset
   205
hgs
parents:
diff changeset
   206
			} else {
hgs
parents:
diff changeset
   207
				badCharacterShifts[searchString.charAt(i) & BAD_CHARACTER_MASK] = length
hgs
parents:
diff changeset
   208
						- i - 1;
hgs
parents:
diff changeset
   209
			}
hgs
parents:
diff changeset
   210
		}
hgs
parents:
diff changeset
   211
	}
hgs
parents:
diff changeset
   212
hgs
parents:
diff changeset
   213
	/**
hgs
parents:
diff changeset
   214
	 * Returns the search string
hgs
parents:
diff changeset
   215
	 * 
hgs
parents:
diff changeset
   216
	 * @return the string
hgs
parents:
diff changeset
   217
	 */
hgs
parents:
diff changeset
   218
	public String getSearchString() {
hgs
parents:
diff changeset
   219
		return searchString;
hgs
parents:
diff changeset
   220
	}
hgs
parents:
diff changeset
   221
hgs
parents:
diff changeset
   222
	/**
hgs
parents:
diff changeset
   223
	 * Checks if the given string matches the search string
hgs
parents:
diff changeset
   224
	 * 
hgs
parents:
diff changeset
   225
	 * @param string
hgs
parents:
diff changeset
   226
	 *            the string
hgs
parents:
diff changeset
   227
	 * @return true if they match
hgs
parents:
diff changeset
   228
	 */
hgs
parents:
diff changeset
   229
	public boolean isSearchStringMatch(String string) {
hgs
parents:
diff changeset
   230
		int index = 0;
hgs
parents:
diff changeset
   231
		boolean match = true;
hgs
parents:
diff changeset
   232
		while (index < string.length() && match) {
hgs
parents:
diff changeset
   233
			char dataChar = string.charAt(index);
hgs
parents:
diff changeset
   234
			char searchChar = searchString.charAt(index);
hgs
parents:
diff changeset
   235
			if ((flags & SourceParser.IGNORE_CASE) != 0) {
hgs
parents:
diff changeset
   236
				searchChar = Character.toLowerCase(searchChar);
hgs
parents:
diff changeset
   237
				dataChar = Character.toLowerCase(dataChar);
hgs
parents:
diff changeset
   238
			}
hgs
parents:
diff changeset
   239
			if (searchChar == '?' || searchChar == dataChar) {
hgs
parents:
diff changeset
   240
				index++;
hgs
parents:
diff changeset
   241
			} else {
hgs
parents:
diff changeset
   242
				match = false;
hgs
parents:
diff changeset
   243
			}
hgs
parents:
diff changeset
   244
		}
hgs
parents:
diff changeset
   245
		return match;
hgs
parents:
diff changeset
   246
	}
hgs
parents:
diff changeset
   247
hgs
parents:
diff changeset
   248
	/**
hgs
parents:
diff changeset
   249
	 * Sets the user variable associated with this searcher
hgs
parents:
diff changeset
   250
	 * 
hgs
parents:
diff changeset
   251
	 * @param data
hgs
parents:
diff changeset
   252
	 *            the variable
hgs
parents:
diff changeset
   253
	 */
hgs
parents:
diff changeset
   254
	public void setSearchData(Object data) {
hgs
parents:
diff changeset
   255
		searchData = data;
hgs
parents:
diff changeset
   256
	}
hgs
parents:
diff changeset
   257
hgs
parents:
diff changeset
   258
	/**
hgs
parents:
diff changeset
   259
	 * Gets the user variable associated with this searcher
hgs
parents:
diff changeset
   260
	 * 
hgs
parents:
diff changeset
   261
	 * @return the variable
hgs
parents:
diff changeset
   262
	 */
hgs
parents:
diff changeset
   263
	public Object getSearchData() {
hgs
parents:
diff changeset
   264
		return searchData;
hgs
parents:
diff changeset
   265
	}
hgs
parents:
diff changeset
   266
hgs
parents:
diff changeset
   267
}