--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/bintools/rcomp/inc/UNICODE_COMPRESSOR.H Mon May 10 19:54:49 2010 +0100
@@ -0,0 +1,203 @@
+/*
+* Copyright (c) 2001-2009 Nokia Corporation and/or its subsidiary(-ies).
+* All rights reserved.
+* This component and the accompanying materials are made available
+* under the terms of the License "Eclipse Public License v1.0"
+* which accompanies this distribution, and is available
+* at the URL "http://www.eclipse.org/legal/epl-v10.html".
+*
+* Initial Contributors:
+* Nokia Corporation - initial contribution.
+*
+* Contributors:
+*
+* Description:
+* the API to the Unicode compressor
+*
+*/
+
+
+#include "wide.h"
+
+
+extern void CompressUnicode(unsigned char* aOutputBuffer, int& aOutputLength, int aMaximumOutputLength, const UTF16* aInputBuffer, int aInputLength);
+
+// the Symbian things that the Symbian Unicode-compression classes use
+
+#define IMPORT_C
+#define EXPORT_C
+#ifdef __TOOLS2__ // If TOOLS2 defined, use the definition of NULL as supplied in stddef.h
+#include <stddef.h>
+#else
+#define NULL 0
+#endif // !__TOOLS2__
+#define TRUE true
+#define FALSE false
+typedef unsigned char TUint8;
+typedef unsigned short TUint16;
+typedef unsigned long TUint32;
+typedef unsigned int TUint;
+typedef int TInt;
+typedef bool TBool;
+const TInt KMaxTInt = 0x7fffffff;
+const TInt KErrNotFound = -1;
+class RWriteStream;
+extern void Panic(int aCode);
+
+// the rest of the contents of this file is a selective copy of base\store\inc\S32UCMP.H
+
+class TUnicodeCompressionState
+ {
+ public:
+ TUnicodeCompressionState();
+ void Reset();
+ static TInt StaticWindowIndex(TUint16 aCode);
+ static TInt DynamicWindowOffsetIndex(TUint16 aCode);
+ static TUint32 DynamicWindowBase(TInt aOffsetIndex);
+ static TBool EncodeAsIs(TUint16 aCode);
+
+ enum TPanic
+ {
+ EUnhandledByte, // expander code fails to handle all possible byte codes
+ ENotUnicode, // expander can't handle Unicode values outside range 0x0..0x10FFFF;
+ // that is, 16-bit codes plus 32-bit codes that can be expressed using
+ // 16-bit surrogates
+ EOutputBufferOverflow // output buffer is not big enough
+ ,ECannotUseStreams // not in the file from which this file is derived (i.e. not in base\store\inc\S32UCMP.H)
+ };
+
+ static void Panic(TPanic aPanic);
+
+ protected:
+
+ enum
+ {
+ EStaticWindows = 8,
+ EDynamicWindows = 8,
+ ESpecialBases = 7
+ };
+
+ TBool iUnicodeMode; // TRUE if in Unicode mode as opposed to single-byte mode
+ TUint32 iActiveWindowBase; // base of the active window - bases are 32-bit because they
+ // can be set to the surrogate area, which represents codes
+ // from 0x00010000 to 0x0010FFFF - planes 1-16 of ISO-10646.
+ static const TUint32 iStaticWindow[EStaticWindows]; // bases of the static windows
+ static const TUint32 iDynamicWindowDefault[EDynamicWindows]; // default bases of the dynamic windows
+ static const TUint16 iSpecialBase[ESpecialBases]; // bases for window offsets F9..FF
+
+ TUint32 iDynamicWindow[EDynamicWindows]; // bases of the dynamic windows
+ TInt iUnicodeWords; // Unicode words processed; read by compressor, written by expander
+ TInt iMaxUnicodeWords; // maximum number of Unicode words to read or write
+ TInt iCompressedBytes; // compressed bytes processed: read by expander, written by compressor
+ TInt iMaxCompressedBytes; // maximum number of compressed bytes to read or write
+ };
+
+class MUnicodeSource
+ {
+ public:
+ virtual TUint16 ReadUnicodeValueL() = 0;
+ };
+
+// A class to read Unicode values directly from memory.
+class TMemoryUnicodeSource: public MUnicodeSource
+ {
+ public:
+ inline TMemoryUnicodeSource(const UTF16* aPtr);
+ inline TUint16 ReadUnicodeValueL();
+
+ private:
+ const UTF16* iPtr;
+ };
+
+/**
+A class to hold functions to compress text using the Standard Compression Scheme for Unicode.
+
+A note on error handling and leaving.
+
+Although all the public functions except the constructor can leave, it is possible to guarantee success: that is,
+guarantee that a call will not leave, and that compression will be completed. To do this, (i) supply a MUnicodeSource
+object with a non-leaving ReadUnicodeValueL function, such as a TMemoryUnicodeSource; (ii) write output to a
+RWriteStream with a non-leaving WriteL function, or to a buffer that you already know to be big enough, which can be
+found out using CompressedSizeL.
+
+This guarantee of success is particularly useful when compressing from one memory buffer to another.
+*/
+class TUnicodeCompressor: public TUnicodeCompressionState
+ {
+ public:
+ IMPORT_C TUnicodeCompressor();
+ IMPORT_C void CompressL(TUint8* aOutput,MUnicodeSource& aInput,
+ TInt aMaxOutputBytes = KMaxTInt,TInt aMaxInputWords = KMaxTInt,
+ TInt* aOutputBytes = NULL,TInt* aInputWords = NULL);
+ IMPORT_C TInt FlushL(TUint8* aOutput,TInt aMaxOutputBytes,TInt& aOutputBytes);
+ IMPORT_C static TInt CompressedSizeL(MUnicodeSource& aInput,TInt aInputWords);
+
+ private:
+ // A structure to store a character and its treatment code
+ struct TAction
+ {
+ // Treatment codes: static and dynamic window numbers, plain ASCII or plain Unicode
+ enum
+ {
+ EPlainUnicode = -2, // character cannot be expressed as ASCII or using static or dynamic windows
+ EPlainASCII = -1, // character can be emitted as an ASCII code
+ EFirstDynamic = 0, // values 0..255 are for dynamic windows with offsets at these places in the offset table
+ ELastDynamic = 255,
+ EFirstStatic = 256, // values 256..263 are for static windows 0..7
+ ELastStatic = 263
+ };
+
+ inline TAction();
+ TAction(TUint16 aCode);
+
+ TUint16 iCode; // Unicode value of the character
+ TInt iTreatment; // treatment code: see above
+ };
+
+ void DoCompressL(RWriteStream* aOutputStream,TUint8* aOutputPointer,MUnicodeSource* aInput,
+ TInt aMaxCompressedBytes,TInt aMaxUnicodeWords,
+ TInt* aCompressedBytes,TInt* aUnicodeWords);
+ void FlushInputBufferL();
+ void FlushOutputBufferL();
+ void WriteRunL();
+ void WriteCharacter(const TAction& aAction);
+ void WriteSCharacter(const TAction& aAction);
+ void WriteUCharacter(TUint16 aCode);
+ void WriteByte(TUint aByte);
+ void WriteCharacterFromBuffer();
+ void SelectTreatment(TInt aTreatment);
+
+ enum
+ {
+ EMaxInputBufferSize = 4,
+ EMaxOutputBufferSize = EMaxInputBufferSize * 3 // no Unicode character can be encoded as more than three bytes
+ };
+ TAction iInputBuffer[EMaxInputBufferSize]; // circular buffer; queue of Unicode characters to be processed
+ TInt iInputBufferStart; // position of first Unicode character to be processed
+ TInt iInputBufferSize; // characters in the input buffer
+ TUint8 iOutputBuffer[EMaxOutputBufferSize]; // circular buffer; queue of compressed bytes to be output
+ TInt iOutputBufferStart; // position of first compressed byte to be output
+ TInt iOutputBufferSize; // characters in the output buffer
+ TInt iDynamicWindowIndex; // index of the current dynamic window
+ RWriteStream* iOutputStream; // if non-null, output is to this stream
+ TUint8* iOutputPointer; // if non-null, output is to memory
+ MUnicodeSource* iInput; // input object
+ };
+
+// inline functions start here
+inline TMemoryUnicodeSource::TMemoryUnicodeSource(const UTF16* aPtr):
+ iPtr(aPtr)
+ {
+ }
+
+inline TUint16 TMemoryUnicodeSource::ReadUnicodeValueL()
+ {
+ return *iPtr++;
+ }
+
+inline TUnicodeCompressor::TAction::TAction():
+ iCode(0),
+ iTreatment(EPlainUnicode)
+ {
+ }
+