Thu, 22 Jan 2015 13:21:57 +0100
Incorporate requested changes from Mozilla in review:
https://bugzilla.mozilla.org/show_bug.cgi?id=1123480#c6
michael@0 | 1 | /* -*- Mode: C; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 2 -*- */ |
michael@0 | 2 | /* This Source Code Form is subject to the terms of the Mozilla Public |
michael@0 | 3 | * License, v. 2.0. If a copy of the MPL was not distributed with this |
michael@0 | 4 | * file, You can obtain one at http://mozilla.org/MPL/2.0/. */ |
michael@0 | 5 | |
michael@0 | 6 | // for S-JIS encoding, obeserve characteristic: |
michael@0 | 7 | // 1, kana character (or hankaku?) often have hight frequency of appereance |
michael@0 | 8 | // 2, kana character often exist in group |
michael@0 | 9 | // 3, certain combination of kana is never used in japanese language |
michael@0 | 10 | |
michael@0 | 11 | #ifndef nsEUCJPProber_h__ |
michael@0 | 12 | #define nsEUCJPProber_h__ |
michael@0 | 13 | |
michael@0 | 14 | #include "nsCharSetProber.h" |
michael@0 | 15 | #include "nsCodingStateMachine.h" |
michael@0 | 16 | #include "JpCntx.h" |
michael@0 | 17 | #include "CharDistribution.h" |
michael@0 | 18 | |
michael@0 | 19 | class nsEUCJPProber: public nsCharSetProber { |
michael@0 | 20 | public: |
michael@0 | 21 | nsEUCJPProber(bool aIsPreferredLanguage) |
michael@0 | 22 | :mIsPreferredLanguage(aIsPreferredLanguage) |
michael@0 | 23 | {mCodingSM = new nsCodingStateMachine(&EUCJPSMModel); |
michael@0 | 24 | Reset();} |
michael@0 | 25 | virtual ~nsEUCJPProber(void){delete mCodingSM;} |
michael@0 | 26 | nsProbingState HandleData(const char* aBuf, uint32_t aLen); |
michael@0 | 27 | const char* GetCharSetName() {return "EUC-JP";} |
michael@0 | 28 | nsProbingState GetState(void) {return mState;} |
michael@0 | 29 | void Reset(void); |
michael@0 | 30 | float GetConfidence(void); |
michael@0 | 31 | |
michael@0 | 32 | protected: |
michael@0 | 33 | nsCodingStateMachine* mCodingSM; |
michael@0 | 34 | nsProbingState mState; |
michael@0 | 35 | |
michael@0 | 36 | EUCJPContextAnalysis mContextAnalyser; |
michael@0 | 37 | EUCJPDistributionAnalysis mDistributionAnalyser; |
michael@0 | 38 | |
michael@0 | 39 | char mLastChar[2]; |
michael@0 | 40 | bool mIsPreferredLanguage; |
michael@0 | 41 | }; |
michael@0 | 42 | |
michael@0 | 43 | |
michael@0 | 44 | #endif /* nsEUCJPProber_h__ */ |
michael@0 | 45 |