summaryrefslogtreecommitdiffstats
path: root/extensions/universalchardet/src/base/nsSJISProber.h
diff options
context:
space:
mode:
Diffstat (limited to 'extensions/universalchardet/src/base/nsSJISProber.h')
-rw-r--r--extensions/universalchardet/src/base/nsSJISProber.h44
1 files changed, 44 insertions, 0 deletions
diff --git a/extensions/universalchardet/src/base/nsSJISProber.h b/extensions/universalchardet/src/base/nsSJISProber.h
new file mode 100644
index 000000000..6044fae87
--- /dev/null
+++ b/extensions/universalchardet/src/base/nsSJISProber.h
@@ -0,0 +1,44 @@
+/* -*- Mode: C; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
+/* This Source Code Form is subject to the terms of the Mozilla Public
+ * License, v. 2.0. If a copy of the MPL was not distributed with this
+ * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
+
+// for S-JIS encoding, obeserve characteristic:
+// 1, kana character (or hankaku?) often have hight frequency of appereance
+// 2, kana character often exist in group
+// 3, certain combination of kana is never used in japanese language
+
+#ifndef nsSJISProber_h__
+#define nsSJISProber_h__
+
+#include "nsCharSetProber.h"
+#include "nsCodingStateMachine.h"
+#include "JpCntx.h"
+#include "CharDistribution.h"
+
+
+class nsSJISProber: public nsCharSetProber {
+public:
+ nsSJISProber()
+ {mCodingSM = new nsCodingStateMachine(&SJISSMModel);
+ Reset();}
+ virtual ~nsSJISProber(void){delete mCodingSM;}
+ nsProbingState HandleData(const char* aBuf, uint32_t aLen);
+ const char* GetCharSetName() {return "Shift_JIS";}
+ nsProbingState GetState(void) {return mState;}
+ void Reset(void);
+ float GetConfidence(void);
+
+protected:
+ nsCodingStateMachine* mCodingSM;
+ nsProbingState mState;
+
+ SJISContextAnalysis mContextAnalyser;
+ SJISDistributionAnalysis mDistributionAnalyser;
+
+ char mLastChar[2];
+};
+
+
+#endif /* nsSJISProber_h__ */
+