2002-11-09 17:05:47 +00:00
|
|
|
|
/*
|
|
|
|
|
* charset=UTF-8
|
|
|
|
|
* vim600: encoding=utf-8
|
|
|
|
|
*/
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* "streamable kanji code filter and converter"
|
|
|
|
|
*
|
|
|
|
|
* Copyright (c) 1998,1999,2000,2001 HappySize, Inc. All rights reserved.
|
|
|
|
|
*
|
|
|
|
|
* This software is released under the GNU Lesser General Public License.
|
2001-05-07 13:58:00 +00:00
|
|
|
|
* (Version 2.1, February 1999)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
* Please read the following detail of the licence (in japanese).
|
|
|
|
|
*
|
|
|
|
|
* ◆使用許諾条件◆
|
|
|
|
|
*
|
|
|
|
|
* このソフトウェアは株式会社ハッピーサイズによって開発されました。株式会社ハッ
|
|
|
|
|
* ピーサイズは、著作権法および万国著作権条約の定めにより、このソフトウェアに関
|
|
|
|
|
* するすべての権利を留保する権利を持ち、ここに行使します。株式会社ハッピーサイ
|
|
|
|
|
* ズは以下に明記した条件に従って、このソフトウェアを使用する排他的ではない権利
|
|
|
|
|
* をお客様に許諾します。何人たりとも、以下の条件に反してこのソフトウェアを使用
|
|
|
|
|
* することはできません。
|
|
|
|
|
*
|
|
|
|
|
* このソフトウェアを「GNU Lesser General Public License (Version 2.1, February
|
|
|
|
|
* 1999)」に示された条件で使用することを、全ての方に許諾します。「GNU Lesser
|
|
|
|
|
* General Public License」を満たさない使用には、株式会社ハッピーサイズから書面
|
|
|
|
|
* による許諾を得る必要があります。
|
|
|
|
|
*
|
|
|
|
|
* 「GNU Lesser General Public License」の全文は以下のウェブページから取得でき
|
|
|
|
|
* ます。「GNU Lesser General Public License」とは、これまでLibrary General
|
|
|
|
|
* Public Licenseと呼ばれていたものです。
|
|
|
|
|
* http://www.gnu.org/ --- GNUウェブサイト
|
|
|
|
|
* http://www.gnu.org/copyleft/lesser.html --- ライセンス文面
|
|
|
|
|
* このライセンスの内容がわからない方、守れない方には使用を許諾しません。
|
|
|
|
|
*
|
|
|
|
|
* しかしながら、当社とGNUプロジェクトとの特定の関係を示唆または主張するもので
|
|
|
|
|
* はありません。
|
|
|
|
|
*
|
|
|
|
|
* ◆保証内容◆
|
|
|
|
|
*
|
|
|
|
|
* このソフトウェアは、期待された動作・機能・性能を持つことを目標として設計され
|
|
|
|
|
* 開発されていますが、これを保証するものではありません。このソフトウェアは「こ
|
|
|
|
|
* のまま」の状態で提供されており、たとえばこのソフトウェアの有用性ないし特定の
|
|
|
|
|
* 目的に合致することといった、何らかの保証内容が、明示されたり暗黙に示されてい
|
|
|
|
|
* る場合であっても、その保証は無効です。このソフトウェアを使用した結果ないし使
|
|
|
|
|
* 用しなかった結果によって、直接あるいは間接に受けた身体的な傷害、財産上の損害
|
|
|
|
|
* 、データの損失あるいはその他の全ての損害については、その損害の可能性が使用者
|
|
|
|
|
* 、当社あるいは第三者によって警告されていた場合であっても、当社はその損害の賠
|
|
|
|
|
* 償および補填を行いません。この規定は他の全ての、書面上または書面に無い保証・
|
|
|
|
|
* 契約・規定に優先します。
|
|
|
|
|
*
|
|
|
|
|
* ◆著作権者の連絡先および使用条件についての問い合わせ先◆
|
|
|
|
|
*
|
2001-05-07 13:58:00 +00:00
|
|
|
|
* 〒102-0073
|
|
|
|
|
* 東京都千代田区九段北1-13-5日本地所第一ビル4F
|
2001-05-01 01:52:55 +00:00
|
|
|
|
* 株式会社ハッピーサイズ
|
2001-05-07 13:58:00 +00:00
|
|
|
|
* Phone: 03-3512-3655, Fax: 03-3512-3656
|
|
|
|
|
* Email: sales@happysize.co.jp
|
|
|
|
|
* Web: http://happysize.com/
|
2001-05-01 01:52:55 +00:00
|
|
|
|
*
|
|
|
|
|
* ◆著者◆
|
|
|
|
|
*
|
|
|
|
|
* 金本 茂 <sgk@happysize.co.jp>
|
|
|
|
|
*
|
|
|
|
|
* ◆履歴◆
|
|
|
|
|
*
|
|
|
|
|
* 1998/11/10 sgk implementation in C++
|
|
|
|
|
* 1999/4/25 sgk Cで書きなおし。
|
|
|
|
|
* 1999/4/26 sgk 入力フィルタを実装。漢字コードを推定しながらフィルタを追加。
|
|
|
|
|
* 1999/6/?? Unicodeサポート。
|
|
|
|
|
* 1999/6/22 sgk ライセンスをLGPLに変更。
|
|
|
|
|
*
|
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* Unicode support
|
|
|
|
|
*
|
|
|
|
|
* Portions copyright (c) 1999,2000,2001 by the PHP3 internationalization team.
|
|
|
|
|
* All rights reserved.
|
|
|
|
|
*
|
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
/* $Id$ */
|
|
|
|
|
|
2002-04-30 12:00:42 +00:00
|
|
|
|
|
|
|
|
|
#ifdef HAVE_CONFIG_H
|
|
|
|
|
#include "config.h"
|
|
|
|
|
#endif
|
|
|
|
|
|
2002-02-23 00:00:15 +00:00
|
|
|
|
#include "php.h"
|
2002-04-10 12:47:41 +00:00
|
|
|
|
#include "php_globals.h"
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-10-06 09:36:26 +00:00
|
|
|
|
#ifdef HAVE_MBSTRING
|
|
|
|
|
|
2001-05-01 01:52:55 +00:00
|
|
|
|
#include <stdlib.h>
|
|
|
|
|
#include "mbfilter.h"
|
2002-04-30 12:00:42 +00:00
|
|
|
|
|
|
|
|
|
#if defined(HAVE_MBSTR_JA)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
#include "mbfilter_ja.h"
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif
|
|
|
|
|
#if defined(HAVE_MBSTR_CN)
|
|
|
|
|
#include "mbfilter_cn.h"
|
|
|
|
|
#endif
|
|
|
|
|
#if defined(HAVE_MBSTR_TW)
|
|
|
|
|
#include "mbfilter_tw.h"
|
|
|
|
|
#endif
|
|
|
|
|
#if defined(HAVE_MBSTR_KR)
|
|
|
|
|
#include "mbfilter_kr.h"
|
|
|
|
|
#endif
|
2002-08-14 06:38:07 +00:00
|
|
|
|
#if defined(HAVE_MBSTR_KR)
|
2002-05-21 07:00:34 +00:00
|
|
|
|
#include "mbfilter_ru.h"
|
|
|
|
|
#endif
|
2002-04-30 12:00:42 +00:00
|
|
|
|
|
2001-05-01 01:52:55 +00:00
|
|
|
|
#include "zend.h"
|
|
|
|
|
|
2001-06-11 15:31:58 +00:00
|
|
|
|
#ifdef PHP_WIN32
|
|
|
|
|
#include "win95nt.h"
|
|
|
|
|
#endif
|
|
|
|
|
|
2001-05-01 01:52:55 +00:00
|
|
|
|
#define mbfl_malloc emalloc
|
|
|
|
|
#define mbfl_realloc erealloc
|
|
|
|
|
#define mbfl_calloc ecalloc
|
|
|
|
|
#define mbfl_free efree
|
|
|
|
|
|
|
|
|
|
#define mbfl_pmalloc malloc
|
|
|
|
|
#define mbfl_prealloc realloc
|
|
|
|
|
#define mbfl_pfree free
|
|
|
|
|
|
2002-03-07 17:28:50 +00:00
|
|
|
|
#include "unicode_table.h"
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
/* language structure */
|
2002-11-12 19:24:45 +00:00
|
|
|
|
static const mbfl_language mbfl_language_neutral = {
|
|
|
|
|
mbfl_no_language_neutral,
|
|
|
|
|
"neutral",
|
|
|
|
|
"neutral",
|
|
|
|
|
NULL,
|
|
|
|
|
mbfl_no_encoding_utf8,
|
|
|
|
|
mbfl_no_encoding_base64,
|
|
|
|
|
mbfl_no_encoding_base64
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_language_uni_aliases[] = {"universal", NULL};
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_language mbfl_language_uni = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_language_uni,
|
|
|
|
|
"uni",
|
|
|
|
|
"uni",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_language_uni_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf8,
|
|
|
|
|
mbfl_no_encoding_base64,
|
|
|
|
|
mbfl_no_encoding_base64
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_language mbfl_language_japanese = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_language_japanese,
|
|
|
|
|
"Japanese",
|
|
|
|
|
"ja",
|
|
|
|
|
NULL,
|
|
|
|
|
mbfl_no_encoding_2022jp,
|
|
|
|
|
mbfl_no_encoding_base64,
|
|
|
|
|
mbfl_no_encoding_7bit
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_language mbfl_language_korean = {
|
2002-05-12 13:06:13 +00:00
|
|
|
|
mbfl_no_language_korean,
|
|
|
|
|
"Korean",
|
|
|
|
|
"ko",
|
|
|
|
|
NULL,
|
|
|
|
|
mbfl_no_encoding_2022kr,
|
|
|
|
|
mbfl_no_encoding_base64,
|
|
|
|
|
mbfl_no_encoding_7bit
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_language mbfl_language_english = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_language_english,
|
|
|
|
|
"English",
|
|
|
|
|
"en",
|
|
|
|
|
NULL,
|
|
|
|
|
mbfl_no_encoding_8859_1,
|
|
|
|
|
mbfl_no_encoding_qprint,
|
|
|
|
|
mbfl_no_encoding_8bit
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const char *mbfl_language_german_aliases[] = {"Deutsch", NULL};
|
|
|
|
|
|
|
|
|
|
static const mbfl_language mbfl_language_german = {
|
2002-11-10 21:31:26 +00:00
|
|
|
|
mbfl_no_language_german,
|
2002-08-02 10:22:31 +00:00
|
|
|
|
"German",
|
|
|
|
|
"de",
|
|
|
|
|
(const char *(*)[])&mbfl_language_german_aliases,
|
|
|
|
|
mbfl_no_encoding_8859_15,
|
|
|
|
|
mbfl_no_encoding_qprint,
|
|
|
|
|
mbfl_no_encoding_8bit
|
|
|
|
|
};
|
|
|
|
|
|
2002-05-12 13:06:13 +00:00
|
|
|
|
static mbfl_language mbfl_language_simplified_chinese = {
|
|
|
|
|
mbfl_no_language_simplified_chinese,
|
|
|
|
|
"Simplified Chinese",
|
|
|
|
|
"zh-cn",
|
2002-04-30 12:00:42 +00:00
|
|
|
|
NULL,
|
2002-05-12 13:06:13 +00:00
|
|
|
|
mbfl_no_encoding_hz,
|
|
|
|
|
mbfl_no_encoding_base64,
|
|
|
|
|
mbfl_no_encoding_7bit
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static mbfl_language mbfl_language_traditional_chinese = {
|
|
|
|
|
mbfl_no_language_traditional_chinese,
|
|
|
|
|
"Traditional Chinese",
|
|
|
|
|
"zh-tw",
|
|
|
|
|
NULL,
|
2002-11-13 11:57:59 +00:00
|
|
|
|
mbfl_no_encoding_big5,
|
2002-04-30 12:00:42 +00:00
|
|
|
|
mbfl_no_encoding_base64,
|
2002-11-13 11:57:59 +00:00
|
|
|
|
mbfl_no_encoding_8bit
|
2002-04-30 12:00:42 +00:00
|
|
|
|
};
|
|
|
|
|
|
2002-05-21 07:00:34 +00:00
|
|
|
|
static mbfl_language mbfl_language_russian = {
|
|
|
|
|
mbfl_no_language_russian,
|
|
|
|
|
"Russian",
|
|
|
|
|
"ru",
|
|
|
|
|
NULL,
|
|
|
|
|
mbfl_no_encoding_koi8r,
|
|
|
|
|
mbfl_no_encoding_qprint,
|
|
|
|
|
mbfl_no_encoding_8bit
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_language *mbfl_language_ptr_table[] = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
&mbfl_language_uni,
|
|
|
|
|
&mbfl_language_japanese,
|
2002-05-12 13:06:13 +00:00
|
|
|
|
&mbfl_language_korean,
|
|
|
|
|
&mbfl_language_simplified_chinese,
|
|
|
|
|
&mbfl_language_traditional_chinese,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
&mbfl_language_english,
|
2002-08-02 10:22:31 +00:00
|
|
|
|
&mbfl_language_german,
|
2002-05-21 07:00:34 +00:00
|
|
|
|
&mbfl_language_russian,
|
2002-11-12 19:44:56 +00:00
|
|
|
|
&mbfl_language_neutral,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/* encoding byte width table */
|
|
|
|
|
static const unsigned char mblen_table_utf8[] = {
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3,
|
|
|
|
|
4, 4, 4, 4, 4, 4, 4, 4, 5, 5, 5, 5, 6, 6, 1, 1
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const unsigned char mblen_table_eucjp[] = { /* 0xA1-0xFE */
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 3,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const unsigned char mblen_table_sjis[] = { /* 0x80-0x9f,0xE0-0xFF */
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
|
2002-04-30 12:00:42 +00:00
|
|
|
|
static const unsigned char mblen_table_euccn[] = { /* 0xA1-0xFE */
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const unsigned char mblen_table_cp936[] = { /* 0x81-0xFE */
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const unsigned char mblen_table_euctw[] = { /* 0xA1-0xFE */
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 4, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const unsigned char mblen_table_big5[] = { /* 0x81-0xFE */
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
static const unsigned char mblen_table_euckr[] = { /* 0xA1-0xFE */
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const unsigned char mblen_table_uhc[] = { /* 0x81-0xFE */
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
|
|
|
|
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-04 14:20:11 +00:00
|
|
|
|
static const unsigned char mblen_table_html[] = { /* 0x00, 0x80 - 0xFF, only valid for numeric entities */
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
|
|
|
|
6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6,
|
|
|
|
|
6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6,
|
|
|
|
|
6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6,
|
|
|
|
|
6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6,
|
|
|
|
|
6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6,
|
|
|
|
|
6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6,
|
|
|
|
|
6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6,
|
|
|
|
|
6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6, 6
|
|
|
|
|
};
|
|
|
|
|
|
2001-05-01 01:52:55 +00:00
|
|
|
|
/* encoding structure */
|
|
|
|
|
static const char *mbfl_encoding_pass_aliases[] = {"none", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_pass = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_pass,
|
|
|
|
|
"pass",
|
|
|
|
|
NULL,
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_pass_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
0
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_auto_aliases[] = {"unknown", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_auto = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_auto,
|
|
|
|
|
"auto",
|
|
|
|
|
NULL,
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_auto_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
0
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
"wchar",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_WCS4BE
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_byte2be = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_byte2be,
|
|
|
|
|
"byte2be",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_byte2le = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_byte2le,
|
|
|
|
|
"byte2le",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_byte4be = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_byte4be,
|
|
|
|
|
"byte4be",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_byte4le = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_byte4le,
|
|
|
|
|
"byte4le",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_base64 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_base64,
|
|
|
|
|
"BASE64",
|
|
|
|
|
"BASE64",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_uuencode = {
|
2001-05-12 23:42:09 +00:00
|
|
|
|
mbfl_no_encoding_uuencode,
|
|
|
|
|
"UUENCODE",
|
|
|
|
|
"x-uuencode",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-04 14:20:11 +00:00
|
|
|
|
static const char *mbfl_encoding_html_ent_aliases[] = {"HTML", "html", NULL};
|
|
|
|
|
|
|
|
|
|
static const mbfl_encoding mbfl_encoding_html_ent = {
|
|
|
|
|
mbfl_no_encoding_html_ent,
|
|
|
|
|
"HTML-ENTITIES",
|
2002-08-04 20:50:53 +00:00
|
|
|
|
"US-ASCII",
|
2002-08-04 14:20:11 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_html_ent_aliases,
|
|
|
|
|
NULL, /* mblen_table_html, Do not use table instead calulate length based on entities actually used */
|
|
|
|
|
MBFL_ENCTYPE_HTML_ENT
|
|
|
|
|
};
|
|
|
|
|
|
2001-05-01 01:52:55 +00:00
|
|
|
|
static const char *mbfl_encoding_qprint_aliases[] = {"qprint", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_qprint = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_qprint,
|
|
|
|
|
"Quoted-Printable",
|
|
|
|
|
"Quoted-Printable",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_qprint_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_7bit = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_7bit,
|
|
|
|
|
"7bit",
|
|
|
|
|
"7bit",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_8bit = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8bit,
|
|
|
|
|
"8bit",
|
|
|
|
|
"8bit",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_ucs2_aliases[] = {"ISO-10646-UCS-2", "UCS2" , "UNICODE", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_ucs2 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_ucs2,
|
|
|
|
|
"UCS-2",
|
|
|
|
|
"UCS-2",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_ucs2_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_WCS2BE
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_ucs2be = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_ucs2be,
|
|
|
|
|
"UCS-2BE",
|
|
|
|
|
"UCS-2BE",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_WCS2BE
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_ucs2le = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_ucs2le,
|
|
|
|
|
"UCS-2LE",
|
|
|
|
|
"UCS-2LE",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_WCS2LE
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_ucs4_aliases[] = {"ISO-10646-UCS-4", "UCS4", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_ucs4 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_ucs4,
|
|
|
|
|
"UCS-4",
|
|
|
|
|
"UCS-4",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_ucs4_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_WCS4BE
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_ucs4be = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_ucs4be,
|
|
|
|
|
"UCS-4BE",
|
|
|
|
|
"UCS-4BE",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_WCS4BE
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_ucs4le = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_ucs4le,
|
|
|
|
|
"UCS-4LE",
|
|
|
|
|
"UCS-4LE",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_WCS4LE
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_utf32_aliases[] = {"utf32", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_utf32 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf32,
|
|
|
|
|
"UTF-32",
|
|
|
|
|
"UTF-32",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_utf32_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_WCS4BE
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_utf32be = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf32be,
|
|
|
|
|
"UTF-32BE",
|
|
|
|
|
"UTF-32BE",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_WCS4BE
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_utf32le = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf32le,
|
|
|
|
|
"UTF-32LE",
|
|
|
|
|
"UTF-32LE",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_WCS4LE
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_utf16_aliases[] = {"utf16", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_utf16 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf16,
|
|
|
|
|
"UTF-16",
|
|
|
|
|
"UTF-16",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_utf16_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_MWC2BE
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_utf16be = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf16be,
|
|
|
|
|
"UTF-16BE",
|
|
|
|
|
"UTF-16BE",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_MWC2BE
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_utf16le = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf16le,
|
|
|
|
|
"UTF-16LE",
|
|
|
|
|
"UTF-16LE",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_MWC2LE
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_utf8_aliases[] = {"utf8", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_utf8 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf8,
|
|
|
|
|
"UTF-8",
|
|
|
|
|
"UTF-8",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_utf8_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mblen_table_utf8,
|
|
|
|
|
MBFL_ENCTYPE_MBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_utf7_aliases[] = {"utf7", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_utf7 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf7,
|
|
|
|
|
"UTF-7",
|
|
|
|
|
"UTF-7",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_utf7_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_MBCS | MBFL_ENCTYPE_SHFTCODE
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_utf7imap = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf7imap,
|
|
|
|
|
"UTF7-IMAP",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_MBCS | MBFL_ENCTYPE_SHFTCODE
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-04 20:50:53 +00:00
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_ascii_aliases[] = {"ANSI_X3.4-1968", "iso-ir-6", "ANSI_X3.4-1986", "ISO_646.irv:1991", "US-ASCII", "ISO646-US", "us", "IBM367", "cp367", "csASCII", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_ascii = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_ascii,
|
|
|
|
|
"ASCII",
|
2002-08-04 20:50:53 +00:00
|
|
|
|
"US-ASCII", /* preferred MIME name */
|
|
|
|
|
(const char *(*)[])&mbfl_encoding_ascii_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#if defined(HAVE_MBSTR_JA)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
static const char *mbfl_encoding_euc_jp_aliases[] = {"EUC", "EUC_JP", "eucJP", "x-euc-jp", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_euc_jp = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_euc_jp,
|
|
|
|
|
"EUC-JP",
|
|
|
|
|
"EUC-JP",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_euc_jp_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mblen_table_eucjp,
|
|
|
|
|
MBFL_ENCTYPE_MBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_sjis_aliases[] = {"x-sjis", "SHIFT-JIS", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_sjis = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_sjis,
|
|
|
|
|
"SJIS",
|
|
|
|
|
"Shift_JIS",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_sjis_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mblen_table_sjis,
|
|
|
|
|
MBFL_ENCTYPE_MBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_eucjp_win_aliases[] = {"eucJP-open", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_eucjp_win = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_eucjp_win,
|
|
|
|
|
"eucJP-win",
|
|
|
|
|
"EUC-JP",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_eucjp_win_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mblen_table_eucjp,
|
|
|
|
|
MBFL_ENCTYPE_MBCS
|
|
|
|
|
};
|
|
|
|
|
|
2002-05-05 02:22:36 +00:00
|
|
|
|
static const char *mbfl_encoding_sjis_win_aliases[] = {"SJIS-open", "MS_Kanji", "Windows-31J", "CP932", NULL};
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_sjis_win = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_sjis_win,
|
|
|
|
|
"SJIS-win",
|
|
|
|
|
"Shift_JIS",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_sjis_win_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mblen_table_sjis,
|
|
|
|
|
MBFL_ENCTYPE_MBCS
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_jis = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_jis,
|
|
|
|
|
"JIS",
|
|
|
|
|
"ISO-2022-JP",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_MBCS | MBFL_ENCTYPE_SHFTCODE
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_2022jp = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_2022jp,
|
|
|
|
|
"ISO-2022-JP",
|
|
|
|
|
"ISO-2022-JP",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_MBCS | MBFL_ENCTYPE_SHFTCODE
|
|
|
|
|
};
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif /* HAVE_MBSTR_JA */
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
#if defined(HAVE_MBSTR_CN)
|
2002-05-29 09:15:28 +00:00
|
|
|
|
static const char *mbfl_encoding_euc_cn_aliases[] = {"CN-GB", "EUC_CN", "eucCN", "x-euc-cn", "gb2312", NULL};
|
2002-04-30 12:00:42 +00:00
|
|
|
|
|
|
|
|
|
static mbfl_encoding mbfl_encoding_euc_cn = {
|
|
|
|
|
mbfl_no_encoding_euc_cn,
|
|
|
|
|
"EUC-CN",
|
2002-05-08 12:33:44 +00:00
|
|
|
|
"CN-GB",
|
2002-04-30 12:00:42 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_euc_cn_aliases,
|
|
|
|
|
mblen_table_euccn,
|
|
|
|
|
MBFL_ENCTYPE_MBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_cp936_aliases[] = {"CP-936", NULL};
|
|
|
|
|
|
|
|
|
|
static mbfl_encoding mbfl_encoding_cp936 = {
|
|
|
|
|
mbfl_no_encoding_cp936,
|
|
|
|
|
"CP936",
|
|
|
|
|
"CP936",
|
|
|
|
|
(const char *(*)[])&mbfl_encoding_cp936_aliases,
|
|
|
|
|
mblen_table_cp936,
|
|
|
|
|
MBFL_ENCTYPE_MBCS
|
|
|
|
|
};
|
|
|
|
|
|
2002-05-12 13:06:13 +00:00
|
|
|
|
static mbfl_encoding mbfl_encoding_hz = {
|
|
|
|
|
mbfl_no_encoding_hz,
|
|
|
|
|
"HZ",
|
|
|
|
|
"HZ-GB-2312",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_MBCS | MBFL_ENCTYPE_SHFTCODE
|
|
|
|
|
};
|
|
|
|
|
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif /* HAVE_MBSTR_CN */
|
|
|
|
|
|
|
|
|
|
#if defined(HAVE_MBSTR_TW)
|
|
|
|
|
static const char *mbfl_encoding_euc_tw_aliases[] = {"EUC_TW", "eucTW", "x-euc-tw", NULL};
|
|
|
|
|
|
|
|
|
|
static mbfl_encoding mbfl_encoding_euc_tw = {
|
|
|
|
|
mbfl_no_encoding_euc_tw,
|
|
|
|
|
"EUC-TW",
|
|
|
|
|
"EUC-TW",
|
|
|
|
|
(const char *(*)[])&mbfl_encoding_euc_tw_aliases,
|
|
|
|
|
mblen_table_euctw,
|
|
|
|
|
MBFL_ENCTYPE_MBCS
|
|
|
|
|
};
|
|
|
|
|
|
2002-11-13 11:57:59 +00:00
|
|
|
|
static const char *mbfl_encoding_big5_aliases[] = {"CN-BIG5", "BIG-FIVE", "BIGFIVE", "CP950", NULL};
|
2002-04-30 12:00:42 +00:00
|
|
|
|
|
|
|
|
|
static mbfl_encoding mbfl_encoding_big5 = {
|
|
|
|
|
mbfl_no_encoding_big5,
|
|
|
|
|
"BIG-5",
|
2002-11-13 11:57:59 +00:00
|
|
|
|
"BIG5",
|
2002-04-30 12:00:42 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_big5_aliases,
|
|
|
|
|
mblen_table_big5,
|
|
|
|
|
MBFL_ENCTYPE_MBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
#endif /* HAVE_MBSTR_TW */
|
|
|
|
|
|
|
|
|
|
#if defined(HAVE_MBSTR_KR)
|
|
|
|
|
static const char *mbfl_encoding_euc_kr_aliases[] = {"EUC_KR", "eucKR", "x-euc-kr", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_euc_kr = {
|
2002-04-30 12:00:42 +00:00
|
|
|
|
mbfl_no_encoding_euc_kr,
|
|
|
|
|
"EUC-KR",
|
|
|
|
|
"EUC-KR",
|
|
|
|
|
(const char *(*)[])&mbfl_encoding_euc_kr_aliases,
|
|
|
|
|
mblen_table_euckr,
|
|
|
|
|
MBFL_ENCTYPE_MBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_uhc_aliases[] = {"CP949", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_uhc = {
|
2002-04-30 12:00:42 +00:00
|
|
|
|
mbfl_no_encoding_uhc,
|
|
|
|
|
"UHC",
|
|
|
|
|
"UHC",
|
|
|
|
|
(const char *(*)[])&mbfl_encoding_uhc_aliases,
|
|
|
|
|
mblen_table_uhc,
|
|
|
|
|
MBFL_ENCTYPE_MBCS
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_2022kr = {
|
2002-05-24 22:28:42 +00:00
|
|
|
|
mbfl_no_encoding_2022kr,
|
|
|
|
|
"ISO-2022-KR",
|
|
|
|
|
"ISO-2022-KR",
|
|
|
|
|
NULL,
|
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_MBCS | MBFL_ENCTYPE_SHFTCODE
|
|
|
|
|
};
|
|
|
|
|
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif /* HAVE_MBSTR_KR */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2001-08-25 09:21:43 +00:00
|
|
|
|
static const char *mbfl_encoding_cp1252_aliases[] = {"cp1252", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_cp1252 = {
|
2001-08-25 09:21:43 +00:00
|
|
|
|
mbfl_no_encoding_cp1252,
|
|
|
|
|
"Windows-1252",
|
|
|
|
|
"Windows-1252",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_cp1252_aliases,
|
2001-08-25 09:21:43 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
2001-05-01 01:52:55 +00:00
|
|
|
|
static const char *mbfl_encoding_8859_1_aliases[] = {"ISO_8859-1", "latin1", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_8859_1 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_1,
|
|
|
|
|
"ISO-8859-1",
|
|
|
|
|
"ISO-8859-1",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_8859_1_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_8859_2_aliases[] = {"ISO_8859-2", "latin2", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_8859_2 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_2,
|
|
|
|
|
"ISO-8859-2",
|
|
|
|
|
"ISO-8859-2",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_8859_2_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_8859_3_aliases[] = {"ISO_8859-3", "latin3", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_8859_3 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_3,
|
|
|
|
|
"ISO-8859-3",
|
|
|
|
|
"ISO-8859-3",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_8859_3_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_8859_4_aliases[] = {"ISO_8859-4", "latin4", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_8859_4 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_4,
|
|
|
|
|
"ISO-8859-4",
|
|
|
|
|
"ISO-8859-4",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_8859_4_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_8859_5_aliases[] = {"ISO_8859-5", "cyrillic", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_8859_5 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_5,
|
|
|
|
|
"ISO-8859-5",
|
|
|
|
|
"ISO-8859-5",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_8859_5_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_8859_6_aliases[] = {"ISO_8859-6", "arabic", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_8859_6 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_6,
|
|
|
|
|
"ISO-8859-6",
|
|
|
|
|
"ISO-8859-6",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_8859_6_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_8859_7_aliases[] = {"ISO_8859-7", "greek", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_8859_7 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_7,
|
|
|
|
|
"ISO-8859-7",
|
|
|
|
|
"ISO-8859-7",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_8859_7_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_8859_8_aliases[] = {"ISO_8859-8", "hebrew", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_8859_8 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_8,
|
|
|
|
|
"ISO-8859-8",
|
|
|
|
|
"ISO-8859-8",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_8859_8_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_8859_9_aliases[] = {"ISO_8859-9", "latin5", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_8859_9 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_9,
|
|
|
|
|
"ISO-8859-9",
|
|
|
|
|
"ISO-8859-9",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_8859_9_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_8859_10_aliases[] = {"ISO_8859-10", "latin6", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_8859_10 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_10,
|
|
|
|
|
"ISO-8859-10",
|
|
|
|
|
"ISO-8859-10",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_8859_10_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_8859_13_aliases[] = {"ISO_8859-13", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_8859_13 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_13,
|
|
|
|
|
"ISO-8859-13",
|
|
|
|
|
"ISO-8859-13",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_8859_13_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_8859_14_aliases[] = {"ISO_8859-14", "latin8", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_8859_14 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_14,
|
|
|
|
|
"ISO-8859-14",
|
|
|
|
|
"ISO-8859-14",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_8859_14_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_8859_15_aliases[] = {"ISO_8859-15", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_8859_15 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_15,
|
|
|
|
|
"ISO-8859-15",
|
|
|
|
|
"ISO-8859-15",
|
2002-03-07 17:28:50 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_8859_15_aliases,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
2002-06-22 08:01:57 +00:00
|
|
|
|
#if defined(HAVE_MBSTR_RU)
|
2002-05-21 07:00:34 +00:00
|
|
|
|
static const char *mbfl_encoding_cp1251_aliases[] = {"CP1251", "CP-1251", "WINDOWS-1251", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_cp1251 = {
|
2002-05-21 07:00:34 +00:00
|
|
|
|
mbfl_no_encoding_cp1251,
|
|
|
|
|
"Windows-1251",
|
|
|
|
|
"Windows-1251",
|
2002-06-01 05:45:25 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_cp1251_aliases,
|
2002-05-21 07:00:34 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_cp866_aliases[] = {"CP866", "CP-866", "IBM-866", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_cp866 = {
|
2002-05-21 07:00:34 +00:00
|
|
|
|
mbfl_no_encoding_cp866,
|
|
|
|
|
"CP866",
|
|
|
|
|
"CP866",
|
2002-06-01 05:45:25 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_cp866_aliases,
|
2002-05-21 07:00:34 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const char *mbfl_encoding_koi8r_aliases[] = {"KOI8-R", "KOI8R", NULL};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding mbfl_encoding_koi8r = {
|
2002-05-21 07:00:34 +00:00
|
|
|
|
mbfl_no_encoding_koi8r,
|
|
|
|
|
"KOI8-R",
|
|
|
|
|
"KOI8-R",
|
2002-06-01 05:45:25 +00:00
|
|
|
|
(const char *(*)[])&mbfl_encoding_koi8r_aliases,
|
2002-05-21 07:00:34 +00:00
|
|
|
|
NULL,
|
|
|
|
|
MBFL_ENCTYPE_SBCS
|
|
|
|
|
};
|
|
|
|
|
#endif
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const mbfl_encoding *mbfl_encoding_ptr_list[] = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
&mbfl_encoding_pass,
|
|
|
|
|
&mbfl_encoding_auto,
|
|
|
|
|
&mbfl_encoding_wchar,
|
|
|
|
|
&mbfl_encoding_byte2be,
|
|
|
|
|
&mbfl_encoding_byte2le,
|
|
|
|
|
&mbfl_encoding_byte4be,
|
|
|
|
|
&mbfl_encoding_byte4le,
|
|
|
|
|
&mbfl_encoding_base64,
|
2001-05-12 23:42:09 +00:00
|
|
|
|
&mbfl_encoding_uuencode,
|
2002-08-04 14:20:11 +00:00
|
|
|
|
&mbfl_encoding_html_ent,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
&mbfl_encoding_qprint,
|
|
|
|
|
&mbfl_encoding_7bit,
|
|
|
|
|
&mbfl_encoding_8bit,
|
|
|
|
|
&mbfl_encoding_ucs4,
|
|
|
|
|
&mbfl_encoding_ucs4be,
|
|
|
|
|
&mbfl_encoding_ucs4le,
|
|
|
|
|
&mbfl_encoding_ucs2,
|
|
|
|
|
&mbfl_encoding_ucs2be,
|
|
|
|
|
&mbfl_encoding_ucs2le,
|
|
|
|
|
&mbfl_encoding_utf32,
|
|
|
|
|
&mbfl_encoding_utf32be,
|
|
|
|
|
&mbfl_encoding_utf32le,
|
|
|
|
|
&mbfl_encoding_utf16,
|
|
|
|
|
&mbfl_encoding_utf16be,
|
|
|
|
|
&mbfl_encoding_utf16le,
|
|
|
|
|
&mbfl_encoding_utf8,
|
|
|
|
|
&mbfl_encoding_utf7,
|
|
|
|
|
&mbfl_encoding_utf7imap,
|
|
|
|
|
&mbfl_encoding_ascii,
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#if defined(HAVE_MBSTR_JA)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
&mbfl_encoding_euc_jp,
|
|
|
|
|
&mbfl_encoding_sjis,
|
|
|
|
|
&mbfl_encoding_eucjp_win,
|
|
|
|
|
&mbfl_encoding_sjis_win,
|
|
|
|
|
&mbfl_encoding_jis,
|
|
|
|
|
&mbfl_encoding_2022jp,
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif
|
2001-08-25 09:21:43 +00:00
|
|
|
|
&mbfl_encoding_cp1252,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
&mbfl_encoding_8859_1,
|
|
|
|
|
&mbfl_encoding_8859_2,
|
|
|
|
|
&mbfl_encoding_8859_3,
|
|
|
|
|
&mbfl_encoding_8859_4,
|
|
|
|
|
&mbfl_encoding_8859_5,
|
|
|
|
|
&mbfl_encoding_8859_6,
|
|
|
|
|
&mbfl_encoding_8859_7,
|
|
|
|
|
&mbfl_encoding_8859_8,
|
|
|
|
|
&mbfl_encoding_8859_9,
|
|
|
|
|
&mbfl_encoding_8859_10,
|
|
|
|
|
&mbfl_encoding_8859_13,
|
|
|
|
|
&mbfl_encoding_8859_14,
|
|
|
|
|
&mbfl_encoding_8859_15,
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#if defined(HAVE_MBSTR_CN)
|
|
|
|
|
&mbfl_encoding_euc_cn,
|
|
|
|
|
&mbfl_encoding_cp936,
|
2002-05-12 13:06:13 +00:00
|
|
|
|
&mbfl_encoding_hz,
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif
|
|
|
|
|
#if defined(HAVE_MBSTR_TW)
|
|
|
|
|
&mbfl_encoding_euc_tw,
|
|
|
|
|
&mbfl_encoding_big5,
|
|
|
|
|
#endif
|
|
|
|
|
#if defined(HAVE_MBSTR_KR)
|
|
|
|
|
&mbfl_encoding_euc_kr,
|
|
|
|
|
&mbfl_encoding_uhc,
|
2002-05-24 22:28:42 +00:00
|
|
|
|
&mbfl_encoding_2022kr,
|
2002-05-21 07:00:34 +00:00
|
|
|
|
#endif
|
|
|
|
|
#if defined(HAVE_MBSTR_RU)
|
|
|
|
|
&mbfl_encoding_cp1251,
|
|
|
|
|
&mbfl_encoding_cp866,
|
|
|
|
|
&mbfl_encoding_koi8r,
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif
|
2001-05-01 01:52:55 +00:00
|
|
|
|
NULL
|
|
|
|
|
};
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
/* hex character table "0123456789ABCDEF" */
|
|
|
|
|
static char mbfl_hexchar_table[] = {
|
|
|
|
|
0x30,0x31,0x32,0x33,0x34,0x35,0x36,0x37,0x38,0x39,0x41,0x42,0x43,0x44,0x45,0x46
|
|
|
|
|
};
|
|
|
|
|
|
2001-05-01 01:52:55 +00:00
|
|
|
|
/* forward */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
static void mbfl_filt_conv_common_ctor(mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_common_flush(mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static void mbfl_filt_conv_common_dtor(mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
|
|
|
|
|
static int mbfl_filt_conv_pass(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_byte2be(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_byte2be_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_byte2le(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_byte2le_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_byte4be(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_byte4be_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_byte4le(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_byte4le_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_any_7bit(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
|
|
|
|
|
static int mbfl_filt_conv_base64enc(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_base64enc_flush(mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_base64dec(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_base64dec_flush(mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_uudec(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
|
2002-08-04 14:20:11 +00:00
|
|
|
|
static void mbfl_filt_conv_html_dec_ctor(mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static void mbfl_filt_conv_html_dec_dtor(mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_html_enc(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_html_enc_flush(mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_html_dec(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_html_dec_flush(mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
static int mbfl_filt_conv_qprintenc(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_qprintenc_flush(mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_qprintdec(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_qprintdec_flush(mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
|
|
|
|
|
static int mbfl_filt_conv_ucs4_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_ucs4be(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_ucs4le(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_ucs2_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_ucs2be(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_ucs2le(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_utf16_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_utf16be_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_utf16be(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_utf16le_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_utf16le(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_utf8_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_utf8(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_utf7_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_utf7(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_utf7_flush(mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_utf7imap_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_utf7imap(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_utf7imap_flush(mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_ascii(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
|
|
|
|
|
static int mbfl_filt_conv_wchar_cp1252(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_cp1252_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_8859_1(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_8859_2_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_8859_2(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_8859_3_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_8859_3(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_8859_4_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_8859_4(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_8859_5_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_8859_5(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_8859_6_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_8859_6(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_8859_7_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_8859_7(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_8859_8_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_8859_8(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_8859_9_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_8859_9(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_8859_10_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_8859_10(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_8859_13_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_8859_13(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_8859_14_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_8859_14(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_8859_15_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_conv_wchar_8859_15(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
|
|
|
|
|
|
|
|
|
static void mbfl_filt_ident_common_ctor(mbfl_identify_filter *filter TSRMLS_DC);
|
|
|
|
|
static void mbfl_filt_ident_common_dtor(mbfl_identify_filter *filter TSRMLS_DC);
|
|
|
|
|
static void mbfl_filt_ident_false_ctor(mbfl_identify_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_ident_utf8(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_ident_utf7(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_ident_ascii(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#if defined(HAVE_MBSTR_JA)
|
2002-04-10 12:47:41 +00:00
|
|
|
|
static int mbfl_filt_ident_eucjp(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_ident_sjis(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_ident_sjiswin(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_ident_jis(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_ident_2022jp(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif /* HAVE_MBSTR_JA */
|
|
|
|
|
|
|
|
|
|
#if defined(HAVE_MBSTR_CN)
|
|
|
|
|
static int mbfl_filt_ident_euccn(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_ident_cp936(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
2002-05-12 13:06:13 +00:00
|
|
|
|
static int mbfl_filt_ident_hz(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif /* HAVE_MBSTR_CN */
|
|
|
|
|
|
|
|
|
|
#if defined(HAVE_MBSTR_TW)
|
|
|
|
|
static int mbfl_filt_ident_euctw(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_ident_big5(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
|
|
|
|
#endif /* HAVE_MBSTR_TW */
|
|
|
|
|
|
|
|
|
|
#if defined(HAVE_MBSTR_KR)
|
|
|
|
|
static int mbfl_filt_ident_euckr(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_ident_uhc(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
2002-05-24 22:28:42 +00:00
|
|
|
|
static int mbfl_filt_ident_2022kr(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif /* HAVE_MBSTR_KR */
|
|
|
|
|
|
2002-05-21 07:00:34 +00:00
|
|
|
|
#if defined(HAVE_MBSTR_RU)
|
|
|
|
|
static int mbfl_filt_ident_cp1251(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_ident_cp866(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_ident_koi8r(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
|
|
|
|
#endif /* HAVE_MBSTR_RU */
|
|
|
|
|
|
2002-04-30 12:00:42 +00:00
|
|
|
|
static int mbfl_filt_ident_cp1252(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
2002-04-10 12:47:41 +00:00
|
|
|
|
static int mbfl_filt_ident_false(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
|
|
|
|
static int mbfl_filt_ident_true(int c, mbfl_identify_filter *filter TSRMLS_DC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
/* convert filter function table */
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_pass = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_pass,
|
|
|
|
|
mbfl_no_encoding_pass,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_pass,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_byte2be_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_byte2be,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_byte2be_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_byte2be = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_byte2be,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_byte2be,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_byte2le_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_byte2le,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_byte2le_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_byte2le = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_byte2le,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_byte2le,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_byte4be_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_byte4be,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_byte4be_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_byte4be = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_byte4be,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_byte4be,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_byte4le_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_byte4le,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_byte4le_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_byte4le = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_byte4le,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_byte4le,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_8bit_b64 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8bit,
|
|
|
|
|
mbfl_no_encoding_base64,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_base64enc,
|
|
|
|
|
mbfl_filt_conv_base64enc_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_b64_8bit = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_base64,
|
|
|
|
|
mbfl_no_encoding_8bit,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_base64dec,
|
|
|
|
|
mbfl_filt_conv_base64dec_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_uuencode_8bit = {
|
2001-05-12 23:42:09 +00:00
|
|
|
|
mbfl_no_encoding_uuencode,
|
|
|
|
|
mbfl_no_encoding_8bit,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_uudec,
|
2002-08-02 10:22:31 +00:00
|
|
|
|
mbfl_filt_conv_common_flush };
|
2001-05-12 23:42:09 +00:00
|
|
|
|
|
2002-08-04 14:20:11 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_html = {
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_html_ent,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_html_enc,
|
|
|
|
|
mbfl_filt_conv_html_enc_flush };
|
|
|
|
|
|
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_html_wchar = {
|
|
|
|
|
mbfl_no_encoding_html_ent,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_html_dec_ctor,
|
|
|
|
|
mbfl_filt_conv_html_dec_dtor,
|
|
|
|
|
mbfl_filt_conv_html_dec,
|
|
|
|
|
mbfl_filt_conv_html_dec_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_8bit_qprint = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8bit,
|
|
|
|
|
mbfl_no_encoding_qprint,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_qprintenc,
|
|
|
|
|
mbfl_filt_conv_qprintenc_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_qprint_8bit = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_qprint,
|
|
|
|
|
mbfl_no_encoding_8bit,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_qprintdec,
|
|
|
|
|
mbfl_filt_conv_qprintdec_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_8bit_7bit = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8bit,
|
|
|
|
|
mbfl_no_encoding_7bit,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_any_7bit,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_7bit_8bit = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_7bit,
|
|
|
|
|
mbfl_no_encoding_8bit,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_pass,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_ucs4_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_ucs4,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_ucs4_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_ucs4 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_ucs4,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_ucs4be,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_ucs4be_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_ucs4be,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_byte4be_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_ucs4be = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_ucs4be,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_ucs4be,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_ucs4le_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_ucs4le,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_byte4le_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_ucs4le = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_ucs4le,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_ucs4le,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_ucs2_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_ucs2,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_ucs2_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_ucs2 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_ucs2,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_ucs2be,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_ucs2be_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_ucs2be,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_byte2be_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_ucs2be = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_ucs2be,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_ucs2be,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_ucs2le_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_ucs2le,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_byte2le_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_ucs2le = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_ucs2le,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_ucs2le,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_utf32_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf32,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_ucs4_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_utf32 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_utf32,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_ucs4be,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_utf32be_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf32be,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_byte4be_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_utf32be = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_utf32be,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_ucs4be,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_utf32le_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf32le,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_byte4le_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_utf32le = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_utf32le,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_ucs4le,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_utf16_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf16,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_utf16_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_utf16 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_utf16,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_utf16be,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_utf16be_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf16be,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_utf16be_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_utf16be = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_utf16be,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_utf16be,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_utf16le_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf16le,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_utf16le_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_utf16le = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_utf16le,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_utf16le,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_utf8_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf8,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_utf8_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_utf8 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_utf8,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_utf8,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_utf7_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf7,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_utf7_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_utf7 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_utf7,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_utf7,
|
|
|
|
|
mbfl_filt_conv_wchar_utf7_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_utf7imap_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf7imap,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_utf7imap_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_utf7imap = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_utf7imap,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_utf7imap,
|
|
|
|
|
mbfl_filt_conv_wchar_utf7imap_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_ascii_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_ascii,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_pass,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_ascii = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_ascii,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_ascii,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#if defined(HAVE_MBSTR_JA)
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_eucjp_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_euc_jp,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_eucjp_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_eucjp = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_euc_jp,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_eucjp,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_sjis_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_sjis,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_sjis_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_sjis = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_sjis,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_sjis,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_jis_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_jis,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_jis_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_jis = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_jis,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_jis,
|
|
|
|
|
mbfl_filt_conv_any_jis_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_2022jp_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_2022jp,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_jis_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_2022jp = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_2022jp,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_2022jp,
|
|
|
|
|
mbfl_filt_conv_any_jis_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_eucjpwin_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_eucjp_win,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_eucjpwin_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_eucjpwin = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_eucjp_win,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_eucjpwin,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_sjiswin_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_sjis_win,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_sjiswin_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_sjiswin = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_sjis_win,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_sjiswin,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif /* HAVE_MBSTR_JA */
|
|
|
|
|
|
|
|
|
|
#if defined(HAVE_MBSTR_CN)
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_euccn_wchar = {
|
2002-04-30 12:00:42 +00:00
|
|
|
|
mbfl_no_encoding_euc_cn,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_euccn_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_euccn = {
|
2002-04-30 12:00:42 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_euc_cn,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_euccn,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_cp936_wchar = {
|
2002-04-30 12:00:42 +00:00
|
|
|
|
mbfl_no_encoding_cp936,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_cp936_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_cp936 = {
|
2002-04-30 12:00:42 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_cp936,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_cp936,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
2002-05-12 13:06:13 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_hz_wchar = {
|
2002-05-12 13:06:13 +00:00
|
|
|
|
mbfl_no_encoding_hz,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_hz_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_hz = {
|
2002-05-12 13:06:13 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_hz,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_hz,
|
|
|
|
|
mbfl_filt_conv_any_hz_flush };
|
|
|
|
|
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif /* HAVE_MBSTR_CN */
|
|
|
|
|
|
|
|
|
|
#if defined(HAVE_MBSTR_TW)
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_euctw_wchar = {
|
2002-04-30 12:00:42 +00:00
|
|
|
|
mbfl_no_encoding_euc_tw,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_euctw_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
|
|
|
|
static struct mbfl_convert_vtbl vtbl_wchar_euctw = {
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_euc_tw,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_euctw,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_big5_wchar = {
|
2002-04-30 12:00:42 +00:00
|
|
|
|
mbfl_no_encoding_big5,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_big5_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_big5 = {
|
2002-04-30 12:00:42 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_big5,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_big5,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
#endif /* HAVE_MBSTR_TW */
|
|
|
|
|
|
|
|
|
|
#if defined(HAVE_MBSTR_KR)
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_euckr_wchar = {
|
2002-04-30 12:00:42 +00:00
|
|
|
|
mbfl_no_encoding_euc_kr,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_euckr_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_euckr = {
|
2002-04-30 12:00:42 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_euc_kr,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_euckr,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_uhc_wchar = {
|
2002-04-30 12:00:42 +00:00
|
|
|
|
mbfl_no_encoding_uhc,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_uhc_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_uhc = {
|
2002-04-30 12:00:42 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_uhc,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_uhc,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
2002-05-24 22:28:42 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_2022kr = {
|
2002-05-24 22:28:42 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_2022kr,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_2022kr,
|
|
|
|
|
mbfl_filt_conv_any_2022kr_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_2022kr_wchar = {
|
2002-05-24 22:28:42 +00:00
|
|
|
|
mbfl_no_encoding_2022kr,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_2022kr_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
2002-05-21 07:00:34 +00:00
|
|
|
|
#endif /* HAVE_MBSTR_KR */
|
2002-05-15 12:13:56 +00:00
|
|
|
|
|
2002-05-21 07:00:34 +00:00
|
|
|
|
#if defined(HAVE_MBSTR_RU)
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_cp1251 = {
|
2002-05-15 12:13:56 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
2002-08-24 09:48:00 +00:00
|
|
|
|
mbfl_no_encoding_cp1251,
|
2002-05-15 12:13:56 +00:00
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
2002-05-21 07:00:34 +00:00
|
|
|
|
mbfl_filt_conv_wchar_cp1251,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
2002-05-15 12:13:56 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_cp1251_wchar = {
|
2002-05-21 07:00:34 +00:00
|
|
|
|
mbfl_no_encoding_cp1251,
|
2002-05-15 12:13:56 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
2002-05-21 07:00:34 +00:00
|
|
|
|
mbfl_filt_conv_cp1251_wchar,
|
2002-05-15 12:13:56 +00:00
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_cp866 = {
|
2002-05-21 07:00:34 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
2002-08-24 09:48:00 +00:00
|
|
|
|
mbfl_no_encoding_cp866,
|
2002-05-21 07:00:34 +00:00
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_cp866,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_cp866_wchar = {
|
2002-05-21 07:00:34 +00:00
|
|
|
|
mbfl_no_encoding_cp866,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_cp866_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_koi8r = {
|
2002-05-21 07:00:34 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_koi8r,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_koi8r,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_koi8r_wchar = {
|
2002-05-21 07:00:34 +00:00
|
|
|
|
mbfl_no_encoding_koi8r,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_koi8r_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
#endif /* HAVE_MBSTR_RU */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_cp1252_wchar = {
|
2001-08-25 09:21:43 +00:00
|
|
|
|
mbfl_no_encoding_cp1252,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_cp1252_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_cp1252 = {
|
2001-08-25 09:21:43 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
2002-05-05 11:42:18 +00:00
|
|
|
|
mbfl_no_encoding_cp1252,
|
2001-08-25 09:21:43 +00:00
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_cp1252,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_8859_1_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_1,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_pass,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_8859_1 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_8859_1,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_8859_1,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_8859_2_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_2,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_8859_2_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_8859_2 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_8859_2,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_8859_2,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_8859_3_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_3,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_8859_3_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_8859_3 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_8859_3,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_8859_3,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_8859_4_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_4,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_8859_4_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_8859_4 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_8859_4,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_8859_4,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_8859_5_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_5,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_8859_5_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_8859_5 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_8859_5,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_8859_5,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_8859_6_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_6,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_8859_6_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_8859_6 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_8859_6,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_8859_6,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_8859_7_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_7,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_8859_7_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_8859_7 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_8859_7,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_8859_7,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_8859_8_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_8,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_8859_8_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_8859_8 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_8859_8,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_8859_8,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_8859_9_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_9,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_8859_9_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_8859_9 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_8859_9,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_8859_9,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_8859_10_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_10,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_8859_10_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_8859_10 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_8859_10,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_8859_10,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_8859_13_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_13,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_8859_13_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_8859_13 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_8859_13,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_8859_13,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_8859_14_wchar = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_14,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_8859_14_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_8859_14 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_8859_14,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_8859_14,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
|
|
|
|
static struct mbfl_convert_vtbl vtbl_8859_15_wchar = {
|
|
|
|
|
mbfl_no_encoding_8859_15,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_8859_15_wchar,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl vtbl_wchar_8859_15 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_no_encoding_8859_15,
|
|
|
|
|
mbfl_filt_conv_common_ctor,
|
|
|
|
|
mbfl_filt_conv_common_dtor,
|
|
|
|
|
mbfl_filt_conv_wchar_8859_15,
|
|
|
|
|
mbfl_filt_conv_common_flush };
|
|
|
|
|
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl *mbfl_convert_filter_list[] = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
&vtbl_utf8_wchar,
|
|
|
|
|
&vtbl_wchar_utf8,
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#if defined(HAVE_MBSTR_JA)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
&vtbl_eucjp_wchar,
|
|
|
|
|
&vtbl_wchar_eucjp,
|
|
|
|
|
&vtbl_sjis_wchar,
|
|
|
|
|
&vtbl_wchar_sjis,
|
|
|
|
|
&vtbl_jis_wchar,
|
|
|
|
|
&vtbl_wchar_jis,
|
|
|
|
|
&vtbl_2022jp_wchar,
|
|
|
|
|
&vtbl_wchar_2022jp,
|
|
|
|
|
&vtbl_eucjpwin_wchar,
|
|
|
|
|
&vtbl_wchar_eucjpwin,
|
|
|
|
|
&vtbl_sjiswin_wchar,
|
|
|
|
|
&vtbl_wchar_sjiswin,
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif
|
|
|
|
|
#if defined(HAVE_MBSTR_CN)
|
|
|
|
|
&vtbl_euccn_wchar,
|
|
|
|
|
&vtbl_wchar_euccn,
|
|
|
|
|
&vtbl_cp936_wchar,
|
|
|
|
|
&vtbl_wchar_cp936,
|
2002-05-12 13:06:13 +00:00
|
|
|
|
&vtbl_hz_wchar,
|
|
|
|
|
&vtbl_wchar_hz,
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif
|
|
|
|
|
#if defined(HAVE_MBSTR_TW)
|
|
|
|
|
&vtbl_euctw_wchar,
|
|
|
|
|
&vtbl_wchar_euctw,
|
|
|
|
|
&vtbl_big5_wchar,
|
|
|
|
|
&vtbl_wchar_big5,
|
|
|
|
|
#endif
|
|
|
|
|
#if defined(HAVE_MBSTR_KR)
|
|
|
|
|
&vtbl_euckr_wchar,
|
|
|
|
|
&vtbl_wchar_euckr,
|
|
|
|
|
&vtbl_uhc_wchar,
|
|
|
|
|
&vtbl_wchar_uhc,
|
2002-05-24 22:28:42 +00:00
|
|
|
|
&vtbl_2022kr_wchar,
|
|
|
|
|
&vtbl_wchar_2022kr,
|
2002-05-21 07:00:34 +00:00
|
|
|
|
#endif
|
|
|
|
|
#if defined(HAVE_MBSTR_RU)
|
|
|
|
|
&vtbl_cp1251_wchar,
|
|
|
|
|
&vtbl_wchar_cp1251,
|
|
|
|
|
&vtbl_cp866_wchar,
|
|
|
|
|
&vtbl_wchar_cp866,
|
|
|
|
|
&vtbl_koi8r_wchar,
|
|
|
|
|
&vtbl_wchar_koi8r,
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif
|
2001-08-25 09:21:43 +00:00
|
|
|
|
&vtbl_cp1252_wchar,
|
|
|
|
|
&vtbl_wchar_cp1252,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
&vtbl_ascii_wchar,
|
|
|
|
|
&vtbl_wchar_ascii,
|
|
|
|
|
&vtbl_8859_1_wchar,
|
|
|
|
|
&vtbl_wchar_8859_1,
|
|
|
|
|
&vtbl_8859_2_wchar,
|
|
|
|
|
&vtbl_wchar_8859_2,
|
|
|
|
|
&vtbl_8859_3_wchar,
|
|
|
|
|
&vtbl_wchar_8859_3,
|
|
|
|
|
&vtbl_8859_4_wchar,
|
|
|
|
|
&vtbl_wchar_8859_4,
|
|
|
|
|
&vtbl_8859_5_wchar,
|
|
|
|
|
&vtbl_wchar_8859_5,
|
|
|
|
|
&vtbl_8859_6_wchar,
|
|
|
|
|
&vtbl_wchar_8859_6,
|
|
|
|
|
&vtbl_8859_7_wchar,
|
|
|
|
|
&vtbl_wchar_8859_7,
|
|
|
|
|
&vtbl_8859_8_wchar,
|
|
|
|
|
&vtbl_wchar_8859_8,
|
|
|
|
|
&vtbl_8859_9_wchar,
|
|
|
|
|
&vtbl_wchar_8859_9,
|
|
|
|
|
&vtbl_8859_10_wchar,
|
|
|
|
|
&vtbl_wchar_8859_10,
|
|
|
|
|
&vtbl_8859_13_wchar,
|
|
|
|
|
&vtbl_wchar_8859_13,
|
|
|
|
|
&vtbl_8859_14_wchar,
|
|
|
|
|
&vtbl_wchar_8859_14,
|
|
|
|
|
&vtbl_8859_15_wchar,
|
|
|
|
|
&vtbl_wchar_8859_15,
|
|
|
|
|
&vtbl_8bit_b64,
|
|
|
|
|
&vtbl_b64_8bit,
|
2001-05-12 23:42:09 +00:00
|
|
|
|
&vtbl_uuencode_8bit,
|
2002-08-04 14:20:11 +00:00
|
|
|
|
&vtbl_wchar_html,
|
|
|
|
|
&vtbl_html_wchar,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
&vtbl_8bit_qprint,
|
|
|
|
|
&vtbl_qprint_8bit,
|
|
|
|
|
&vtbl_8bit_7bit,
|
|
|
|
|
&vtbl_7bit_8bit,
|
|
|
|
|
&vtbl_utf7_wchar,
|
|
|
|
|
&vtbl_wchar_utf7,
|
|
|
|
|
&vtbl_utf7imap_wchar,
|
|
|
|
|
&vtbl_wchar_utf7imap,
|
|
|
|
|
&vtbl_utf16_wchar,
|
|
|
|
|
&vtbl_wchar_utf16,
|
|
|
|
|
&vtbl_utf16be_wchar,
|
|
|
|
|
&vtbl_wchar_utf16be,
|
|
|
|
|
&vtbl_utf16le_wchar,
|
|
|
|
|
&vtbl_wchar_utf16le,
|
|
|
|
|
&vtbl_utf32_wchar,
|
|
|
|
|
&vtbl_wchar_utf32,
|
|
|
|
|
&vtbl_utf32be_wchar,
|
|
|
|
|
&vtbl_wchar_utf32be,
|
|
|
|
|
&vtbl_utf32le_wchar,
|
|
|
|
|
&vtbl_wchar_utf32le,
|
|
|
|
|
&vtbl_ucs4_wchar,
|
|
|
|
|
&vtbl_wchar_ucs4,
|
|
|
|
|
&vtbl_ucs4be_wchar,
|
|
|
|
|
&vtbl_wchar_ucs4be,
|
|
|
|
|
&vtbl_ucs4le_wchar,
|
|
|
|
|
&vtbl_wchar_ucs4le,
|
|
|
|
|
&vtbl_ucs2_wchar,
|
|
|
|
|
&vtbl_wchar_ucs2,
|
|
|
|
|
&vtbl_ucs2be_wchar,
|
|
|
|
|
&vtbl_wchar_ucs2be,
|
|
|
|
|
&vtbl_ucs2le_wchar,
|
|
|
|
|
&vtbl_wchar_ucs2le,
|
|
|
|
|
&vtbl_byte4be_wchar,
|
|
|
|
|
&vtbl_wchar_byte4be,
|
|
|
|
|
&vtbl_byte4le_wchar,
|
|
|
|
|
&vtbl_wchar_byte4le,
|
|
|
|
|
&vtbl_byte2be_wchar,
|
|
|
|
|
&vtbl_wchar_byte2be,
|
|
|
|
|
&vtbl_byte2le_wchar,
|
|
|
|
|
&vtbl_wchar_byte2le,
|
|
|
|
|
&vtbl_pass,
|
|
|
|
|
NULL
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/* identify filter function table */
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_ascii = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_ascii,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_ascii };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_utf8 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf8,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_utf8 };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_utf7 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_utf7,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_utf7 };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#if defined(HAVE_MBSTR_JA)
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_eucjp = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_euc_jp,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_eucjp };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_eucjpwin = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_eucjp_win,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_eucjp };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_sjis = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_sjis,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_sjis };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_sjiswin = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_sjis_win,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_sjiswin };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_jis = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_jis,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_jis };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_2022jp = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_2022jp,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_2022jp };
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif /* HAVE_MBSTR_JA */
|
|
|
|
|
|
|
|
|
|
#if defined(HAVE_MBSTR_CN)
|
|
|
|
|
static struct mbfl_identify_vtbl vtbl_identify_euccn = {
|
|
|
|
|
mbfl_no_encoding_euc_cn,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_euccn };
|
2002-04-30 12:00:42 +00:00
|
|
|
|
|
|
|
|
|
static struct mbfl_identify_vtbl vtbl_identify_cp936 = {
|
|
|
|
|
mbfl_no_encoding_cp936,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_cp936 };
|
2002-05-12 13:06:13 +00:00
|
|
|
|
|
|
|
|
|
static struct mbfl_identify_vtbl vtbl_identify_hz = {
|
|
|
|
|
mbfl_no_encoding_hz,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_hz };
|
2002-05-12 13:06:13 +00:00
|
|
|
|
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif /* HAVE_MBSTR_CN */
|
|
|
|
|
|
|
|
|
|
#if defined(HAVE_MBSTR_TW)
|
|
|
|
|
static struct mbfl_identify_vtbl vtbl_identify_euctw = {
|
|
|
|
|
mbfl_no_encoding_euc_tw,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_euctw };
|
2002-04-30 12:00:42 +00:00
|
|
|
|
|
|
|
|
|
static struct mbfl_identify_vtbl vtbl_identify_big5 = {
|
|
|
|
|
mbfl_no_encoding_big5,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_big5 };
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif /* HAVE_MBSTR_TW */
|
|
|
|
|
|
|
|
|
|
#if defined(HAVE_MBSTR_KR)
|
|
|
|
|
static struct mbfl_identify_vtbl vtbl_identify_euckr = {
|
|
|
|
|
mbfl_no_encoding_euc_kr,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_euckr };
|
2002-04-30 12:00:42 +00:00
|
|
|
|
|
|
|
|
|
static struct mbfl_identify_vtbl vtbl_identify_uhc = {
|
|
|
|
|
mbfl_no_encoding_uhc,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_uhc };
|
2002-05-24 22:28:42 +00:00
|
|
|
|
|
|
|
|
|
static struct mbfl_identify_vtbl vtbl_identify_2022kr = {
|
|
|
|
|
mbfl_no_encoding_2022kr,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_2022kr };
|
2002-05-24 22:28:42 +00:00
|
|
|
|
|
2002-05-21 07:00:34 +00:00
|
|
|
|
#endif /* HAVE_MBSTR_KR */
|
2002-05-15 12:13:56 +00:00
|
|
|
|
|
2002-05-21 07:00:34 +00:00
|
|
|
|
#if defined(HAVE_MBSTR_RU)
|
|
|
|
|
static struct mbfl_identify_vtbl vtbl_identify_cp1251 = {
|
|
|
|
|
mbfl_no_encoding_cp1251,
|
2002-05-15 12:13:56 +00:00
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_cp1251 };
|
2002-05-15 12:13:56 +00:00
|
|
|
|
|
2002-05-21 07:00:34 +00:00
|
|
|
|
static struct mbfl_identify_vtbl vtbl_identify_cp866 = {
|
|
|
|
|
mbfl_no_encoding_cp866,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_cp866 };
|
2002-05-21 07:00:34 +00:00
|
|
|
|
|
|
|
|
|
static struct mbfl_identify_vtbl vtbl_identify_koi8r = {
|
|
|
|
|
mbfl_no_encoding_koi8r,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_koi8r };
|
2002-05-21 07:00:34 +00:00
|
|
|
|
#endif /* HAVE_MBSTR_RU */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_cp1252 = {
|
2001-08-25 09:21:43 +00:00
|
|
|
|
mbfl_no_encoding_cp1252,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_cp1252 };
|
2001-08-25 09:21:43 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_8859_1 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_1,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_true };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_8859_2 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_2,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_true };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_8859_3 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_3,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_true };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_8859_4 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_4,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_true };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_8859_5 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_5,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_true };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_8859_6 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_6,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_true };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_8859_7 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_7,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_true };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_8859_8 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_8,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_true };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_8859_9 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_9,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_true };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_8859_10 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_10,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_true };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_8859_13 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_13,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_true };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_8859_14 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_14,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_true };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_8859_15 = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_8859_15,
|
|
|
|
|
mbfl_filt_ident_common_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_true };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl vtbl_identify_false = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no_encoding_pass,
|
|
|
|
|
mbfl_filt_ident_false_ctor,
|
|
|
|
|
mbfl_filt_ident_common_dtor,
|
2002-08-14 06:38:07 +00:00
|
|
|
|
mbfl_filt_ident_false };
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl *mbfl_identify_filter_list[] = {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
&vtbl_identify_utf8,
|
|
|
|
|
&vtbl_identify_utf7,
|
|
|
|
|
&vtbl_identify_ascii,
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#if defined(HAVE_MBSTR_JA)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
&vtbl_identify_eucjp,
|
|
|
|
|
&vtbl_identify_sjis,
|
|
|
|
|
&vtbl_identify_eucjpwin,
|
|
|
|
|
&vtbl_identify_sjiswin,
|
|
|
|
|
&vtbl_identify_jis,
|
|
|
|
|
&vtbl_identify_2022jp,
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif
|
|
|
|
|
#if defined(HAVE_MBSTR_CN)
|
|
|
|
|
&vtbl_identify_euccn,
|
|
|
|
|
&vtbl_identify_cp936,
|
2002-05-12 13:06:13 +00:00
|
|
|
|
&vtbl_identify_hz,
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif
|
|
|
|
|
#if defined(HAVE_MBSTR_TW)
|
|
|
|
|
&vtbl_identify_euctw,
|
|
|
|
|
&vtbl_identify_big5,
|
|
|
|
|
#endif
|
|
|
|
|
#if defined(HAVE_MBSTR_KR)
|
|
|
|
|
&vtbl_identify_euckr,
|
|
|
|
|
&vtbl_identify_uhc,
|
2002-05-24 22:28:42 +00:00
|
|
|
|
&vtbl_identify_2022kr,
|
2002-05-21 07:00:34 +00:00
|
|
|
|
#endif
|
|
|
|
|
#if defined(HAVE_MBSTR_RU)
|
|
|
|
|
&vtbl_identify_cp1251,
|
|
|
|
|
&vtbl_identify_cp866,
|
|
|
|
|
&vtbl_identify_koi8r,
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif
|
2001-08-25 09:21:43 +00:00
|
|
|
|
&vtbl_identify_cp1252,
|
2001-05-01 01:52:55 +00:00
|
|
|
|
&vtbl_identify_8859_1,
|
|
|
|
|
&vtbl_identify_8859_2,
|
|
|
|
|
&vtbl_identify_8859_3,
|
|
|
|
|
&vtbl_identify_8859_4,
|
|
|
|
|
&vtbl_identify_8859_5,
|
|
|
|
|
&vtbl_identify_8859_6,
|
|
|
|
|
&vtbl_identify_8859_7,
|
|
|
|
|
&vtbl_identify_8859_8,
|
|
|
|
|
&vtbl_identify_8859_9,
|
|
|
|
|
&vtbl_identify_8859_10,
|
|
|
|
|
&vtbl_identify_8859_13,
|
|
|
|
|
&vtbl_identify_8859_14,
|
|
|
|
|
&vtbl_identify_8859_15,
|
|
|
|
|
&vtbl_identify_false,
|
|
|
|
|
NULL
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/* language resolver */
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_language *
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_name2language(const char *name)
|
|
|
|
|
{
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_language *language;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
int i, j;
|
|
|
|
|
|
|
|
|
|
if (name == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
i = 0;
|
|
|
|
|
while ((language = mbfl_language_ptr_table[i++]) != NULL){
|
|
|
|
|
if (strcasecmp(language->name, name) == 0) {
|
|
|
|
|
return language;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2001-05-08 14:33:20 +00:00
|
|
|
|
i = 0;
|
|
|
|
|
while ((language = mbfl_language_ptr_table[i++]) != NULL){
|
|
|
|
|
if (strcasecmp(language->short_name, name) == 0) {
|
|
|
|
|
return language;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2001-05-01 01:52:55 +00:00
|
|
|
|
/* serch aliases */
|
|
|
|
|
i = 0;
|
|
|
|
|
while ((language = mbfl_language_ptr_table[i++]) != NULL) {
|
|
|
|
|
if (language->aliases != NULL) {
|
|
|
|
|
j = 0;
|
|
|
|
|
while ((*language->aliases)[j] != NULL) {
|
|
|
|
|
if (strcasecmp((*language->aliases)[j], name) == 0) {
|
|
|
|
|
return language;
|
|
|
|
|
}
|
|
|
|
|
j++;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_language *
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no2language(enum mbfl_no_language no_language)
|
|
|
|
|
{
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_language *language;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
int i;
|
|
|
|
|
|
|
|
|
|
i = 0;
|
|
|
|
|
while ((language = mbfl_language_ptr_table[i++]) != NULL){
|
|
|
|
|
if (language->no_language == no_language) {
|
|
|
|
|
return language;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
enum mbfl_no_language
|
|
|
|
|
mbfl_name2no_language(const char *name)
|
|
|
|
|
{
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_language *language;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
language = mbfl_name2language(name);
|
|
|
|
|
if (language == NULL) {
|
|
|
|
|
return mbfl_no_language_invalid;
|
|
|
|
|
} else {
|
|
|
|
|
return language->no_language;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2001-05-08 14:33:20 +00:00
|
|
|
|
const char *
|
|
|
|
|
mbfl_no_language2name(enum mbfl_no_language no_language)
|
|
|
|
|
{
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_language *language;
|
2001-05-08 14:33:20 +00:00
|
|
|
|
|
|
|
|
|
language = mbfl_no2language(no_language);
|
|
|
|
|
if (language == NULL) {
|
|
|
|
|
return "";
|
|
|
|
|
} else {
|
|
|
|
|
return language->name;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
/* encoding resolver */
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_encoding *
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_name2encoding(const char *name)
|
|
|
|
|
{
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_encoding *encoding;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
int i, j;
|
|
|
|
|
|
|
|
|
|
if (name == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
i = 0;
|
|
|
|
|
while ((encoding = mbfl_encoding_ptr_list[i++]) != NULL){
|
|
|
|
|
if (strcasecmp(encoding->name, name) == 0) {
|
|
|
|
|
return encoding;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* serch MIME charset name */
|
|
|
|
|
i = 0;
|
|
|
|
|
while ((encoding = mbfl_encoding_ptr_list[i++]) != NULL) {
|
|
|
|
|
if (encoding->mime_name != NULL) {
|
|
|
|
|
if (strcasecmp(encoding->mime_name, name) == 0) {
|
|
|
|
|
return encoding;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* serch aliases */
|
|
|
|
|
i = 0;
|
|
|
|
|
while ((encoding = mbfl_encoding_ptr_list[i++]) != NULL) {
|
|
|
|
|
if (encoding->aliases != NULL) {
|
|
|
|
|
j = 0;
|
|
|
|
|
while ((*encoding->aliases)[j] != NULL) {
|
|
|
|
|
if (strcasecmp((*encoding->aliases)[j], name) == 0) {
|
|
|
|
|
return encoding;
|
|
|
|
|
}
|
|
|
|
|
j++;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_encoding *
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_no2encoding(enum mbfl_no_encoding no_encoding)
|
|
|
|
|
{
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_encoding *encoding;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
int i;
|
|
|
|
|
|
|
|
|
|
i = 0;
|
|
|
|
|
while ((encoding = mbfl_encoding_ptr_list[i++]) != NULL){
|
|
|
|
|
if (encoding->no_encoding == no_encoding) {
|
|
|
|
|
return encoding;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
enum mbfl_no_encoding
|
|
|
|
|
mbfl_name2no_encoding(const char *name)
|
|
|
|
|
{
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_encoding *encoding;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
encoding = mbfl_name2encoding(name);
|
|
|
|
|
if (encoding == NULL) {
|
|
|
|
|
return mbfl_no_encoding_invalid;
|
|
|
|
|
} else {
|
|
|
|
|
return encoding->no_encoding;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
const char *
|
|
|
|
|
mbfl_no_encoding2name(enum mbfl_no_encoding no_encoding)
|
|
|
|
|
{
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_encoding *encoding;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
encoding = mbfl_no2encoding(no_encoding);
|
|
|
|
|
if (encoding == NULL) {
|
|
|
|
|
return "";
|
|
|
|
|
} else {
|
|
|
|
|
return encoding->name;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
const char *
|
|
|
|
|
mbfl_no2preferred_mime_name(enum mbfl_no_encoding no_encoding)
|
|
|
|
|
{
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_encoding *encoding;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
encoding = mbfl_no2encoding(no_encoding);
|
|
|
|
|
if (encoding != NULL && encoding->mime_name != NULL && encoding->mime_name[0] != '\0') {
|
|
|
|
|
return encoding->mime_name;
|
|
|
|
|
} else {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
|
|
|
|
mbfl_is_support_encoding(const char *name)
|
|
|
|
|
{
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_encoding *encoding;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
encoding = mbfl_name2encoding(name);
|
|
|
|
|
if (encoding == NULL) {
|
|
|
|
|
return 0;
|
|
|
|
|
} else {
|
|
|
|
|
return 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* memory device output functions
|
|
|
|
|
*/
|
|
|
|
|
void
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_init(mbfl_memory_device *device, int initsz, int allocsz TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (device) {
|
|
|
|
|
device->length = 0;
|
|
|
|
|
device->buffer = (unsigned char *)0;
|
|
|
|
|
if (initsz > 0) {
|
|
|
|
|
device->buffer = (unsigned char *)mbfl_malloc(initsz*sizeof(unsigned char));
|
|
|
|
|
if (device->buffer != NULL) {
|
|
|
|
|
device->length = initsz;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
device->pos= 0;
|
|
|
|
|
if (allocsz > MBFL_MEMORY_DEVICE_ALLOC_SIZE) {
|
|
|
|
|
device->allocsz = allocsz;
|
|
|
|
|
} else {
|
|
|
|
|
device->allocsz = MBFL_MEMORY_DEVICE_ALLOC_SIZE;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_realloc(mbfl_memory_device *device, int initsz, int allocsz TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
unsigned char *tmp;
|
|
|
|
|
|
|
|
|
|
if (device) {
|
|
|
|
|
if (initsz > device->length) {
|
|
|
|
|
tmp = (unsigned char *)mbfl_realloc((void *)device->buffer, initsz*sizeof(unsigned char));
|
|
|
|
|
if (tmp != NULL) {
|
|
|
|
|
device->buffer = tmp;
|
|
|
|
|
device->length = initsz;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
if (allocsz > MBFL_MEMORY_DEVICE_ALLOC_SIZE) {
|
|
|
|
|
device->allocsz = allocsz;
|
|
|
|
|
} else {
|
|
|
|
|
device->allocsz = MBFL_MEMORY_DEVICE_ALLOC_SIZE;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_clear(mbfl_memory_device *device TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (device) {
|
|
|
|
|
if (device->buffer) {
|
|
|
|
|
mbfl_free(device->buffer);
|
|
|
|
|
}
|
|
|
|
|
device->buffer = (unsigned char *)0;
|
|
|
|
|
device->length = 0;
|
|
|
|
|
device->pos = 0;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_reset(mbfl_memory_device *device TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (device) {
|
|
|
|
|
device->pos = 0;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_unput(mbfl_memory_device *device TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (device->pos > 0) {
|
|
|
|
|
device->pos--;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
mbfl_string *
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_result(mbfl_memory_device *device, mbfl_string *result TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (device && result) {
|
|
|
|
|
result->len = device->pos;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output4('\0', device TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
result->val = device->buffer;
|
|
|
|
|
device->buffer = (unsigned char *)0;
|
|
|
|
|
device->length = 0;
|
|
|
|
|
device->pos= 0;
|
|
|
|
|
if (result->val == NULL) {
|
|
|
|
|
result->len = 0;
|
|
|
|
|
result = NULL;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
result = NULL;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return result;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output(int c, void *data TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
mbfl_memory_device *device = (mbfl_memory_device *)data;
|
|
|
|
|
|
|
|
|
|
if (device->pos >= device->length) {
|
|
|
|
|
/* reallocate buffer */
|
|
|
|
|
int newlen;
|
|
|
|
|
unsigned char *tmp;
|
|
|
|
|
|
|
|
|
|
newlen = device->length + device->allocsz;
|
|
|
|
|
tmp = (unsigned char *)mbfl_realloc((void *)device->buffer, newlen*sizeof(unsigned char));
|
|
|
|
|
if (tmp == NULL) {
|
|
|
|
|
return -1;
|
|
|
|
|
}
|
|
|
|
|
device->length = newlen;
|
|
|
|
|
device->buffer = tmp;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
device->buffer[device->pos++] = (unsigned char)c;
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output2(int c, void *data TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
mbfl_memory_device *device = (mbfl_memory_device *)data;
|
|
|
|
|
|
|
|
|
|
if ((device->pos + 2) >= device->length) {
|
|
|
|
|
/* reallocate buffer */
|
|
|
|
|
int newlen;
|
|
|
|
|
unsigned char *tmp;
|
|
|
|
|
|
|
|
|
|
newlen = device->length + device->allocsz;
|
|
|
|
|
tmp = (unsigned char *)mbfl_realloc((void *)device->buffer, newlen*sizeof(unsigned char));
|
|
|
|
|
if (tmp == NULL) {
|
|
|
|
|
return -1;
|
|
|
|
|
}
|
|
|
|
|
device->length = newlen;
|
|
|
|
|
device->buffer = tmp;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
device->buffer[device->pos++] = (unsigned char)((c >> 8) & 0xff);
|
|
|
|
|
device->buffer[device->pos++] = (unsigned char)(c & 0xff);
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output4(int c, void* data TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
mbfl_memory_device *device = (mbfl_memory_device *)data;
|
|
|
|
|
|
|
|
|
|
if ((device->pos + 4) >= device->length) {
|
|
|
|
|
/* reallocate buffer */
|
|
|
|
|
int newlen;
|
|
|
|
|
unsigned char *tmp;
|
|
|
|
|
|
|
|
|
|
newlen = device->length + device->allocsz;
|
|
|
|
|
tmp = (unsigned char *)mbfl_realloc((void *)device->buffer, newlen*sizeof(unsigned char));
|
|
|
|
|
if (tmp == NULL) {
|
|
|
|
|
return -1;
|
|
|
|
|
}
|
|
|
|
|
device->length = newlen;
|
|
|
|
|
device->buffer = tmp;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
device->buffer[device->pos++] = (unsigned char)((c >> 24) & 0xff);
|
|
|
|
|
device->buffer[device->pos++] = (unsigned char)((c >> 16) & 0xff);
|
|
|
|
|
device->buffer[device->pos++] = (unsigned char)((c >> 8) & 0xff);
|
|
|
|
|
device->buffer[device->pos++] = (unsigned char)(c & 0xff);
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_strcat(mbfl_memory_device *device, const char *psrc TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int len;
|
|
|
|
|
unsigned char *w;
|
|
|
|
|
const unsigned char *p;
|
|
|
|
|
|
|
|
|
|
len = 0;
|
|
|
|
|
p = psrc;
|
|
|
|
|
while (*p) {
|
|
|
|
|
p++;
|
|
|
|
|
len++;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ((device->pos + len) >= device->length) {
|
|
|
|
|
/* reallocate buffer */
|
|
|
|
|
int newlen = device->length + (len + MBFL_MEMORY_DEVICE_ALLOC_SIZE)*sizeof(unsigned char);
|
|
|
|
|
unsigned char *tmp = (unsigned char *)mbfl_realloc((void *)device->buffer, newlen*sizeof(unsigned char));
|
|
|
|
|
if (tmp == NULL) {
|
|
|
|
|
return -1;
|
|
|
|
|
}
|
|
|
|
|
device->length = newlen;
|
|
|
|
|
device->buffer = tmp;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
p = psrc;
|
|
|
|
|
w = &device->buffer[device->pos];
|
|
|
|
|
device->pos += len;
|
|
|
|
|
while (len > 0) {
|
|
|
|
|
*w++ = *p++;
|
|
|
|
|
len--;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return len;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_strncat(mbfl_memory_device *device, const char *psrc, int len TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
unsigned char *w;
|
|
|
|
|
|
|
|
|
|
if ((device->pos + len) >= device->length) {
|
|
|
|
|
/* reallocate buffer */
|
|
|
|
|
int newlen = device->length + len + MBFL_MEMORY_DEVICE_ALLOC_SIZE;
|
|
|
|
|
unsigned char *tmp = (unsigned char *)mbfl_realloc((void *)device->buffer, newlen*sizeof(unsigned char));
|
|
|
|
|
if (tmp == NULL) {
|
|
|
|
|
return -1;
|
|
|
|
|
}
|
|
|
|
|
device->length = newlen;
|
|
|
|
|
device->buffer = tmp;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
w = &device->buffer[device->pos];
|
|
|
|
|
device->pos += len;
|
|
|
|
|
while (len > 0) {
|
|
|
|
|
*w++ = *psrc++;
|
|
|
|
|
len--;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return len;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_devcat(mbfl_memory_device *dest, mbfl_memory_device *src TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
unsigned char *p, *w;
|
|
|
|
|
|
|
|
|
|
if ((dest->pos + src->pos) >= dest->length) {
|
|
|
|
|
/* reallocate buffer */
|
|
|
|
|
int newlen = dest->length + src->pos + MBFL_MEMORY_DEVICE_ALLOC_SIZE;
|
|
|
|
|
unsigned char *tmp = (unsigned char *)mbfl_realloc((void *)dest->buffer, newlen*sizeof(unsigned char));
|
|
|
|
|
if (tmp == NULL) {
|
|
|
|
|
return -1;
|
|
|
|
|
}
|
|
|
|
|
dest->length = newlen;
|
|
|
|
|
dest->buffer = tmp;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
p = src->buffer;
|
|
|
|
|
w = &dest->buffer[dest->pos];
|
|
|
|
|
n = src->pos;
|
|
|
|
|
dest->pos += n;
|
|
|
|
|
while (n > 0) {
|
|
|
|
|
*w++ = *p++;
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return n;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_wchar_device_init(mbfl_wchar_device *device TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (device) {
|
|
|
|
|
device->buffer = (unsigned int *)0;
|
|
|
|
|
device->length = 0;
|
|
|
|
|
device->pos= 0;
|
|
|
|
|
device->allocsz = MBFL_MEMORY_DEVICE_ALLOC_SIZE;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_wchar_device_clear(mbfl_wchar_device *device TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (device) {
|
|
|
|
|
if (device->buffer) {
|
|
|
|
|
mbfl_free(device->buffer);
|
|
|
|
|
}
|
|
|
|
|
device->buffer = (unsigned int*)0;
|
|
|
|
|
device->length = 0;
|
|
|
|
|
device->pos = 0;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_wchar_device_output(int c, void *data TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
mbfl_wchar_device *device = (mbfl_wchar_device *)data;
|
|
|
|
|
|
|
|
|
|
if (device->pos >= device->length) {
|
|
|
|
|
/* reallocate buffer */
|
|
|
|
|
int newlen;
|
|
|
|
|
unsigned int *tmp;
|
|
|
|
|
|
|
|
|
|
newlen = device->length + device->allocsz;
|
|
|
|
|
tmp = (unsigned int *)mbfl_realloc((void *)device->buffer, newlen*sizeof(int));
|
|
|
|
|
if (tmp == NULL) {
|
|
|
|
|
return -1;
|
|
|
|
|
}
|
|
|
|
|
device->length = newlen;
|
|
|
|
|
device->buffer = tmp;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
device->buffer[device->pos++] = c;
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
2001-05-09 11:18:11 +00:00
|
|
|
|
/*
|
|
|
|
|
* string object
|
|
|
|
|
*/
|
2001-05-01 01:52:55 +00:00
|
|
|
|
void
|
|
|
|
|
mbfl_string_init(mbfl_string *string)
|
|
|
|
|
{
|
|
|
|
|
if (string) {
|
|
|
|
|
string->no_language = mbfl_no_language_uni;
|
|
|
|
|
string->no_encoding = mbfl_no_encoding_pass;
|
|
|
|
|
string->val = (unsigned char*)0;
|
|
|
|
|
string->len = 0;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2001-05-09 11:18:11 +00:00
|
|
|
|
void
|
|
|
|
|
mbfl_string_init_set(mbfl_string *string, enum mbfl_no_language no_language, enum mbfl_no_encoding no_encoding)
|
|
|
|
|
{
|
|
|
|
|
if (string) {
|
|
|
|
|
string->no_language = no_language;
|
|
|
|
|
string->no_encoding = no_encoding;
|
|
|
|
|
string->val = (unsigned char*)0;
|
|
|
|
|
string->len = 0;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void
|
|
|
|
|
mbfl_string_clear(mbfl_string *string)
|
|
|
|
|
{
|
|
|
|
|
if (string) {
|
|
|
|
|
if (string->val != (unsigned char*)0) {
|
|
|
|
|
mbfl_free(string->val);
|
|
|
|
|
}
|
|
|
|
|
string->val = (unsigned char*)0;
|
|
|
|
|
string->len = 0;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* encoding filter
|
|
|
|
|
*/
|
|
|
|
|
#define CK(statement) do { if ((statement) < 0) return (-1); } while (0)
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* commonly used constructor and destructor
|
|
|
|
|
*/
|
|
|
|
|
static void
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_common_ctor(mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
filter->cache = 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_common_flush(mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2001-05-04 10:42:54 +00:00
|
|
|
|
filter->status = 0;
|
|
|
|
|
filter->cache = 0;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static void
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_common_dtor(mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2001-05-04 10:42:54 +00:00
|
|
|
|
filter->status = 0;
|
|
|
|
|
filter->cache = 0;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_pass(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2002-04-10 12:47:41 +00:00
|
|
|
|
return (*filter->output_function)(c, filter->data TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_any_7bit(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (c >= 0 && c < 0x80) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_byte2be_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
|
|
|
|
|
if (filter->status == 0) {
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
n = (c & 0xff) << 8;
|
|
|
|
|
filter->cache = n;
|
|
|
|
|
} else {
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
n = (c & 0xff) | filter->cache;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_byte2be(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)((c >> 8) & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(c & 0xff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_byte2le_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
|
|
|
|
|
if (filter->status == 0) {
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
n = c & 0xff;
|
|
|
|
|
filter->cache = n;
|
|
|
|
|
} else {
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
n = ((c & 0xff) << 8) | filter->cache;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_byte2le(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((c >> 8) & 0xff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_byte4be_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
|
|
|
|
|
if (filter->status == 0) {
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
n = (c & 0xff) << 24;
|
|
|
|
|
filter->cache = n;
|
|
|
|
|
} else if (filter->status == 1) {
|
|
|
|
|
filter->status = 2;
|
|
|
|
|
n = (c & 0xff) << 16;
|
|
|
|
|
filter->cache |= n;
|
|
|
|
|
} else if (filter->status == 2) {
|
|
|
|
|
filter->status = 3;
|
|
|
|
|
n = (c & 0xff) << 8;
|
|
|
|
|
filter->cache |= n;
|
|
|
|
|
} else {
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
n = (c & 0xff) | filter->cache;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_byte4be(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)((c >> 24) & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((c >> 16) & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((c >> 8) & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(c & 0xff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_byte4le_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
|
|
|
|
|
if (filter->status == 0) {
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
n = (c & 0xff);
|
|
|
|
|
filter->cache = n;
|
|
|
|
|
} else if (filter->status == 1) {
|
|
|
|
|
filter->status = 2;
|
|
|
|
|
n = (c & 0xff) << 8;
|
|
|
|
|
filter->cache |= n;
|
|
|
|
|
} else if (filter->status == 2) {
|
|
|
|
|
filter->status = 3;
|
|
|
|
|
n = (c & 0xff) << 16;
|
|
|
|
|
filter->cache |= n;
|
|
|
|
|
} else {
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
n = ((c & 0xff) << 24) | filter->cache;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_byte4le(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((c >> 8) & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((c >> 16) & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((c >> 24) & 0xff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
2001-05-12 23:42:09 +00:00
|
|
|
|
/* uuencode => any */
|
|
|
|
|
#define UUDEC(c) (char)(((c)-' ')&077)
|
2001-05-13 12:04:37 +00:00
|
|
|
|
static const char * uuenc_begin_text = "begin ";
|
2001-05-12 23:42:09 +00:00
|
|
|
|
enum { uudec_state_ground=0, uudec_state_inbegin,
|
|
|
|
|
uudec_state_until_newline,
|
|
|
|
|
uudec_state_size, uudec_state_a, uudec_state_b, uudec_state_c, uudec_state_d,
|
|
|
|
|
uudec_state_skip_newline};
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_uudec(int c, mbfl_convert_filter * filter TSRMLS_DC)
|
2001-05-12 23:42:09 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
|
|
|
|
|
switch(filter->status) {
|
|
|
|
|
case uudec_state_ground:
|
|
|
|
|
/* looking for "begin 0666 filename\n" line */
|
|
|
|
|
if (filter->cache == 0 && c == 'b')
|
|
|
|
|
{
|
|
|
|
|
filter->status = uudec_state_inbegin;
|
|
|
|
|
filter->cache = 1; /* move to 'e' */
|
|
|
|
|
}
|
|
|
|
|
else if (c == '\n')
|
|
|
|
|
filter->cache = 0;
|
|
|
|
|
else
|
|
|
|
|
filter->cache++;
|
|
|
|
|
break;
|
|
|
|
|
case uudec_state_inbegin:
|
|
|
|
|
if (uuenc_begin_text[filter->cache++] != c) {
|
|
|
|
|
/* doesn't match pattern */
|
|
|
|
|
filter->status = uudec_state_ground;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
if (filter->cache == 5)
|
|
|
|
|
{
|
|
|
|
|
/* thats good enough - wait for a newline */
|
|
|
|
|
filter->status = uudec_state_until_newline;
|
|
|
|
|
filter->cache = 0;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
case uudec_state_until_newline:
|
|
|
|
|
if (c == '\n')
|
|
|
|
|
filter->status = uudec_state_size;
|
|
|
|
|
break;
|
|
|
|
|
case uudec_state_size:
|
|
|
|
|
/* get "size" byte */
|
|
|
|
|
n = UUDEC(c);
|
|
|
|
|
filter->cache = n << 24;
|
|
|
|
|
filter->status = uudec_state_a;
|
|
|
|
|
break;
|
|
|
|
|
case uudec_state_a:
|
|
|
|
|
/* get "a" byte */
|
|
|
|
|
n = UUDEC(c);
|
|
|
|
|
filter->cache |= (n << 16);
|
|
|
|
|
filter->status = uudec_state_b;
|
|
|
|
|
break;
|
|
|
|
|
case uudec_state_b:
|
|
|
|
|
/* get "b" byte */
|
|
|
|
|
n = UUDEC(c);
|
|
|
|
|
filter->cache |= (n << 8);
|
|
|
|
|
filter->status = uudec_state_c;
|
|
|
|
|
break;
|
|
|
|
|
case uudec_state_c:
|
|
|
|
|
/* get "c" byte */
|
|
|
|
|
n = UUDEC(c);
|
|
|
|
|
filter->cache |= n;
|
|
|
|
|
filter->status = uudec_state_d;
|
|
|
|
|
break;
|
|
|
|
|
case uudec_state_d:
|
|
|
|
|
/* get "d" byte */
|
|
|
|
|
{
|
|
|
|
|
int A, B, C, D = UUDEC(c);
|
|
|
|
|
A = (filter->cache >> 16) & 0xff;
|
|
|
|
|
B = (filter->cache >> 8) & 0xff;
|
|
|
|
|
C = (filter->cache) & 0xff;
|
|
|
|
|
n = (filter->cache >> 24) & 0xff;
|
|
|
|
|
if (n-- > 0)
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)( (A << 2) | (B >> 4), filter->data TSRMLS_CC));
|
2001-05-12 23:42:09 +00:00
|
|
|
|
if (n-- > 0)
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)( (B << 4) | (C >> 2), filter->data TSRMLS_CC));
|
2001-05-12 23:42:09 +00:00
|
|
|
|
if (n-- > 0)
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)( (C << 6) | D, filter->data TSRMLS_CC));
|
2001-05-12 23:42:09 +00:00
|
|
|
|
filter->cache = n << 24;
|
|
|
|
|
|
|
|
|
|
if (n == 0)
|
|
|
|
|
filter->status = uudec_state_skip_newline; /* skip next byte (newline) */
|
|
|
|
|
else
|
|
|
|
|
filter->status = uudec_state_a; /* go back to fetch "A" byte */
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
case uudec_state_skip_newline:
|
|
|
|
|
/* skip newline */
|
2001-08-28 21:50:29 +00:00
|
|
|
|
filter->status = uudec_state_size;
|
2001-05-12 23:42:09 +00:00
|
|
|
|
}
|
|
|
|
|
return c;
|
|
|
|
|
}
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* any => BASE64
|
|
|
|
|
*/
|
|
|
|
|
static const unsigned char mbfl_base64_table[] =
|
|
|
|
|
{
|
|
|
|
|
/* 'A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I', 'J', 'K', 'L', 'M', */
|
|
|
|
|
0x41,0x42,0x43,0x44,0x45,0x46,0x47,0x48,0x49,0x4a,0x4b,0x4c,0x4d,
|
|
|
|
|
/* 'N', 'O', 'P', 'Q', 'R', 'S', 'T', 'U', 'V', 'W', 'X', 'Y', 'Z', */
|
|
|
|
|
0x4e,0x4f,0x50,0x51,0x52,0x53,0x54,0x55,0x56,0x57,0x58,0x59,0x5a,
|
|
|
|
|
/* 'a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i', 'j', 'k', 'l', 'm', */
|
|
|
|
|
0x61,0x62,0x63,0x64,0x65,0x66,0x67,0x68,0x69,0x6a,0x6b,0x6c,0x6d,
|
|
|
|
|
/* 'n', 'o', 'p', 'q', 'r', 's', 't', 'u', 'v', 'w', 'x', 'y', 'z', */
|
|
|
|
|
0x6e,0x6f,0x70,0x71,0x72,0x73,0x74,0x75,0x76,0x77,0x78,0x79,0x7a,
|
|
|
|
|
/* '0', '1', '2', '3', '4', '5', '6', '7', '8', '9', '+', '/', '\0' */
|
|
|
|
|
0x30,0x31,0x32,0x33,0x34,0x35,0x36,0x37,0x38,0x39,0x2b,0x2f,0x00
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
#define MBFL_BASE64_STS_MIME_HEADER 0x1000000
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_base64enc(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
|
|
|
|
|
n = (filter->status & 0xff);
|
|
|
|
|
if (n == 0) {
|
|
|
|
|
filter->status++;
|
|
|
|
|
filter->cache = (c & 0xff) << 16;
|
|
|
|
|
} else if (n == 1) {
|
|
|
|
|
filter->status++;
|
|
|
|
|
filter->cache |= (c & 0xff) << 8;
|
|
|
|
|
} else {
|
|
|
|
|
filter->status &= ~0xff;
|
|
|
|
|
if ((filter->status & MBFL_BASE64_STS_MIME_HEADER) == 0) {
|
|
|
|
|
n = (filter->status & 0xff00) >> 8;
|
|
|
|
|
if (n > 72) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x0d, filter->data TSRMLS_CC)); /* CR */
|
|
|
|
|
CK((*filter->output_function)(0x0a, filter->data TSRMLS_CC)); /* LF */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
filter->status &= ~0xff00;
|
|
|
|
|
}
|
|
|
|
|
filter->status += 0x400;
|
|
|
|
|
}
|
|
|
|
|
n = filter->cache | (c & 0xff);
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(n >> 18) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(n >> 12) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(n >> 6) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[n & 0x3f], filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_base64enc_flush(mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int status, cache, len;
|
|
|
|
|
|
|
|
|
|
status = filter->status & 0xff;
|
|
|
|
|
cache = filter->cache;
|
|
|
|
|
len = (filter->status & 0xff00) >> 8;
|
|
|
|
|
filter->status &= ~0xffff;
|
|
|
|
|
filter->cache = 0;
|
|
|
|
|
/* flush fragments */
|
|
|
|
|
if (status >= 1) {
|
|
|
|
|
if ((filter->status & MBFL_BASE64_STS_MIME_HEADER) == 0) {
|
|
|
|
|
if (len > 72){
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x0d, filter->data TSRMLS_CC)); /* CR */
|
|
|
|
|
CK((*filter->output_function)(0x0a, filter->data TSRMLS_CC)); /* LF */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(cache >> 18) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(cache >> 12) & 0x3f], filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (status == 1) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x3d, filter->data TSRMLS_CC)); /* '=' */
|
|
|
|
|
CK((*filter->output_function)(0x3d, filter->data TSRMLS_CC)); /* '=' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(cache >> 6) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(0x3d, filter->data TSRMLS_CC)); /* '=' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* BASE64 => any
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_base64dec(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
|
|
|
|
|
if (c == 0x0d || c == 0x0a || c == 0x20 || c == 0x09 || c == 0x3d) { /* CR or LF or SPACE or HTAB or '=' */
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
n = 0;
|
|
|
|
|
if (c >= 0x41 && c <= 0x5a) { /* A - Z */
|
|
|
|
|
n = c - 65;
|
|
|
|
|
} else if (c >= 0x61 && c <= 0x7a) { /* a - z */
|
|
|
|
|
n = c - 71;
|
|
|
|
|
} else if (c >= 0x30 && c <= 0x39) { /* 0 - 9 */
|
|
|
|
|
n = c + 4;
|
|
|
|
|
} else if (c == 0x2b) { /* '+' */
|
|
|
|
|
n = 62;
|
|
|
|
|
} else if (c == 0x2f) { /* '/' */
|
|
|
|
|
n = 63;
|
|
|
|
|
}
|
|
|
|
|
n &= 0x3f;
|
|
|
|
|
|
|
|
|
|
switch (filter->status) {
|
|
|
|
|
case 0:
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
filter->cache = n << 18;
|
|
|
|
|
break;
|
|
|
|
|
case 1:
|
|
|
|
|
filter->status = 2;
|
|
|
|
|
filter->cache |= n << 12;
|
|
|
|
|
break;
|
|
|
|
|
case 2:
|
|
|
|
|
filter->status = 3;
|
|
|
|
|
filter->cache |= n << 6;
|
|
|
|
|
break;
|
|
|
|
|
default:
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
n |= filter->cache;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)((n >> 16) & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((n >> 8) & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(n & 0xff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_base64dec_flush(mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int status, cache;
|
|
|
|
|
|
|
|
|
|
status = filter->status;
|
|
|
|
|
cache = filter->cache;
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
filter->cache = 0;
|
|
|
|
|
/* flush fragments */
|
|
|
|
|
if (status >= 2) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)((cache >> 16) & 0xff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (status >= 3) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)((cache >> 8) & 0xff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
|
2002-08-04 14:20:11 +00:00
|
|
|
|
/*
|
|
|
|
|
* any => HTML
|
|
|
|
|
*/
|
|
|
|
|
static int
|
|
|
|
|
mbfl_filt_conv_html_enc(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
|
|
|
|
{
|
|
|
|
|
int tmp[10];
|
|
|
|
|
int i = 0, p = 0, e;
|
2002-10-07 16:11:30 +00:00
|
|
|
|
unsigned int uc;
|
2002-08-04 14:20:11 +00:00
|
|
|
|
|
|
|
|
|
if (c<256 && mblen_table_html[c]==1) {
|
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
|
|
|
|
} else {
|
2002-08-27 15:32:04 +00:00
|
|
|
|
/*php_error_docref("ref.mbstring" TSRMLS_CC, E_NOTICE, "mbfl_filt_conv_html_enc(0x%08X = %d)", c, c);*/
|
2002-08-04 14:20:11 +00:00
|
|
|
|
CK((*filter->output_function)('&', filter->data TSRMLS_CC));
|
|
|
|
|
while (1) {
|
|
|
|
|
e = mbfl_html_entity_list[i].code;
|
|
|
|
|
if (c < e || e == -1) {
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
if (c == e) {
|
|
|
|
|
while(mbfl_html_entity_list[i].name[p]) {
|
|
|
|
|
CK((*filter->output_function)((int)mbfl_html_entity_list[i].name[p++], filter->data TSRMLS_CC));
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
i++;
|
|
|
|
|
}
|
2002-10-07 16:11:30 +00:00
|
|
|
|
i=0;
|
2002-08-04 14:20:11 +00:00
|
|
|
|
if (!p) {
|
|
|
|
|
CK((*filter->output_function)('#', filter->data TSRMLS_CC));
|
2002-10-07 16:11:30 +00:00
|
|
|
|
uc = (unsigned int)c;
|
2002-08-04 14:20:11 +00:00
|
|
|
|
do {
|
2002-10-07 16:11:30 +00:00
|
|
|
|
tmp[i++] = '0'+uc%10;
|
|
|
|
|
uc /= 10;
|
|
|
|
|
} while (uc);
|
2002-08-04 14:20:11 +00:00
|
|
|
|
do {
|
|
|
|
|
CK((*filter->output_function)(tmp[--i], filter->data TSRMLS_CC));
|
2002-10-07 16:11:30 +00:00
|
|
|
|
} while (i);
|
2002-08-04 14:20:11 +00:00
|
|
|
|
}
|
|
|
|
|
CK((*filter->output_function)(';', filter->data TSRMLS_CC));
|
|
|
|
|
}
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
|
|
|
|
mbfl_filt_conv_html_enc_flush(mbfl_convert_filter *filter TSRMLS_DC)
|
|
|
|
|
{
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
filter->cache = 0;
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* HTML => any
|
|
|
|
|
*/
|
|
|
|
|
#define html_enc_buffer_size 16
|
|
|
|
|
static const char html_entity_chars[] = "#0123456789abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ";
|
|
|
|
|
|
|
|
|
|
static void
|
|
|
|
|
mbfl_filt_conv_html_dec_ctor(mbfl_convert_filter *filter TSRMLS_DC)
|
|
|
|
|
{
|
|
|
|
|
filter->status = 0;
|
2002-10-07 16:05:28 +00:00
|
|
|
|
filter->cache = (int)mbfl_malloc(html_enc_buffer_size+1);
|
2002-08-04 14:20:11 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static void
|
|
|
|
|
mbfl_filt_conv_html_dec_dtor(mbfl_convert_filter *filter TSRMLS_DC)
|
|
|
|
|
{
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
if (filter->cache)
|
|
|
|
|
{
|
|
|
|
|
mbfl_free((void*)filter->cache);
|
|
|
|
|
}
|
|
|
|
|
filter->cache = 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
|
|
|
|
mbfl_filt_conv_html_dec(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
|
|
|
|
{
|
|
|
|
|
int pos, ent = 0;
|
|
|
|
|
const mbfl_html_entity *entity;
|
|
|
|
|
char *buffer = (char*)filter->cache;
|
|
|
|
|
|
|
|
|
|
if (!filter->status)
|
|
|
|
|
{
|
|
|
|
|
if (c == '&' )
|
|
|
|
|
{
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
buffer[0] = '&';
|
|
|
|
|
}
|
|
|
|
|
else
|
|
|
|
|
{
|
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
else
|
|
|
|
|
{
|
|
|
|
|
if (c == ';')
|
|
|
|
|
{
|
|
|
|
|
buffer[filter->status] = 0;
|
|
|
|
|
if (buffer[1]=='#')
|
|
|
|
|
{
|
|
|
|
|
/* numeric entity */
|
|
|
|
|
for (pos=2; pos<filter->status; pos++)
|
|
|
|
|
ent = ent*10 + (buffer[pos] - '0');
|
|
|
|
|
CK((*filter->output_function)(ent, filter->data TSRMLS_CC));
|
|
|
|
|
filter->status = 0;
|
2002-08-27 15:32:04 +00:00
|
|
|
|
/*php_error_docref("ref.mbstring" TSRMLS_CC, E_NOTICE, "mbstring decoded '%s'=%d", buffer, ent);*/
|
2002-08-04 14:20:11 +00:00
|
|
|
|
}
|
|
|
|
|
else
|
|
|
|
|
{
|
|
|
|
|
/* named entity */
|
|
|
|
|
entity = mbfl_html_entity_list;
|
|
|
|
|
while (entity->name)
|
|
|
|
|
{
|
|
|
|
|
if (!strcmp(buffer+1, entity->name))
|
|
|
|
|
{
|
|
|
|
|
ent = entity->code;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
entity++;
|
|
|
|
|
}
|
|
|
|
|
if (ent)
|
|
|
|
|
{
|
|
|
|
|
/* decoded */
|
|
|
|
|
CK((*filter->output_function)(ent, filter->data TSRMLS_CC));
|
|
|
|
|
filter->status = 0;
|
2002-08-27 15:32:04 +00:00
|
|
|
|
/*php_error_docref("ref.mbstring" TSRMLS_CC, E_NOTICE,"mbstring decoded '%s'=%d", buffer, ent);*/
|
2002-08-04 14:20:11 +00:00
|
|
|
|
}
|
|
|
|
|
else
|
|
|
|
|
{
|
|
|
|
|
/* failure */
|
|
|
|
|
buffer[filter->status++] = ';';
|
|
|
|
|
buffer[filter->status] = 0;
|
2002-08-27 15:32:04 +00:00
|
|
|
|
php_error_docref("ref.mbstring" TSRMLS_CC, E_WARNING, "mbstring cannot decode '%s'", buffer);
|
2002-08-04 14:20:11 +00:00
|
|
|
|
mbfl_filt_conv_html_dec_flush(filter TSRMLS_CC);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
else
|
|
|
|
|
{
|
|
|
|
|
/* add character */
|
|
|
|
|
buffer[filter->status++] = c;
|
|
|
|
|
/* add character and check */
|
|
|
|
|
if (!strchr(html_entity_chars, c) || filter->status+1==html_enc_buffer_size || (c=='#' && filter->status>2))
|
|
|
|
|
{
|
|
|
|
|
/* illegal character or end of buffer */
|
|
|
|
|
if (c=='&')
|
|
|
|
|
filter->status--;
|
|
|
|
|
buffer[filter->status] = 0;
|
2002-08-27 15:32:04 +00:00
|
|
|
|
php_error_docref("ref.mbstring" TSRMLS_CC, E_WARNING, "mbstring cannot decode '%s'", buffer);
|
2002-08-04 14:20:11 +00:00
|
|
|
|
mbfl_filt_conv_html_dec_flush(filter TSRMLS_CC);
|
|
|
|
|
if (c=='&')
|
|
|
|
|
{
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
buffer[0] = '&';
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
|
|
|
|
mbfl_filt_conv_html_dec_flush(mbfl_convert_filter *filter TSRMLS_DC)
|
|
|
|
|
{
|
|
|
|
|
int status, pos = 0;
|
|
|
|
|
char *buffer;
|
|
|
|
|
|
|
|
|
|
buffer = (char*)filter->cache;
|
|
|
|
|
status = filter->status;
|
|
|
|
|
/* flush fragments */
|
|
|
|
|
while (status--)
|
|
|
|
|
{
|
|
|
|
|
CK((*filter->output_function)(buffer[pos++], filter->data TSRMLS_CC));
|
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
/*filter->buffer = 0; of cause NOT*/
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
|
2001-05-01 01:52:55 +00:00
|
|
|
|
/*
|
|
|
|
|
* any => Quoted-Printable
|
|
|
|
|
*/
|
|
|
|
|
#define MBFL_QPRINT_STS_MIME_HEADER 0x1000000
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_qprintenc(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s, n;
|
|
|
|
|
|
|
|
|
|
switch (filter->status & 0xff) {
|
|
|
|
|
case 0:
|
|
|
|
|
filter->cache = c;
|
|
|
|
|
filter->status++;
|
|
|
|
|
break;
|
|
|
|
|
default:
|
|
|
|
|
s = filter->cache;
|
|
|
|
|
filter->cache = c;
|
|
|
|
|
n = (filter->status & 0xff00) >> 8;
|
|
|
|
|
|
|
|
|
|
if (s == 0) { /* null */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
filter->status &= ~0xff00;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ((filter->status & MBFL_QPRINT_STS_MIME_HEADER) == 0) {
|
|
|
|
|
if (s == 0x0a || (s == 0x0d && c != 0x0a)) { /* line feed */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x0d, filter->data TSRMLS_CC)); /* CR */
|
|
|
|
|
CK((*filter->output_function)(0x0a, filter->data TSRMLS_CC)); /* LF */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
filter->status &= ~0xff00;
|
|
|
|
|
break;
|
|
|
|
|
} else if (s == 0x0d) {
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ((filter->status & MBFL_QPRINT_STS_MIME_HEADER) == 0 && n >= 72) { /* soft line feed */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x3d, filter->data TSRMLS_CC)); /* '=' */
|
|
|
|
|
CK((*filter->output_function)(0x0d, filter->data TSRMLS_CC)); /* CR */
|
|
|
|
|
CK((*filter->output_function)(0x0a, filter->data TSRMLS_CC)); /* LF */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
filter->status &= ~0xff00;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (s <= 0 || s >= 0x80 || s == 0x3d /* not ASCII or '=' */
|
|
|
|
|
|| ((filter->status & MBFL_QPRINT_STS_MIME_HEADER) != 0 &&
|
|
|
|
|
(mbfl_charprop_table[s] & MBFL_CHP_MMHQENC) != 0)) {
|
|
|
|
|
/* hex-octet */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x3d, filter->data TSRMLS_CC)); /* '=' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
n = (s >> 4) & 0xf;
|
|
|
|
|
if (n < 10) {
|
|
|
|
|
n += 48; /* '0' */
|
|
|
|
|
} else {
|
|
|
|
|
n += 55; /* 'A' - 10 */
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
n = s & 0xf;
|
|
|
|
|
if (n < 10) {
|
|
|
|
|
n += 48;
|
|
|
|
|
} else {
|
|
|
|
|
n += 55;
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if ((filter->status & MBFL_QPRINT_STS_MIME_HEADER) == 0) {
|
|
|
|
|
filter->status += 0x300;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if ((filter->status & MBFL_QPRINT_STS_MIME_HEADER) == 0) {
|
|
|
|
|
filter->status += 0x100;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_qprintenc_flush(mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
/* flush filter cache */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*filter->filter_function)('\0', filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
filter->status &= ~0xffff;
|
|
|
|
|
filter->cache = 0;
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* Quoted-Printable => any
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_qprintdec(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
|
|
|
|
|
switch (filter->status) {
|
|
|
|
|
case 1:
|
|
|
|
|
if ((c >= 0x30 && c <= 0x39) || (c >= 0x41 && c <= 0x46)) { /* 0 - 9 or A - F */
|
|
|
|
|
filter->cache = c;
|
|
|
|
|
filter->status = 2;
|
|
|
|
|
} else if (c == 0x0d) { /* soft line feed */
|
|
|
|
|
filter->status = 3;
|
|
|
|
|
} else if (c == 0x0a) { /* soft line feed */
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x3d, filter->data TSRMLS_CC)); /* '=' */
|
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
filter->status = 0;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
case 2:
|
|
|
|
|
n = filter->cache;
|
|
|
|
|
if (n >= 0x30 && n <= 0x39) { /* '0' - '9' */
|
|
|
|
|
n -= 48; /* 48 = '0' */
|
|
|
|
|
} else {
|
|
|
|
|
n -= 55; /* 55 = 'A' - 10 */
|
|
|
|
|
}
|
|
|
|
|
n <<= 4;
|
|
|
|
|
if (c >= 0x30 && c <= 0x39) { /* '0' - '9' */
|
|
|
|
|
n += (c - 48);
|
|
|
|
|
} else if (c >= 0x41 && c <= 0x46) { /* 'A' - 'F' */
|
|
|
|
|
n += (c - 55);
|
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x3d, filter->data TSRMLS_CC)); /* '=' */
|
|
|
|
|
CK((*filter->output_function)(filter->cache, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
n = c;
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
case 3:
|
|
|
|
|
if (c != 0x0a) { /* LF */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
default:
|
|
|
|
|
if (c == 0x3d) { /* '=' */
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_qprintdec_flush(mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int status, cache;
|
|
|
|
|
|
|
|
|
|
status = filter->status;
|
|
|
|
|
cache = filter->cache;
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
filter->cache = 0;
|
|
|
|
|
/* flush fragments */
|
|
|
|
|
if (status == 1) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x3d, filter->data TSRMLS_CC)); /* '=' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else if (status == 2) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x3d, filter->data TSRMLS_CC)); /* '=' */
|
|
|
|
|
CK((*filter->output_function)(cache, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* UCS-4 => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_ucs4_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n, endian;
|
|
|
|
|
|
|
|
|
|
endian = filter->status & 0xff00;
|
|
|
|
|
switch (filter->status & 0xff) {
|
|
|
|
|
case 0:
|
|
|
|
|
if (endian) {
|
|
|
|
|
n = c & 0xff;
|
|
|
|
|
} else {
|
|
|
|
|
n = (c & 0xff) << 24;
|
|
|
|
|
}
|
|
|
|
|
filter->cache = n;
|
|
|
|
|
filter->status++;
|
|
|
|
|
break;
|
|
|
|
|
case 1:
|
|
|
|
|
if (endian) {
|
|
|
|
|
n = (c & 0xff) << 8;
|
|
|
|
|
} else {
|
|
|
|
|
n = (c & 0xff) << 16;
|
|
|
|
|
}
|
|
|
|
|
filter->cache |= n;
|
|
|
|
|
filter->status++;
|
|
|
|
|
break;
|
|
|
|
|
case 2:
|
|
|
|
|
if (endian) {
|
|
|
|
|
n = (c & 0xff) << 16;
|
|
|
|
|
} else {
|
|
|
|
|
n = (c & 0xff) << 8;
|
|
|
|
|
}
|
|
|
|
|
filter->cache |= n;
|
|
|
|
|
filter->status++;
|
|
|
|
|
break;
|
|
|
|
|
default:
|
|
|
|
|
if (endian) {
|
|
|
|
|
n = (c & 0xff) << 24;
|
|
|
|
|
} else {
|
|
|
|
|
n = c & 0xff;
|
|
|
|
|
}
|
|
|
|
|
n |= filter->cache;
|
|
|
|
|
if ((n & 0xffff) == 0 && ((n >> 16) & 0xffff) == 0xfffe) {
|
|
|
|
|
if (endian) {
|
|
|
|
|
filter->status = 0; /* big-endian */
|
|
|
|
|
} else {
|
|
|
|
|
filter->status = 0x100; /* little-endian */
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0xfeff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
filter->status &= ~0xff;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => UCS-4BE
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_ucs4be(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (c >= 0 && c < MBFL_WCSGROUP_UCS4MAX) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)((c >> 24) & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((c >> 16) & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((c >> 8) & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(c & 0xff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => UCS-4LE
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_ucs4le(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (c >= 0 && c < MBFL_WCSGROUP_UCS4MAX) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((c >> 8) & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((c >> 16) & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((c >> 24) & 0xff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* UCS-2 => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_ucs2_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n, endian;
|
|
|
|
|
|
|
|
|
|
endian = filter->status & 0xff00;
|
|
|
|
|
switch (filter->status & 0xff) {
|
|
|
|
|
case 0:
|
|
|
|
|
if (endian) {
|
|
|
|
|
n = c & 0xff;
|
|
|
|
|
} else {
|
|
|
|
|
n = (c & 0xff) << 8;
|
|
|
|
|
}
|
|
|
|
|
filter->cache = n;
|
|
|
|
|
filter->status++;
|
|
|
|
|
break;
|
|
|
|
|
default:
|
|
|
|
|
if (endian) {
|
|
|
|
|
n = (c & 0xff) << 8;
|
|
|
|
|
} else {
|
|
|
|
|
n = c & 0xff;
|
|
|
|
|
}
|
|
|
|
|
n |= filter->cache;
|
|
|
|
|
if (n == 0xfffe) {
|
|
|
|
|
if (endian) {
|
|
|
|
|
filter->status = 0; /* big-endian */
|
|
|
|
|
} else {
|
|
|
|
|
filter->status = 0x100; /* little-endian */
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0xfeff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
filter->status &= ~0xff;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => UCS-2BE
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_ucs2be(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (c >= 0 && c < MBFL_WCSPLANE_UCS2MAX) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)((c >> 8) & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(c & 0xff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => UCS-2LE
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_ucs2le(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (c >= 0 && c < MBFL_WCSPLANE_UCS2MAX) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((c >> 8) & 0xff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* UTF-16 => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_utf16_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n, endian;
|
|
|
|
|
|
|
|
|
|
endian = filter->status & 0xff00;
|
|
|
|
|
switch (filter->status & 0xff) {
|
|
|
|
|
case 0:
|
|
|
|
|
if (endian) {
|
|
|
|
|
n = c & 0xff;
|
|
|
|
|
} else {
|
|
|
|
|
n = (c & 0xff) << 8;
|
|
|
|
|
}
|
|
|
|
|
filter->cache |= n;
|
|
|
|
|
filter->status++;
|
|
|
|
|
break;
|
|
|
|
|
default:
|
|
|
|
|
if (endian) {
|
|
|
|
|
n = (c & 0xff) << 8;
|
|
|
|
|
} else {
|
|
|
|
|
n = c & 0xff;
|
|
|
|
|
}
|
|
|
|
|
n |= filter->cache & 0xffff;
|
|
|
|
|
filter->status &= ~0xff;
|
|
|
|
|
if (n == 0xfffe) {
|
|
|
|
|
if (endian) {
|
|
|
|
|
filter->status = 0; /* big-endian */
|
|
|
|
|
} else {
|
|
|
|
|
filter->status = 0x100; /* little-endian */
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0xfeff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else if (n >= 0xd800 && n < 0xdc00) {
|
|
|
|
|
filter->cache = ((n & 0x3ff) << 16) + 0x400000;
|
|
|
|
|
} else if (n >= 0xdc00 && n < 0xe000) {
|
|
|
|
|
n &= 0x3ff;
|
|
|
|
|
n |= (filter->cache & 0xfff0000) >> 6;
|
|
|
|
|
filter->cache = 0;
|
|
|
|
|
if (n >= MBFL_WCSPLANE_SUPMIN && n < MBFL_WCSPLANE_SUPMAX) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else { /* illegal character */
|
|
|
|
|
n &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
n |= MBFL_WCSGROUP_THROUGH;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
filter->cache = 0;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* UTF-16BE => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_utf16be_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
|
|
|
|
|
switch (filter->status) {
|
|
|
|
|
case 0:
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
n = (c & 0xff) << 8;
|
|
|
|
|
filter->cache |= n;
|
|
|
|
|
break;
|
|
|
|
|
default:
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
n = (filter->cache & 0xff00) | (c & 0xff);
|
|
|
|
|
if (n >= 0xd800 && n < 0xdc00) {
|
|
|
|
|
filter->cache = ((n & 0x3ff) << 16) + 0x400000;
|
|
|
|
|
} else if (n >= 0xdc00 && n < 0xe000) {
|
|
|
|
|
n &= 0x3ff;
|
|
|
|
|
n |= (filter->cache & 0xfff0000) >> 6;
|
|
|
|
|
filter->cache = 0;
|
|
|
|
|
if (n >= MBFL_WCSPLANE_SUPMIN && n < MBFL_WCSPLANE_SUPMAX) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else { /* illegal character */
|
|
|
|
|
n &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
n |= MBFL_WCSGROUP_THROUGH;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
filter->cache = 0;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => UTF-16BE
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_utf16be(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < MBFL_WCSPLANE_UCS2MAX) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)((c >> 8) & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(c & 0xff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else if (c >= MBFL_WCSPLANE_SUPMIN && c < MBFL_WCSPLANE_SUPMAX) {
|
|
|
|
|
n = ((c >> 10) - 0x40) | 0xd800;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)((n >> 8) & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(n & 0xff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
n = (c & 0x3ff) | 0xdc00;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)((n >> 8) & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(n & 0xff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* UTF-16LE => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_utf16le_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
|
|
|
|
|
switch (filter->status) {
|
|
|
|
|
case 0:
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
n = c & 0xff;
|
|
|
|
|
filter->cache |= n;
|
|
|
|
|
break;
|
|
|
|
|
default:
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
n = (filter->cache & 0xff) | ((c & 0xff) << 8);
|
|
|
|
|
if (n >= 0xd800 && n < 0xdc00) {
|
|
|
|
|
filter->cache = ((n & 0x3ff) << 16) + 0x400000;
|
|
|
|
|
} else if (n >= 0xdc00 && n < 0xe000) {
|
|
|
|
|
n &= 0x3ff;
|
|
|
|
|
n |= (filter->cache & 0xfff0000) >> 6;
|
|
|
|
|
filter->cache = 0;
|
|
|
|
|
if (n >= MBFL_WCSPLANE_SUPMIN && n < MBFL_WCSPLANE_SUPMAX) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else { /* illegal character */
|
|
|
|
|
n &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
n |= MBFL_WCSGROUP_THROUGH;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
filter->cache = 0;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => UTF-16LE
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_utf16le(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < MBFL_WCSPLANE_UCS2MAX) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((c >> 8) & 0xff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else if (c >= MBFL_WCSPLANE_SUPMIN && c < MBFL_WCSPLANE_SUPMAX) {
|
|
|
|
|
n = ((c >> 10) - 0x40) | 0xd800;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((n >> 8) & 0xff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
n = (c & 0x3ff) | 0xdc00;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(n & 0xff, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((n >> 8) & 0xff, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* UTF-8 => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_utf8_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s;
|
|
|
|
|
|
|
|
|
|
if (c < 0x80) {
|
|
|
|
|
if (c >= 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
} else if (c < 0xc0) {
|
|
|
|
|
switch (filter->status & 0xff) {
|
|
|
|
|
case 0x10: /* 2byte code 2nd char */
|
|
|
|
|
case 0x21: /* 3byte code 3rd char */
|
|
|
|
|
case 0x32: /* 4byte code 4th char */
|
|
|
|
|
case 0x43: /* 5byte code 5th char */
|
|
|
|
|
case 0x54: /* 6byte code 6th char */
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
s = filter->cache | (c & 0x3f);
|
|
|
|
|
if (s >= 0x80) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
case 0x20: /* 3byte code 2nd char */
|
|
|
|
|
case 0x31: /* 4byte code 3rd char */
|
|
|
|
|
case 0x42: /* 5byte code 4th char */
|
|
|
|
|
case 0x53: /* 6byte code 5th char */
|
|
|
|
|
filter->cache |= ((c & 0x3f) << 6);
|
|
|
|
|
filter->status++;
|
|
|
|
|
break;
|
|
|
|
|
case 0x30: /* 4byte code 2nd char */
|
|
|
|
|
case 0x41: /* 5byte code 3rd char */
|
|
|
|
|
case 0x52: /* 6byte code 4th char */
|
|
|
|
|
filter->cache |= ((c & 0x3f) << 12);
|
|
|
|
|
filter->status++;
|
|
|
|
|
break;
|
|
|
|
|
case 0x40: /* 5byte code 2nd char */
|
|
|
|
|
case 0x51: /* 6byte code 3rd char */
|
|
|
|
|
filter->cache |= ((c & 0x3f) << 18);
|
|
|
|
|
filter->status++;
|
|
|
|
|
break;
|
|
|
|
|
case 0x50: /* 6byte code 2nd char */
|
|
|
|
|
filter->cache |= ((c & 0x3f) << 24);
|
|
|
|
|
filter->status++;
|
|
|
|
|
break;
|
|
|
|
|
default:
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
} else if (c < 0xe0) { /* 2byte code first char */
|
|
|
|
|
filter->status = 0x10;
|
|
|
|
|
filter->cache = (c & 0x1f) << 6;
|
|
|
|
|
} else if (c < 0xf0) { /* 3byte code first char */
|
|
|
|
|
filter->status = 0x20;
|
|
|
|
|
filter->cache = (c & 0xf) << 12;
|
|
|
|
|
} else if (c < 0xf8) { /* 4byte code first char */
|
|
|
|
|
filter->status = 0x30;
|
|
|
|
|
filter->cache = (c & 0x7) << 18;
|
|
|
|
|
} else if (c < 0xfc) { /* 5byte code first char */
|
|
|
|
|
filter->status = 0x40;
|
|
|
|
|
filter->cache = (c & 0x3) << 24;
|
|
|
|
|
} else if (c < 0xfe) { /* 6 byte code first char */
|
|
|
|
|
filter->status = 0x50;
|
|
|
|
|
filter->cache = (c & 0x1) << 30;
|
|
|
|
|
} else {
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
filter->cache = 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => UTF-8
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_utf8(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (c >= 0 && c < MBFL_WCSGROUP_UCS4MAX) {
|
|
|
|
|
if (c < 0x80) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else if (c < 0x800) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(((c >> 6) & 0x1f) | 0xc0, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((c & 0x3f) | 0x80, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else if (c < 0x10000) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(((c >> 12) & 0x0f) | 0xe0, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(((c >> 6) & 0x3f) | 0x80, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((c & 0x3f) | 0x80, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else if (c < 0x200000) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(((c >> 18) & 0x07) | 0xf0, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(((c >> 12) & 0x3f) | 0x80, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(((c >> 6) & 0x3f) | 0x80, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((c & 0x3f) | 0x80, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else if (c < 0x4000000) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(((c >> 24) & 0x03) | 0xf8, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(((c >> 18) & 0x3f) | 0x80, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(((c >> 12) & 0x3f) | 0x80, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(((c >> 6) & 0x3f) | 0x80, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((c & 0x3f) | 0x80, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(((c >> 30) & 0x01) | 0xfc, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(((c >> 24) & 0x3f) | 0x80, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(((c >> 18) & 0x3f) | 0x80, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(((c >> 12) & 0x3f) | 0x80, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(((c >> 6) & 0x3f) | 0x80, filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)((c & 0x3f) | 0x80, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* UTF-7 => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_utf7_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s, n;
|
|
|
|
|
|
|
|
|
|
n = -1;
|
|
|
|
|
if (filter->status != 0) { /* Modified Base64 */
|
|
|
|
|
if (c >= 0x41 && c <= 0x5a) { /* A - Z */
|
|
|
|
|
n = c - 65;
|
|
|
|
|
} else if (c >= 0x61 && c <= 0x7a) { /* a - z */
|
|
|
|
|
n = c - 71;
|
|
|
|
|
} else if (c >= 0x30 && c <= 0x39) { /* 0 - 9 */
|
|
|
|
|
n = c + 4;
|
|
|
|
|
} else if (c == 0x2b) { /* '+' */
|
|
|
|
|
n = 62;
|
|
|
|
|
} else if (c == 0x2f) { /* '/' */
|
|
|
|
|
n = 63;
|
|
|
|
|
}
|
|
|
|
|
if (n < 0 || n > 63) {
|
|
|
|
|
if (c == 0x2d) {
|
|
|
|
|
if (filter->status == 1) { /* "+-" -> "+" */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x2b, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
} else if (c >= 0 && c < 0x80) { /* ASCII exclude '-' */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else { /* illegal character */
|
|
|
|
|
s = c & MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
filter->cache = 0;
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
switch (filter->status) {
|
|
|
|
|
/* directly encoded characters */
|
|
|
|
|
case 0:
|
|
|
|
|
if (c == 0x2b) { /* '+' shift character */
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
} else if (c >= 0 && c < 0x80) { /* ASCII */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else { /* illegal character */
|
|
|
|
|
s = c & MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
/* decode Modified Base64 */
|
|
|
|
|
case 1:
|
|
|
|
|
case 2:
|
|
|
|
|
filter->cache |= n << 10;
|
|
|
|
|
filter->status = 3;
|
|
|
|
|
break;
|
|
|
|
|
case 3:
|
|
|
|
|
filter->cache |= n << 4;
|
|
|
|
|
filter->status = 4;
|
|
|
|
|
break;
|
|
|
|
|
case 4:
|
|
|
|
|
s = ((n >> 2) & 0xf) | (filter->cache & 0xffff);
|
|
|
|
|
n = (n & 0x3) << 14;
|
|
|
|
|
filter->status = 5;
|
|
|
|
|
if (s >= 0xd800 && s < 0xdc00) {
|
|
|
|
|
s = (((s & 0x3ff) << 16) + 0x400000) | n;
|
|
|
|
|
filter->cache = s;
|
|
|
|
|
} else if (s >= 0xdc00 && s < 0xe000) {
|
|
|
|
|
s &= 0x3ff;
|
|
|
|
|
s |= (filter->cache & 0xfff0000) >> 6;
|
|
|
|
|
filter->cache = n;
|
|
|
|
|
if (s >= MBFL_WCSPLANE_SUPMIN && s < MBFL_WCSPLANE_SUPMAX) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else { /* illegal character */
|
|
|
|
|
s &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
filter->cache = n;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 5:
|
|
|
|
|
filter->cache |= n << 8;
|
|
|
|
|
filter->status = 6;
|
|
|
|
|
break;
|
|
|
|
|
case 6:
|
|
|
|
|
filter->cache |= n << 2;
|
|
|
|
|
filter->status = 7;
|
|
|
|
|
break;
|
|
|
|
|
case 7:
|
|
|
|
|
s = ((n >> 4) & 0x3) | (filter->cache & 0xffff);
|
|
|
|
|
n = (n & 0xf) << 12;
|
|
|
|
|
filter->status = 8;
|
|
|
|
|
if (s >= 0xd800 && s < 0xdc00) {
|
|
|
|
|
s = (((s & 0x3ff) << 16) + 0x400000) | n;
|
|
|
|
|
filter->cache = s;
|
|
|
|
|
} else if (s >= 0xdc00 && s < 0xe000) {
|
|
|
|
|
s &= 0x3ff;
|
|
|
|
|
s |= (filter->cache & 0xfff0000) >> 6;
|
|
|
|
|
filter->cache = n;
|
|
|
|
|
if (s >= MBFL_WCSPLANE_SUPMIN && s < MBFL_WCSPLANE_SUPMAX) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else { /* illegal character */
|
|
|
|
|
s &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
filter->cache = n;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 8:
|
|
|
|
|
filter->cache |= n << 6;
|
|
|
|
|
filter->status = 9;
|
|
|
|
|
break;
|
|
|
|
|
case 9:
|
|
|
|
|
s = n | (filter->cache & 0xffff);
|
|
|
|
|
filter->status = 2;
|
|
|
|
|
if (s >= 0xd800 && s < 0xdc00) {
|
|
|
|
|
s = (((s & 0x3ff) << 16) + 0x400000);
|
|
|
|
|
filter->cache = s;
|
|
|
|
|
} else if (s >= 0xdc00 && s < 0xe000) {
|
|
|
|
|
s &= 0x3ff;
|
|
|
|
|
s |= (filter->cache & 0xfff0000) >> 6;
|
|
|
|
|
filter->cache = 0;
|
|
|
|
|
if (s >= MBFL_WCSPLANE_SUPMIN && s < MBFL_WCSPLANE_SUPMAX) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else { /* illegal character */
|
|
|
|
|
s &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
filter->cache = 0;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
default:
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => UTF-7
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_utf7(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s, n;
|
|
|
|
|
|
|
|
|
|
n = 0;
|
|
|
|
|
if (c >= 0 && c < 0x80) { /* ASCII */
|
|
|
|
|
if (c >= 0x41 && c <= 0x5a) { /* A - Z */
|
|
|
|
|
n = 1;
|
|
|
|
|
} else if (c >= 0x61 && c <= 0x7a) { /* a - z */
|
|
|
|
|
n = 1;
|
|
|
|
|
} else if (c >= 0x30 && c <= 0x39) { /* 0 - 9 */
|
|
|
|
|
n = 1;
|
|
|
|
|
} else if (c == '\0') { /* '\0' */
|
|
|
|
|
n = 1;
|
|
|
|
|
} else if (c == 0x2f) { /* '/' */
|
|
|
|
|
n = 1;
|
|
|
|
|
} else if (c == 0x2d) { /* '-' */
|
|
|
|
|
n = 1;
|
|
|
|
|
} else if (c == 0x20) { /* SPACE */
|
|
|
|
|
n = 2;
|
|
|
|
|
} else if (c == 0x09) { /* HTAB */
|
|
|
|
|
n = 2;
|
|
|
|
|
} else if (c == 0x0d) { /* CR */
|
|
|
|
|
n = 2;
|
|
|
|
|
} else if (c == 0x0a) { /* LF */
|
|
|
|
|
n = 2;
|
|
|
|
|
} else if (c == 0x27) { /* "'" */
|
|
|
|
|
n = 2;
|
|
|
|
|
} else if (c == 0x28) { /* '(' */
|
|
|
|
|
n = 2;
|
|
|
|
|
} else if (c == 0x29) { /* ')' */
|
|
|
|
|
n = 2;
|
|
|
|
|
} else if (c == 0x2c) { /* ',' */
|
|
|
|
|
n = 2;
|
|
|
|
|
} else if (c == 0x2e) { /* '.' */
|
|
|
|
|
n = 2;
|
|
|
|
|
} else if (c == 0x3a) { /* ':' */
|
|
|
|
|
n = 2;
|
|
|
|
|
} else if (c == 0x3f) { /* '?' */
|
|
|
|
|
n = 2;
|
|
|
|
|
}
|
|
|
|
|
} else if (c >= 0 && c < MBFL_WCSPLANE_UCS2MAX) {
|
|
|
|
|
;
|
|
|
|
|
} else if (c >= MBFL_WCSPLANE_SUPMIN && c < MBFL_WCSPLANE_SUPMAX) {
|
|
|
|
|
s = ((c >> 10) - 0x40) | 0xd800;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->filter_function)(s, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
s = (c & 0x3ff) | 0xdc00;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->filter_function)(s, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return c;
|
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
switch (filter->status) {
|
|
|
|
|
case 0:
|
|
|
|
|
if (n != 0) { /* directly encode characters */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else { /* Modified Base64 */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x2b, filter->data TSRMLS_CC)); /* '+' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
filter->status++;
|
|
|
|
|
filter->cache = c;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
/* encode Modified Base64 */
|
|
|
|
|
case 1:
|
|
|
|
|
s = filter->cache;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(s >> 10) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(s >> 4) & 0x3f], filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (n != 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(s << 2) & 0x3c], filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (n == 1) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x2d, filter->data TSRMLS_CC)); /* '-' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
filter->status = 0;
|
|
|
|
|
} else {
|
|
|
|
|
filter->status++;
|
|
|
|
|
filter->cache = ((s & 0xf) << 16) | c;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 2:
|
|
|
|
|
s = filter->cache;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(s >> 14) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(s >> 8) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(s >> 2) & 0x3f], filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (n != 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(s << 4) & 0x30], filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (n == 1) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x2d, filter->data TSRMLS_CC)); /* '-' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
filter->status = 0;
|
|
|
|
|
} else {
|
|
|
|
|
filter->status++;
|
|
|
|
|
filter->cache = ((s & 0x3) << 16) | c;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 3:
|
|
|
|
|
s = filter->cache;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(s >> 12) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(s >> 6) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[s & 0x3f], filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (n != 0) {
|
|
|
|
|
if (n == 1) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x2d, filter->data TSRMLS_CC)); /* '-' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
filter->status = 0;
|
|
|
|
|
} else {
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
filter->cache = c;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
default:
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_utf7_flush(mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int status, cache;
|
|
|
|
|
|
|
|
|
|
status = filter->status;
|
|
|
|
|
cache = filter->cache;
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
filter->cache = 0;
|
|
|
|
|
/* flush fragments */
|
|
|
|
|
switch (status) {
|
|
|
|
|
case 1:
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(cache >> 10) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(cache >> 4) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(cache << 2) & 0x3c], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(0x2d, filter->data TSRMLS_CC)); /* '-' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 2:
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(cache >> 14) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(cache >> 8) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(cache >> 2) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(cache << 4) & 0x30], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(0x2d, filter->data TSRMLS_CC)); /* '-' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 3:
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(cache >> 12) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[(cache >> 6) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_base64_table[cache & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(0x2d, filter->data TSRMLS_CC)); /* '-' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* UTF7-IMAP => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_utf7imap_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s, n;
|
|
|
|
|
|
|
|
|
|
n = -1;
|
|
|
|
|
if (filter->status != 0) { /* Modified Base64 */
|
|
|
|
|
if (c >= 0x41 && c <= 0x5a) { /* A - Z */
|
|
|
|
|
n = c - 65;
|
|
|
|
|
} else if (c >= 0x61 && c <= 0x7a) { /* a - z */
|
|
|
|
|
n = c - 71;
|
|
|
|
|
} else if (c >= 0x30 && c <= 0x39) { /* 0 - 9 */
|
|
|
|
|
n = c + 4;
|
|
|
|
|
} else if (c == 0x2b) { /* '+' */
|
|
|
|
|
n = 62;
|
|
|
|
|
} else if (c == 0x2c) { /* ',' */
|
|
|
|
|
n = 63;
|
|
|
|
|
}
|
|
|
|
|
if (n < 0 || n > 63) {
|
|
|
|
|
if (c == 0x2d) {
|
|
|
|
|
if (filter->status == 1) { /* "&-" -> "&" */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x26, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
} else if (c >= 0 && c < 0x80) { /* ASCII exclude '-' */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else { /* illegal character */
|
|
|
|
|
s = c & MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
filter->cache = 0;
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
switch (filter->status) {
|
|
|
|
|
/* directly encoded characters */
|
|
|
|
|
case 0:
|
|
|
|
|
if (c == 0x26) { /* '&' shift character */
|
|
|
|
|
filter->status++;
|
|
|
|
|
} else if (c >= 0 && c < 0x80) { /* ASCII */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else { /* illegal character */
|
|
|
|
|
s = c & MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
/* decode Modified Base64 */
|
|
|
|
|
case 1:
|
|
|
|
|
case 2:
|
|
|
|
|
filter->cache |= n << 10;
|
|
|
|
|
filter->status = 3;
|
|
|
|
|
break;
|
|
|
|
|
case 3:
|
|
|
|
|
filter->cache |= n << 4;
|
|
|
|
|
filter->status = 4;
|
|
|
|
|
break;
|
|
|
|
|
case 4:
|
|
|
|
|
s = ((n >> 2) & 0xf) | (filter->cache & 0xffff);
|
|
|
|
|
n = (n & 0x3) << 14;
|
|
|
|
|
filter->status = 5;
|
|
|
|
|
if (s >= 0xd800 && s < 0xdc00) {
|
|
|
|
|
s = (((s & 0x3ff) << 16) + 0x400000) | n;
|
|
|
|
|
filter->cache = s;
|
|
|
|
|
} else if (s >= 0xdc00 && s < 0xe000) {
|
|
|
|
|
s &= 0x3ff;
|
|
|
|
|
s |= (filter->cache & 0xfff0000) >> 6;
|
|
|
|
|
filter->cache = n;
|
|
|
|
|
if (s >= MBFL_WCSPLANE_SUPMIN && s < MBFL_WCSPLANE_SUPMAX) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else { /* illegal character */
|
|
|
|
|
s &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
filter->cache = n;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 5:
|
|
|
|
|
filter->cache |= n << 8;
|
|
|
|
|
filter->status = 6;
|
|
|
|
|
break;
|
|
|
|
|
case 6:
|
|
|
|
|
filter->cache |= n << 2;
|
|
|
|
|
filter->status = 7;
|
|
|
|
|
break;
|
|
|
|
|
case 7:
|
|
|
|
|
s = ((n >> 4) & 0x3) | (filter->cache & 0xffff);
|
|
|
|
|
n = (n & 0xf) << 12;
|
|
|
|
|
filter->status = 8;
|
|
|
|
|
if (s >= 0xd800 && s < 0xdc00) {
|
|
|
|
|
s = (((s & 0x3ff) << 16) + 0x400000) | n;
|
|
|
|
|
filter->cache = s;
|
|
|
|
|
} else if (s >= 0xdc00 && s < 0xe000) {
|
|
|
|
|
s &= 0x3ff;
|
|
|
|
|
s |= (filter->cache & 0xfff0000) >> 6;
|
|
|
|
|
filter->cache = n;
|
|
|
|
|
if (s >= MBFL_WCSPLANE_SUPMIN && s < MBFL_WCSPLANE_SUPMAX) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else { /* illegal character */
|
|
|
|
|
s &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
filter->cache = n;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 8:
|
|
|
|
|
filter->cache |= n << 6;
|
|
|
|
|
filter->status = 9;
|
|
|
|
|
break;
|
|
|
|
|
case 9:
|
|
|
|
|
s = n | (filter->cache & 0xffff);
|
|
|
|
|
filter->status = 2;
|
|
|
|
|
if (s >= 0xd800 && s < 0xdc00) {
|
|
|
|
|
s = (((s & 0x3ff) << 16) + 0x400000);
|
|
|
|
|
filter->cache = s;
|
|
|
|
|
} else if (s >= 0xdc00 && s < 0xe000) {
|
|
|
|
|
s &= 0x3ff;
|
|
|
|
|
s |= (filter->cache & 0xfff0000) >> 6;
|
|
|
|
|
filter->cache = 0;
|
|
|
|
|
if (s >= MBFL_WCSPLANE_SUPMIN && s < MBFL_WCSPLANE_SUPMAX) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else { /* illegal character */
|
|
|
|
|
s &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
filter->cache = 0;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
default:
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static const unsigned char mbfl_utf7imap_base64_table[] =
|
|
|
|
|
{
|
|
|
|
|
/* 'A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I', 'J', 'K', 'L', 'M', */
|
|
|
|
|
0x41,0x42,0x43,0x44,0x45,0x46,0x47,0x48,0x49,0x4a,0x4b,0x4c,0x4d,
|
|
|
|
|
/* 'N', 'O', 'P', 'Q', 'R', 'S', 'T', 'U', 'V', 'W', 'X', 'Y', 'Z', */
|
|
|
|
|
0x4e,0x4f,0x50,0x51,0x52,0x53,0x54,0x55,0x56,0x57,0x58,0x59,0x5a,
|
|
|
|
|
/* 'a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i', 'j', 'k', 'l', 'm', */
|
|
|
|
|
0x61,0x62,0x63,0x64,0x65,0x66,0x67,0x68,0x69,0x6a,0x6b,0x6c,0x6d,
|
|
|
|
|
/* 'n', 'o', 'p', 'q', 'r', 's', 't', 'u', 'v', 'w', 'x', 'y', 'z', */
|
|
|
|
|
0x6e,0x6f,0x70,0x71,0x72,0x73,0x74,0x75,0x76,0x77,0x78,0x79,0x7a,
|
|
|
|
|
/* '0', '1', '2', '3', '4', '5', '6', '7', '8', '9', '+', ',', '\0' */
|
|
|
|
|
0x30,0x31,0x32,0x33,0x34,0x35,0x36,0x37,0x38,0x39,0x2b,0x2c,0x00
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => UTF7-IMAP
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_utf7imap(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n, s;
|
|
|
|
|
|
|
|
|
|
n = 0;
|
|
|
|
|
if (c == 0x26) {
|
|
|
|
|
n = 1;
|
|
|
|
|
} else if ((c >= 0x20 && c <= 0x7e) || c == 0) {
|
|
|
|
|
n = 2;
|
|
|
|
|
} else if (c >= 0 && c < MBFL_WCSPLANE_UCS2MAX) {
|
|
|
|
|
;
|
|
|
|
|
} else if (c >= MBFL_WCSPLANE_SUPMIN && c < MBFL_WCSPLANE_SUPMAX) {
|
|
|
|
|
s = ((c >> 10) - 0x40) | 0xd800;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->filter_function)(s, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
s = (c & 0x3ff) | 0xdc00;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->filter_function)(s, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return c;
|
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
switch (filter->status) {
|
|
|
|
|
case 0:
|
|
|
|
|
if (n != 0) { /* directly encode characters */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (n == 1) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x2d, filter->data TSRMLS_CC)); /* '-' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
} else { /* Modified Base64 */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x26, filter->data TSRMLS_CC)); /* '&' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
filter->status = 1;
|
|
|
|
|
filter->cache = c;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
/* encode Modified Base64 */
|
|
|
|
|
case 1:
|
|
|
|
|
s = filter->cache;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[(s >> 10) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[(s >> 4) & 0x3f], filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (n != 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[(s << 2) & 0x3c], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(0x2d, filter->data TSRMLS_CC)); /* '-' */
|
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (n == 1) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x2d, filter->data TSRMLS_CC)); /* '-' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
} else {
|
|
|
|
|
filter->status = 2;
|
|
|
|
|
filter->cache = ((s & 0xf) << 16) | c;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 2:
|
|
|
|
|
s = filter->cache;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[(s >> 14) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[(s >> 8) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[(s >> 2) & 0x3f], filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (n != 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[(s << 4) & 0x30], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(0x2d, filter->data TSRMLS_CC)); /* '-' */
|
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (n == 1) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x2d, filter->data TSRMLS_CC)); /* '-' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
} else {
|
|
|
|
|
filter->status = 3;
|
|
|
|
|
filter->cache = ((s & 0x3) << 16) | c;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 3:
|
|
|
|
|
s = filter->cache;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[(s >> 12) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[(s >> 6) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[s & 0x3f], filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (n != 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x2d, filter->data TSRMLS_CC)); /* '-' */
|
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (n == 1) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(0x2d, filter->data TSRMLS_CC)); /* '-' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
} else {
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
filter->cache = c;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
default:
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_utf7imap_flush(mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int status, cache;
|
|
|
|
|
|
|
|
|
|
status = filter->status;
|
|
|
|
|
cache = filter->cache;
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
filter->cache = 0;
|
|
|
|
|
/* flush fragments */
|
|
|
|
|
switch (status) {
|
|
|
|
|
case 1:
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[(cache >> 10) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[(cache >> 4) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[(cache << 2) & 0x3c], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(0x2d, filter->data TSRMLS_CC)); /* '-' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 2:
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[(cache >> 14) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[(cache >> 8) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[(cache >> 2) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[(cache << 4) & 0x30], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(0x2d, filter->data TSRMLS_CC)); /* '-' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 3:
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[(cache >> 12) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[(cache >> 6) & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(mbfl_utf7imap_base64_table[cache & 0x3f], filter->data TSRMLS_CC));
|
|
|
|
|
CK((*filter->output_function)(0x2d, filter->data TSRMLS_CC)); /* '-' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => ASCII
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_ascii(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (c >= 0 && c < 0x80) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
2001-08-25 09:21:43 +00:00
|
|
|
|
/*
|
|
|
|
|
* wchar => cp1252
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_cp1252(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-08-25 09:21:43 +00:00
|
|
|
|
{
|
2002-04-07 18:09:31 +00:00
|
|
|
|
int s=-1, n;
|
2001-08-25 09:21:43 +00:00
|
|
|
|
|
|
|
|
|
if (c >= 0x100) {
|
|
|
|
|
/* look it up from the cp1252 table */
|
|
|
|
|
s = -1;
|
2002-05-05 11:42:18 +00:00
|
|
|
|
n = 31;
|
2001-08-25 09:21:43 +00:00
|
|
|
|
while (n >= 0) {
|
2002-05-05 11:42:18 +00:00
|
|
|
|
if (c == cp1252_ucs_table[n] && c != 0xfffe) {
|
2001-08-25 09:21:43 +00:00
|
|
|
|
s = 0x80 + n;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
if (s <= 0 && (c & ~MBFL_WCSPLANE_MASK) == MBFL_WCSPLANE_8859_1)
|
|
|
|
|
{
|
|
|
|
|
s = c & MBFL_WCSPLANE_MASK;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
else if (c >= 0 && c < 0x100) {
|
|
|
|
|
s = c;
|
|
|
|
|
}
|
|
|
|
|
if (s >= 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-08-25 09:21:43 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-08-25 09:21:43 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* cp1252 => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_cp1252_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-08-25 09:21:43 +00:00
|
|
|
|
{
|
|
|
|
|
int s;
|
|
|
|
|
|
|
|
|
|
if (c >= 0x80 && c < 0xa0) {
|
|
|
|
|
s = cp1252_ucs_table[c - 0x80];
|
|
|
|
|
} else {
|
|
|
|
|
s = c;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-08-25 09:21:43 +00:00
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => ISO-8859-1
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_8859_1(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (c >= 0 && c < 0x100) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(c, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* ISO-8859-2 => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_8859_2_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else if (c >= 0xa0 && c < 0x100) {
|
|
|
|
|
s = iso8859_2_ucs_table[c - 0xa0];
|
|
|
|
|
if (s <= 0) {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSPLANE_MASK;
|
|
|
|
|
s |= MBFL_WCSPLANE_8859_2;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => ISO-8859-2
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_8859_2(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s, n;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else {
|
|
|
|
|
s = -1;
|
|
|
|
|
n = 95;
|
|
|
|
|
while (n >= 0) {
|
|
|
|
|
if (c == iso8859_2_ucs_table[n]) {
|
|
|
|
|
s = 0xa0 + n;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
if (s <= 0 && (c & ~MBFL_WCSPLANE_MASK) == MBFL_WCSPLANE_8859_2) {
|
|
|
|
|
s = c & MBFL_WCSPLANE_MASK;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (s >= 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* ISO-8859-3 => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_8859_3_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else if (c >= 0xa0 && c < 0x100) {
|
|
|
|
|
s = iso8859_3_ucs_table[c - 0xa0];
|
|
|
|
|
if (s <= 0) {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSPLANE_MASK;
|
|
|
|
|
s |= MBFL_WCSPLANE_8859_3;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => ISO-8859-3
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_8859_3(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s, n;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else {
|
|
|
|
|
s = -1;
|
|
|
|
|
n = 95;
|
|
|
|
|
while (n >= 0) {
|
|
|
|
|
if (c == iso8859_3_ucs_table[n]) {
|
|
|
|
|
s = 0xa0 + n;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
if (s <= 0 && (c & ~MBFL_WCSPLANE_MASK) == MBFL_WCSPLANE_8859_3) {
|
|
|
|
|
s = c & MBFL_WCSPLANE_MASK;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (s >= 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* ISO-8859-4 => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_8859_4_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else if (c >= 0xa0 && c < 0x100) {
|
|
|
|
|
s = iso8859_4_ucs_table[c - 0xa0];
|
|
|
|
|
if (s <= 0) {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSPLANE_MASK;
|
|
|
|
|
s |= MBFL_WCSPLANE_8859_4;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => ISO-8859-4
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_8859_4(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s, n;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else {
|
|
|
|
|
s = -1;
|
|
|
|
|
n = 95;
|
|
|
|
|
while (n >= 0) {
|
|
|
|
|
if (c == iso8859_4_ucs_table[n]) {
|
|
|
|
|
s = 0xa0 + n;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
if (s <= 0 && (c & ~MBFL_WCSPLANE_MASK) == MBFL_WCSPLANE_8859_4) {
|
|
|
|
|
s = c & MBFL_WCSPLANE_MASK;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (s >= 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* ISO-8859-5 => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_8859_5_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else if (c >= 0xa0 && c < 0x100) {
|
|
|
|
|
s = iso8859_5_ucs_table[c - 0xa0];
|
|
|
|
|
if (s <= 0) {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSPLANE_MASK;
|
|
|
|
|
s |= MBFL_WCSPLANE_8859_5;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => ISO-8859-5
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_8859_5(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s, n;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else {
|
|
|
|
|
s = -1;
|
|
|
|
|
n = 95;
|
|
|
|
|
while (n >= 0) {
|
|
|
|
|
if (c == iso8859_5_ucs_table[n]) {
|
|
|
|
|
s = 0xa0 + n;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
if (s <= 0 && (c & ~MBFL_WCSPLANE_MASK) == MBFL_WCSPLANE_8859_5) {
|
|
|
|
|
s = c & MBFL_WCSPLANE_MASK;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (s >= 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* ISO-8859-6 => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_8859_6_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else if (c >= 0xa0 && c < 0x100) {
|
|
|
|
|
s = iso8859_6_ucs_table[c - 0xa0];
|
|
|
|
|
if (s <= 0) {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSPLANE_MASK;
|
|
|
|
|
s |= MBFL_WCSPLANE_8859_6;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => ISO-8859-6
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_8859_6(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s, n;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else {
|
|
|
|
|
s = -1;
|
|
|
|
|
n = 95;
|
|
|
|
|
while (n >= 0) {
|
|
|
|
|
if (c == iso8859_6_ucs_table[n]) {
|
|
|
|
|
s = 0xa0 + n;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
if (s <= 0 && (c & ~MBFL_WCSPLANE_MASK) == MBFL_WCSPLANE_8859_6) {
|
|
|
|
|
s = c & MBFL_WCSPLANE_MASK;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (s >= 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* ISO-8859-7 => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_8859_7_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else if (c >= 0xa0 && c < 0x100) {
|
|
|
|
|
s = iso8859_7_ucs_table[c - 0xa0];
|
|
|
|
|
if (s <= 0) {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSPLANE_MASK;
|
|
|
|
|
s |= MBFL_WCSPLANE_8859_7;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => ISO-8859-7
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_8859_7(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s, n;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else {
|
|
|
|
|
s = -1;
|
|
|
|
|
n = 95;
|
|
|
|
|
while (n >= 0) {
|
|
|
|
|
if (c == iso8859_7_ucs_table[n]) {
|
|
|
|
|
s = 0xa0 + n;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
if (s <= 0 && (c & ~MBFL_WCSPLANE_MASK) == MBFL_WCSPLANE_8859_7) {
|
|
|
|
|
s = c & MBFL_WCSPLANE_MASK;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (s >= 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* ISO-8859-8 => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_8859_8_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else if (c >= 0xa0 && c < 0x100) {
|
|
|
|
|
s = iso8859_8_ucs_table[c - 0xa0];
|
|
|
|
|
if (s <= 0) {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSPLANE_MASK;
|
|
|
|
|
s |= MBFL_WCSPLANE_8859_8;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => ISO-8859-8
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_8859_8(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s, n;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else {
|
|
|
|
|
s = -1;
|
|
|
|
|
n = 95;
|
|
|
|
|
while (n >= 0) {
|
|
|
|
|
if (c == iso8859_8_ucs_table[n]) {
|
|
|
|
|
s = 0xa0 + n;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
if (s <= 0 && (c & ~MBFL_WCSPLANE_MASK) == MBFL_WCSPLANE_8859_8) {
|
|
|
|
|
s = c & MBFL_WCSPLANE_MASK;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (s >= 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* ISO-8859-9 => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_8859_9_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else if (c >= 0xa0 && c < 0x100) {
|
|
|
|
|
s = iso8859_9_ucs_table[c - 0xa0];
|
|
|
|
|
if (s <= 0) {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSPLANE_MASK;
|
|
|
|
|
s |= MBFL_WCSPLANE_8859_9;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => ISO-8859-9
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_8859_9(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s, n;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else {
|
|
|
|
|
s = -1;
|
|
|
|
|
n = 95;
|
|
|
|
|
while (n >= 0) {
|
|
|
|
|
if (c == iso8859_9_ucs_table[n]) {
|
|
|
|
|
s = 0xa0 + n;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
if (s <= 0 && (c & ~MBFL_WCSPLANE_MASK) == MBFL_WCSPLANE_8859_9) {
|
|
|
|
|
s = c & MBFL_WCSPLANE_MASK;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (s >= 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* ISO-8859-10 => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_8859_10_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else if (c >= 0xa0 && c < 0x100) {
|
|
|
|
|
s = iso8859_10_ucs_table[c - 0xa0];
|
|
|
|
|
if (s <= 0) {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSPLANE_MASK;
|
|
|
|
|
s |= MBFL_WCSPLANE_8859_10;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => ISO-8859-10
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_8859_10(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s, n;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else {
|
|
|
|
|
s = -1;
|
|
|
|
|
n = 95;
|
|
|
|
|
while (n >= 0) {
|
|
|
|
|
if (c == iso8859_10_ucs_table[n]) {
|
|
|
|
|
s = 0xa0 + n;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
if (s <= 0 && (c & ~MBFL_WCSPLANE_MASK) == MBFL_WCSPLANE_8859_10) {
|
|
|
|
|
s = c & MBFL_WCSPLANE_MASK;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (s >= 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* ISO-8859-13 => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_8859_13_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else if (c >= 0xa0 && c < 0x100) {
|
|
|
|
|
s = iso8859_13_ucs_table[c - 0xa0];
|
|
|
|
|
if (s <= 0) {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSPLANE_MASK;
|
|
|
|
|
s |= MBFL_WCSPLANE_8859_13;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => ISO-8859-13
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_8859_13(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s, n;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else {
|
|
|
|
|
s = -1;
|
|
|
|
|
n = 95;
|
|
|
|
|
while (n >= 0) {
|
|
|
|
|
if (c == iso8859_13_ucs_table[n]) {
|
|
|
|
|
s = 0xa0 + n;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
if (s <= 0 && (c & ~MBFL_WCSPLANE_MASK) == MBFL_WCSPLANE_8859_13) {
|
|
|
|
|
s = c & MBFL_WCSPLANE_MASK;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (s >= 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* ISO-8859-14 => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_8859_14_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else if (c >= 0xa0 && c < 0x100) {
|
|
|
|
|
s = iso8859_14_ucs_table[c - 0xa0];
|
|
|
|
|
if (s <= 0) {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSPLANE_MASK;
|
|
|
|
|
s |= MBFL_WCSPLANE_8859_14;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => ISO-8859-14
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_8859_14(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s, n;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else {
|
|
|
|
|
s = -1;
|
|
|
|
|
n = 95;
|
|
|
|
|
while (n >= 0) {
|
|
|
|
|
if (c == iso8859_14_ucs_table[n]) {
|
|
|
|
|
s = 0xa0 + n;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
if (s <= 0 && (c & ~MBFL_WCSPLANE_MASK) == MBFL_WCSPLANE_8859_14) {
|
|
|
|
|
s = c & MBFL_WCSPLANE_MASK;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (s >= 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* ISO-8859-15 => wchar
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_8859_15_wchar(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else if (c >= 0xa0 && c < 0x100) {
|
|
|
|
|
s = iso8859_15_ucs_table[c - 0xa0];
|
|
|
|
|
if (s <= 0) {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSPLANE_MASK;
|
|
|
|
|
s |= MBFL_WCSPLANE_8859_15;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
s = c;
|
|
|
|
|
s &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
s |= MBFL_WCSGROUP_THROUGH;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* wchar => ISO-8859-15
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_wchar_8859_15(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s, n;
|
|
|
|
|
|
|
|
|
|
if (c >= 0 && c < 0xa0) {
|
|
|
|
|
s = c;
|
|
|
|
|
} else {
|
|
|
|
|
s = -1;
|
|
|
|
|
n = 95;
|
|
|
|
|
while (n >= 0) {
|
|
|
|
|
if (c == iso8859_15_ucs_table[n]) {
|
|
|
|
|
s = 0xa0 + n;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
if (s <= 0 && (c & ~MBFL_WCSPLANE_MASK) == MBFL_WCSPLANE_8859_15) {
|
|
|
|
|
s = c & MBFL_WCSPLANE_MASK;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (s >= 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK((*filter->output_function)(s, filter->data TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (filter->illegal_mode != MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
CK(mbfl_filt_conv_illegal_output(c, filter TSRMLS_CC));
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
*
|
|
|
|
|
* identify filter functions
|
|
|
|
|
*
|
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
static void
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_ident_common_ctor(mbfl_identify_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
filter->flag = 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static void
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_ident_common_dtor(mbfl_identify_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_ident_ascii(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (c >= 0x20 && c < 0x80) {
|
|
|
|
|
;
|
|
|
|
|
} else if (c == 0x0d || c == 0x0a || c == 0x09 || c == 0) { /* CR or LF or HTAB or null */
|
|
|
|
|
;
|
|
|
|
|
} else {
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_ident_utf8(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (c < 0x80) {
|
|
|
|
|
if (c < 0) {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
} else if (c != 0 && filter->status) {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
} else if (c < 0xc0) {
|
|
|
|
|
switch (filter->status) {
|
|
|
|
|
case 0x20: /* 3 byte code 2nd char */
|
|
|
|
|
case 0x30: /* 4 byte code 2nd char */
|
|
|
|
|
case 0x31: /* 4 byte code 3rd char */
|
|
|
|
|
case 0x40: /* 5 byte code 2nd char */
|
|
|
|
|
case 0x41: /* 5 byte code 3rd char */
|
|
|
|
|
case 0x42: /* 5 byte code 4th char */
|
|
|
|
|
case 0x50: /* 6 byte code 2nd char */
|
|
|
|
|
case 0x51: /* 6 byte code 3rd char */
|
|
|
|
|
case 0x52: /* 6 byte code 4th char */
|
|
|
|
|
case 0x53: /* 6 byte code 5th char */
|
|
|
|
|
filter->status++;
|
|
|
|
|
break;
|
|
|
|
|
case 0x10: /* 2 byte code 2nd char */
|
|
|
|
|
case 0x21: /* 3 byte code 3rd char */
|
|
|
|
|
case 0x32: /* 4 byte code 4th char */
|
|
|
|
|
case 0x43: /* 5 byte code 5th char */
|
|
|
|
|
case 0x54: /* 6 byte code 6th char */
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
default:
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
if (filter->status) {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
if (c < 0xe0) { /* 2 byte code first char */
|
|
|
|
|
filter->status = 0x10;
|
|
|
|
|
} else if (c < 0xf0) { /* 3 byte code 1st char */
|
|
|
|
|
filter->status = 0x20;
|
|
|
|
|
} else if (c < 0xf8) { /* 4 byte code 1st char */
|
|
|
|
|
filter->status = 0x30;
|
|
|
|
|
} else if (c < 0xfc) { /* 5 byte code 1st char */
|
|
|
|
|
filter->status = 0x40;
|
|
|
|
|
} else if (c < 0xfe) { /* 6 byte code 1st char */
|
|
|
|
|
filter->status = 0x50;
|
|
|
|
|
} else {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_ident_utf7(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
|
|
|
|
|
switch (filter->status) {
|
|
|
|
|
/* directly encoded characters */
|
|
|
|
|
case 0:
|
|
|
|
|
if (c == 0x2b) { /* '+' shift character */
|
|
|
|
|
filter->status++;
|
|
|
|
|
} else if (c == 0x5c || c == 0x7e || c < 0 || c > 0x7f) { /* illegal character */
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
/* Modified Base64 */
|
|
|
|
|
case 1:
|
|
|
|
|
case 2:
|
|
|
|
|
n = 0;
|
|
|
|
|
if (c >= 0x41 && c <= 0x5a) { /* A - Z */
|
|
|
|
|
n = 1;
|
|
|
|
|
} else if (c >= 0x61 && c <= 0x7a) { /* a - z */
|
|
|
|
|
n = 1;
|
|
|
|
|
} else if (c >= 0x30 && c <= 0x39) { /* 0 - 9 */
|
|
|
|
|
n = 1;
|
|
|
|
|
} else if (c == 0x2b) { /* '+' */
|
|
|
|
|
n = 1;
|
|
|
|
|
} else if (c == 0x2f) { /* '/' */
|
|
|
|
|
n = 1;
|
|
|
|
|
}
|
|
|
|
|
if (n <= 0) {
|
|
|
|
|
if (filter->status == 1 && c != 0x2d) {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
} else if (c < 0 || c > 0x7f) {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
} else {
|
|
|
|
|
filter->status = 2;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
default:
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#if defined(HAVE_MBSTR_JA)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_ident_eucjp(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
switch (filter->status) {
|
|
|
|
|
case 0: /* latin */
|
|
|
|
|
if (c >= 0 && c < 0x80) { /* ok */
|
|
|
|
|
;
|
|
|
|
|
} else if (c > 0xa0 && c < 0xff) { /* kanji first char */
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
} else if (c == 0x8e) { /* kana first char */
|
|
|
|
|
filter->status = 2;
|
|
|
|
|
} else if (c == 0x8f) { /* X 0212 first char */
|
|
|
|
|
filter->status = 3;
|
|
|
|
|
} else { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 1: /* got first half */
|
|
|
|
|
if (c < 0xa1 || c > 0xfe) { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 2: /* got 0x8e */
|
|
|
|
|
if (c < 0xa1 || c > 0xdf) { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 3: /* got 0x8f */
|
|
|
|
|
if (c < 0xa1 || c > 0xfe) { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
filter->status++;
|
|
|
|
|
break;
|
|
|
|
|
case 4: /* got 0x8f */
|
|
|
|
|
if (c < 0xa1 || c > 0xfe) { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
default:
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_ident_sjis(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (filter->status) { /* kanji second char */
|
|
|
|
|
if (c < 0x40 || c > 0xfc || c == 0x7f) { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
} else if (c >= 0 && c < 0x80) { /* latin ok */
|
|
|
|
|
;
|
|
|
|
|
} else if (c > 0xa0 && c < 0xe0) { /* kana ok */
|
|
|
|
|
;
|
|
|
|
|
} else if (c > 0x80 && c < 0xf0 && c != 0xa0) { /* kanji first char */
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
} else { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_ident_sjiswin(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (filter->status) { /* kanji second char */
|
|
|
|
|
if (c < 0x40 || c > 0xfc || c == 0x7f) { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
} else if (c >= 0 && c < 0x80) { /* latin ok */
|
|
|
|
|
;
|
|
|
|
|
} else if (c > 0xa0 && c < 0xe0) { /* kana ok */
|
|
|
|
|
;
|
|
|
|
|
} else if (c > 0x80 && c < 0xfd && c != 0xa0) { /* kanji first char */
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
} else { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_ident_jis(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
retry:
|
|
|
|
|
switch (filter->status & 0xf) {
|
|
|
|
|
/* case 0x00: ASCII */
|
|
|
|
|
/* case 0x10: X 0201 latin */
|
|
|
|
|
/* case 0x20: X 0201 kana */
|
|
|
|
|
/* case 0x80: X 0208 */
|
|
|
|
|
/* case 0x90: X 0212 */
|
|
|
|
|
case 0:
|
|
|
|
|
if (c == 0x1b) {
|
|
|
|
|
filter->status += 2;
|
|
|
|
|
} else if (c == 0x0e) { /* "kana in" */
|
|
|
|
|
filter->status = 0x20;
|
|
|
|
|
} else if (c == 0x0f) { /* "kana out" */
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
} else if ((filter->status == 0x80 || filter->status == 0x90) && c > 0x20 && c < 0x7f) { /* kanji first char */
|
|
|
|
|
filter->status += 1;
|
|
|
|
|
} else if (c >= 0 && c < 0x80) { /* latin, CTLs */
|
|
|
|
|
;
|
|
|
|
|
} else {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
/* case 0x81: X 0208 second char */
|
|
|
|
|
/* case 0x91: X 0212 second char */
|
|
|
|
|
case 1:
|
|
|
|
|
filter->status &= ~0xf;
|
|
|
|
|
if (c == 0x1b) {
|
|
|
|
|
goto retry;
|
|
|
|
|
} else if (c < 0x21 || c > 0x7e) { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
/* ESC */
|
|
|
|
|
case 2:
|
|
|
|
|
if (c == 0x24) { /* '$' */
|
|
|
|
|
filter->status++;
|
|
|
|
|
} else if (c == 0x28) { /* '(' */
|
|
|
|
|
filter->status += 3;
|
|
|
|
|
} else {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
filter->status &= ~0xf;
|
|
|
|
|
goto retry;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
/* ESC $ */
|
|
|
|
|
case 3:
|
|
|
|
|
if (c == 0x40 || c == 0x42) { /* '@' or 'B' */
|
|
|
|
|
filter->status = 0x80;
|
|
|
|
|
} else if (c == 0x28) { /* '(' */
|
|
|
|
|
filter->status++;
|
|
|
|
|
} else {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
filter->status &= ~0xf;
|
|
|
|
|
goto retry;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
/* ESC $ ( */
|
|
|
|
|
case 4:
|
|
|
|
|
if (c == 0x40 || c == 0x42) { /* '@' or 'B' */
|
|
|
|
|
filter->status = 0x80;
|
|
|
|
|
} else if (c == 0x44) { /* 'D' */
|
|
|
|
|
filter->status = 0x90;
|
|
|
|
|
} else {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
filter->status &= ~0xf;
|
|
|
|
|
goto retry;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
/* ESC ( */
|
|
|
|
|
case 5:
|
|
|
|
|
if (c == 0x42 || c == 0x48) { /* 'B' or 'H' */
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
} else if (c == 0x4a) { /* 'J' */
|
|
|
|
|
filter->status = 0x10;
|
|
|
|
|
} else if (c == 0x49) { /* 'I' */
|
|
|
|
|
filter->status = 0x20;
|
|
|
|
|
} else {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
filter->status &= ~0xf;
|
|
|
|
|
goto retry;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
default:
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif /* HAVE_MBSTR_JA */
|
|
|
|
|
|
|
|
|
|
#if defined(HAVE_MBSTR_CN)
|
|
|
|
|
static int
|
|
|
|
|
mbfl_filt_ident_euccn(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
|
|
|
|
{
|
|
|
|
|
switch (filter->status) {
|
|
|
|
|
case 0: /* latin */
|
|
|
|
|
if (c >= 0 && c < 0x80) { /* ok */
|
|
|
|
|
;
|
|
|
|
|
} else if (c > 0xa0 && c < 0xff) { /* DBCS lead byte */
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
} else { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 1: /* got lead byte */
|
|
|
|
|
if (c < 0xa1 || c > 0xfe) { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
default:
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
|
|
|
|
mbfl_filt_ident_cp936(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
|
|
|
|
{
|
|
|
|
|
if (filter->status) { /* kanji second char */
|
|
|
|
|
if (c < 0x40 || c > 0xfe || c == 0x7f) { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
} else if (c >= 0 && c < 0x80) { /* latin ok */
|
|
|
|
|
;
|
|
|
|
|
} else if (c > 0x80 && c < 0xff) { /* DBCS lead byte */
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
} else { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
2002-05-12 13:06:13 +00:00
|
|
|
|
static int
|
|
|
|
|
mbfl_filt_ident_hz(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
|
|
|
|
{
|
|
|
|
|
switch (filter->status & 0xf) {
|
|
|
|
|
/* case 0x00: ASCII */
|
|
|
|
|
/* case 0x10: GB2312 */
|
|
|
|
|
case 0:
|
|
|
|
|
if (c == 0x7e) {
|
|
|
|
|
filter->status += 2;
|
|
|
|
|
} else if (filter->status == 0x10 && c > 0x20 && c < 0x7f) { /* DBCS first char */
|
|
|
|
|
filter->status += 1;
|
|
|
|
|
} else if (c >= 0 && c < 0x80) { /* latin, CTLs */
|
|
|
|
|
;
|
|
|
|
|
} else {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
/* case 0x11: GB2312 second char */
|
|
|
|
|
case 1:
|
|
|
|
|
filter->status &= ~0xf;
|
|
|
|
|
if (c < 0x21 || c > 0x7e) { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 2:
|
|
|
|
|
if (c == 0x7d) { /* '}' */
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
} else if (c == 0x7b) { /* '{' */
|
|
|
|
|
filter->status = 0x10;
|
|
|
|
|
} else if (c == 0x7e) { /* '~' */
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
} else {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
filter->status &= ~0xf;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
default:
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-30 12:00:42 +00:00
|
|
|
|
#endif /* HAVE_MBSTR_CN */
|
|
|
|
|
|
|
|
|
|
#if defined(HAVE_MBSTR_TW)
|
|
|
|
|
static int
|
|
|
|
|
mbfl_filt_ident_euctw(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
|
|
|
|
{
|
|
|
|
|
switch (filter->status) {
|
|
|
|
|
case 0: /* latin */
|
|
|
|
|
if (c >= 0 && c < 0x80) { /* ok */
|
|
|
|
|
;
|
|
|
|
|
} else if (c > 0xa0 && c < 0xff) { /* DBCS lead byte */
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
} else if (c == 0x8e) { /* DBCS lead byte */
|
|
|
|
|
filter->status = 2;
|
|
|
|
|
} else { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 1: /* got lead byte */
|
|
|
|
|
if (c < 0xa1 || c > 0xfe) { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 2: /* got lead byte */
|
|
|
|
|
if (c >= 0xa1 && c < 0xaf) { /* ok */
|
|
|
|
|
filter->status = 3;
|
|
|
|
|
} else {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 3: /* got lead byte */
|
|
|
|
|
if (c < 0xa1 || c > 0xfe) { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
filter->status = 4;
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 4: /* got lead byte */
|
|
|
|
|
if (c < 0xa1 || c > 0xfe) { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
default:
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
|
|
|
|
mbfl_filt_ident_big5(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
|
|
|
|
{
|
|
|
|
|
if (filter->status) { /* kanji second char */
|
|
|
|
|
if (c < 0x40 || (c > 0x7e && c < 0xa1) ||c > 0xfe) { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
} else if (c >= 0 && c < 0x80) { /* latin ok */
|
|
|
|
|
;
|
|
|
|
|
} else if (c > 0xa0 && c < 0xff) { /* DBCS lead byte */
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
} else { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#endif /* HAVE_MBSTR_TW */
|
|
|
|
|
|
|
|
|
|
#if defined(HAVE_MBSTR_KR)
|
|
|
|
|
static int
|
|
|
|
|
mbfl_filt_ident_euckr(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
|
|
|
|
{
|
|
|
|
|
switch (filter->status) {
|
|
|
|
|
case 0: /* latin */
|
|
|
|
|
if (c >= 0 && c < 0x80) { /* ok */
|
|
|
|
|
;
|
|
|
|
|
} else if (c > 0xa0 && c < 0xff) { /* DBCS lead byte */
|
|
|
|
|
filter->status = 1;
|
|
|
|
|
} else { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 1: /* got lead byte */
|
|
|
|
|
if (c < 0xa1 || c > 0xfe) { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
default:
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
|
|
|
|
mbfl_filt_ident_uhc(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
|
|
|
|
{
|
|
|
|
|
switch (filter->status) {
|
|
|
|
|
case 0: /* latin */
|
|
|
|
|
if (c >= 0 && c < 0x80) { /* ok */
|
|
|
|
|
;
|
|
|
|
|
} else if (c >= 0x81 && c <= 0xa0) { /* dbcs first char */
|
|
|
|
|
filter->status= 1;
|
|
|
|
|
} else if (c >= 0xa1 && c <= 0xc6) { /* dbcs first char */
|
|
|
|
|
filter->status= 2;
|
|
|
|
|
} else if (c >= 0xc7 && c <= 0xfe) { /* dbcs first char */
|
|
|
|
|
filter->status= 3;
|
|
|
|
|
} else { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
case 1:
|
|
|
|
|
case 2:
|
|
|
|
|
if (c < 0x41 || (c > 0x5a && c < 0x61)
|
|
|
|
|
|| (c > 0x7a && c < 0x81) || c > 0xfe) { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 3:
|
|
|
|
|
if (c < 0xa1 || c > 0xfe) { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
|
2002-05-24 22:28:42 +00:00
|
|
|
|
default:
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
|
|
|
|
mbfl_filt_ident_2022kr(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
|
|
|
|
{
|
|
|
|
|
retry:
|
|
|
|
|
switch (filter->status & 0xf) {
|
|
|
|
|
/* case 0x00: ASCII */
|
|
|
|
|
/* case 0x10: KSC5601 mode */
|
|
|
|
|
/* case 0x20: KSC5601 DBCS */
|
|
|
|
|
/* case 0x40: KSC5601 SBCS */
|
|
|
|
|
case 0:
|
|
|
|
|
if (!(filter->status & 0x10)) {
|
|
|
|
|
if (c == 0x1b)
|
|
|
|
|
filter->status += 2;
|
|
|
|
|
} else if (filter->status == 0x20 && c > 0x20 && c < 0x7f) { /* kanji first char */
|
|
|
|
|
filter->status += 1;
|
|
|
|
|
} else if (c >= 0 && c < 0x80) { /* latin, CTLs */
|
|
|
|
|
;
|
|
|
|
|
} else {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
/* case 0x21: KSC5601 second char */
|
|
|
|
|
case 1:
|
|
|
|
|
filter->status &= ~0xf;
|
|
|
|
|
if (c < 0x21 || c > 0x7e) { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
/* ESC */
|
|
|
|
|
case 2:
|
|
|
|
|
if (c == 0x24) { /* '$' */
|
|
|
|
|
filter->status++;
|
|
|
|
|
} else {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
filter->status &= ~0xf;
|
|
|
|
|
goto retry;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
/* ESC $ */
|
|
|
|
|
case 3:
|
|
|
|
|
if (c == 0x29) { /* ')' */
|
|
|
|
|
filter->status++;
|
|
|
|
|
} else {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
filter->status &= ~0xf;
|
|
|
|
|
goto retry;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
/* ESC $) */
|
|
|
|
|
case 5:
|
|
|
|
|
if (c == 0x43) { /* 'C' */
|
|
|
|
|
filter->status = 0x10;
|
|
|
|
|
} else {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
filter->status &= ~0xf;
|
|
|
|
|
goto retry;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
2002-04-30 12:00:42 +00:00
|
|
|
|
default:
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#endif /* HAVE_MBSTR_KR */
|
|
|
|
|
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2001-08-25 09:21:43 +00:00
|
|
|
|
/* We only distinguish the MS extensions to ISO-8859-1.
|
|
|
|
|
* Actually, this is pretty much a NO-OP, since the identification
|
|
|
|
|
* system doesn't allow us to discriminate between a positive match,
|
|
|
|
|
* a possible match and a definite non-match.
|
|
|
|
|
* The problem here is that cp1252 looks like SJIS for certain chars.
|
|
|
|
|
* */
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_ident_cp1252(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
2001-08-25 09:21:43 +00:00
|
|
|
|
{
|
|
|
|
|
if (c >= 0x80 && c < 0xa0)
|
|
|
|
|
filter->flag = 0;
|
|
|
|
|
else
|
|
|
|
|
filter->flag = 1; /* not it */
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
2002-05-21 07:00:34 +00:00
|
|
|
|
#if defined(HAVE_MBSTR_RU)
|
2002-08-20 10:00:28 +00:00
|
|
|
|
/* all of this is so ugly now! */
|
2002-05-21 07:00:34 +00:00
|
|
|
|
static int
|
2002-06-01 05:45:25 +00:00
|
|
|
|
mbfl_filt_ident_cp1251(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
2002-05-21 07:00:34 +00:00
|
|
|
|
{
|
|
|
|
|
if (c >= 0x80 && c < 0xff)
|
|
|
|
|
filter->flag = 0;
|
|
|
|
|
else
|
|
|
|
|
filter->flag = 1; /* not it */
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-06-01 05:45:25 +00:00
|
|
|
|
mbfl_filt_ident_cp866(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
2002-05-21 07:00:34 +00:00
|
|
|
|
{
|
|
|
|
|
if (c >= 0x80 && c < 0xff)
|
|
|
|
|
filter->flag = 0;
|
|
|
|
|
else
|
|
|
|
|
filter->flag = 1; /* not it */
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-06-01 05:45:25 +00:00
|
|
|
|
mbfl_filt_ident_koi8r(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
2002-05-21 07:00:34 +00:00
|
|
|
|
{
|
|
|
|
|
if (c >= 0x80 && c < 0xff)
|
|
|
|
|
filter->flag = 0;
|
|
|
|
|
else
|
|
|
|
|
filter->flag = 1; /* not it */
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
#endif /* HAVE_MBSTR_RU */
|
|
|
|
|
|
2001-05-01 01:52:55 +00:00
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_ident_2022jp(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
retry:
|
|
|
|
|
switch (filter->status & 0xf) {
|
|
|
|
|
/* case 0x00: ASCII */
|
|
|
|
|
/* case 0x10: X 0201 latin */
|
|
|
|
|
/* case 0x80: X 0208 */
|
|
|
|
|
case 0:
|
|
|
|
|
if (c == 0x1b) {
|
|
|
|
|
filter->status += 2;
|
|
|
|
|
} else if (filter->status == 0x80 && c > 0x20 && c < 0x7f) { /* kanji first char */
|
|
|
|
|
filter->status += 1;
|
|
|
|
|
} else if (c >= 0 && c < 0x80) { /* latin, CTLs */
|
|
|
|
|
;
|
|
|
|
|
} else {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
/* case 0x81: X 0208 second char */
|
|
|
|
|
case 1:
|
|
|
|
|
if (c == 0x1b) {
|
|
|
|
|
filter->status++;
|
|
|
|
|
} else {
|
|
|
|
|
filter->status &= ~0xf;
|
|
|
|
|
if (c < 0x21 || c > 0x7e) { /* bad */
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
/* ESC */
|
|
|
|
|
case 2:
|
|
|
|
|
if (c == 0x24) { /* '$' */
|
|
|
|
|
filter->status++;
|
|
|
|
|
} else if (c == 0x28) { /* '(' */
|
|
|
|
|
filter->status += 3;
|
|
|
|
|
} else {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
filter->status &= ~0xf;
|
|
|
|
|
goto retry;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
/* ESC $ */
|
|
|
|
|
case 3:
|
|
|
|
|
if (c == 0x40 || c == 0x42) { /* '@' or 'B' */
|
|
|
|
|
filter->status = 0x80;
|
|
|
|
|
} else {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
filter->status &= ~0xf;
|
|
|
|
|
goto retry;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
/* ESC ( */
|
|
|
|
|
case 5:
|
|
|
|
|
if (c == 0x42) { /* 'B' */
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
} else if (c == 0x4a) { /* 'J' */
|
|
|
|
|
filter->status = 0x10;
|
|
|
|
|
} else {
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
filter->status &= ~0xf;
|
|
|
|
|
goto retry;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
default:
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static void
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_ident_false_ctor(mbfl_identify_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
filter->flag = 1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_ident_false(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
filter->flag = 1; /* bad */
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_ident_true(int c, mbfl_identify_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* convert filter
|
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
/* setup filter function table */
|
|
|
|
|
static void
|
2002-08-02 10:22:31 +00:00
|
|
|
|
mbfl_convert_filter_set_vtbl(mbfl_convert_filter *filter, const struct mbfl_convert_vtbl *vtbl)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (filter && vtbl) {
|
|
|
|
|
filter->filter_ctor = vtbl->filter_ctor;
|
|
|
|
|
filter->filter_dtor = vtbl->filter_dtor;
|
|
|
|
|
filter->filter_function = vtbl->filter_function;
|
|
|
|
|
filter->filter_flush = vtbl->filter_flush;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_convert_vtbl *
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_convert_filter_get_vtbl(enum mbfl_no_encoding from, enum mbfl_no_encoding to)
|
|
|
|
|
{
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const struct mbfl_convert_vtbl *vtbl;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
int i;
|
|
|
|
|
|
|
|
|
|
if (to == mbfl_no_encoding_base64 ||
|
|
|
|
|
to == mbfl_no_encoding_qprint ||
|
|
|
|
|
to == mbfl_no_encoding_7bit) {
|
|
|
|
|
from = mbfl_no_encoding_8bit;
|
|
|
|
|
} else if (from == mbfl_no_encoding_base64 ||
|
2001-05-12 23:42:09 +00:00
|
|
|
|
from == mbfl_no_encoding_qprint ||
|
|
|
|
|
from == mbfl_no_encoding_uuencode) {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
to = mbfl_no_encoding_8bit;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
i = 0;
|
|
|
|
|
while ((vtbl = mbfl_convert_filter_list[i++]) != NULL){
|
|
|
|
|
if (vtbl->from == from && vtbl->to == to) {
|
|
|
|
|
return vtbl;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
static void
|
|
|
|
|
mbfl_convert_filter_select_vtbl(mbfl_convert_filter *filter)
|
|
|
|
|
{
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const struct mbfl_convert_vtbl *vtbl;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
vtbl = mbfl_convert_filter_get_vtbl(filter->from->no_encoding, filter->to->no_encoding);
|
|
|
|
|
if (vtbl == NULL) {
|
|
|
|
|
vtbl = &vtbl_pass;
|
|
|
|
|
}
|
|
|
|
|
mbfl_convert_filter_set_vtbl(filter, vtbl);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/* filter pipe */
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filter_output_pipe(int c, void* data TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
mbfl_convert_filter *filter = (mbfl_convert_filter*)data;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
return (*filter->filter_function)(c, filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/* null output */
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filter_output_null(int c, void* data TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
mbfl_convert_filter *
|
|
|
|
|
mbfl_convert_filter_new(
|
|
|
|
|
enum mbfl_no_encoding from,
|
|
|
|
|
enum mbfl_no_encoding to,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
int (*output_function)(int, void* TSRMLS_DC),
|
|
|
|
|
int (*flush_function)(void* TSRMLS_DC),
|
|
|
|
|
void* data TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
mbfl_convert_filter * filter;
|
|
|
|
|
|
|
|
|
|
/* allocate */
|
|
|
|
|
filter = (mbfl_convert_filter *)mbfl_malloc(sizeof(mbfl_convert_filter));
|
|
|
|
|
if (filter == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* encoding structure */
|
|
|
|
|
filter->from = mbfl_no2encoding(from);
|
|
|
|
|
filter->to = mbfl_no2encoding(to);
|
|
|
|
|
if (filter->from == NULL) {
|
|
|
|
|
filter->from = &mbfl_encoding_pass;
|
|
|
|
|
}
|
|
|
|
|
if (filter->to == NULL) {
|
|
|
|
|
filter->to = &mbfl_encoding_pass;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (output_function != NULL) {
|
|
|
|
|
filter->output_function = output_function;
|
|
|
|
|
} else {
|
|
|
|
|
filter->output_function = mbfl_filter_output_null;
|
|
|
|
|
}
|
|
|
|
|
filter->flush_function = flush_function;
|
|
|
|
|
filter->data = data;
|
|
|
|
|
filter->illegal_mode = MBFL_OUTPUTFILTER_ILLEGAL_MODE_CHAR;
|
|
|
|
|
filter->illegal_substchar = 0x3f; /* '?' */
|
|
|
|
|
|
|
|
|
|
/* setup the function table */
|
|
|
|
|
mbfl_convert_filter_select_vtbl(filter);
|
|
|
|
|
|
|
|
|
|
/* constructor */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*filter->filter_ctor)(filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return filter;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_delete(mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (filter) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*filter->filter_dtor)(filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_free((void*)filter);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_feed(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2002-04-10 12:47:41 +00:00
|
|
|
|
return (*filter->filter_function)(c, filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_flush(mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*filter->filter_flush)(filter TSRMLS_CC);
|
|
|
|
|
return (filter->flush_function ? (*filter->flush_function)(filter->data TSRMLS_CC) : 0);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void
|
|
|
|
|
mbfl_convert_filter_reset(
|
|
|
|
|
mbfl_convert_filter *filter,
|
|
|
|
|
enum mbfl_no_encoding from,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
enum mbfl_no_encoding to TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
/* destruct old filter */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*filter->filter_dtor)(filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
/* resset filter member */
|
|
|
|
|
filter->from = mbfl_no2encoding(from);
|
|
|
|
|
filter->to = mbfl_no2encoding(to);
|
|
|
|
|
|
|
|
|
|
/* set the vtbl */
|
|
|
|
|
mbfl_convert_filter_select_vtbl(filter);
|
|
|
|
|
|
|
|
|
|
/* construct new filter */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*filter->filter_ctor)(filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void
|
|
|
|
|
mbfl_convert_filter_copy(
|
|
|
|
|
mbfl_convert_filter *src,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter *dist TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
dist->filter_ctor = src->filter_ctor;
|
|
|
|
|
dist->filter_dtor = src->filter_dtor;
|
|
|
|
|
dist->filter_function = src->filter_function;
|
|
|
|
|
dist->filter_flush = src->filter_flush;
|
|
|
|
|
dist->output_function = src->output_function;
|
|
|
|
|
dist->flush_function = src->flush_function;
|
|
|
|
|
dist->data = src->data;
|
|
|
|
|
dist->status = src->status;
|
|
|
|
|
dist->cache = src->cache;
|
|
|
|
|
dist->from = src->from;
|
|
|
|
|
dist->to = src->to;
|
|
|
|
|
dist->illegal_mode = src->illegal_mode;
|
|
|
|
|
dist->illegal_substchar = src->illegal_substchar;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_devcat(mbfl_convert_filter *filter, mbfl_memory_device *src
|
|
|
|
|
TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
unsigned char *p;
|
|
|
|
|
|
|
|
|
|
p = src->buffer;
|
|
|
|
|
n = src->pos;
|
|
|
|
|
while (n > 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
if ((*filter->filter_function)(*p++, filter TSRMLS_CC) < 0) {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return -1;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return n;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_strcat(mbfl_convert_filter *filter, const unsigned char *p TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int c;
|
|
|
|
|
|
|
|
|
|
while ((c = *p++) != '\0') {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
if ((*filter->filter_function)(c, filter TSRMLS_CC) < 0) {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return -1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#if 0
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_strncat(mbfl_convert_filter *filter, const unsigned char *p,
|
|
|
|
|
int n TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
while (n > 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
if ((*filter->filter_function)(*p++, filter TSRMLS_CC) < 0) {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return -1;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return n;
|
|
|
|
|
}
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
/* illegal character output function for conv-filter */
|
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filt_conv_illegal_output(int c, mbfl_convert_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int mode_backup, ret, n, m, r;
|
|
|
|
|
|
|
|
|
|
ret = 0;
|
|
|
|
|
mode_backup = filter->illegal_mode;
|
|
|
|
|
filter->illegal_mode = MBFL_OUTPUTFILTER_ILLEGAL_MODE_NONE;
|
|
|
|
|
switch (mode_backup) {
|
|
|
|
|
case MBFL_OUTPUTFILTER_ILLEGAL_MODE_CHAR:
|
2002-04-10 12:47:41 +00:00
|
|
|
|
ret = (*filter->filter_function)(filter->illegal_substchar, filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
case MBFL_OUTPUTFILTER_ILLEGAL_MODE_LONG:
|
|
|
|
|
if (c >= 0) {
|
|
|
|
|
if (c < MBFL_WCSGROUP_UCS4MAX) { /* unicode */
|
2002-11-02 13:38:32 +00:00
|
|
|
|
ret = mbfl_convert_filter_strcat(filter, (const unsigned char *)"U+" TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (c < MBFL_WCSGROUP_WCHARMAX) {
|
|
|
|
|
m = c & ~MBFL_WCSPLANE_MASK;
|
|
|
|
|
switch (m) {
|
|
|
|
|
case MBFL_WCSPLANE_JIS0208:
|
2002-11-02 13:38:32 +00:00
|
|
|
|
ret = mbfl_convert_filter_strcat(filter, (const unsigned char *)"JIS+" TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
case MBFL_WCSPLANE_JIS0212:
|
2002-11-02 13:38:32 +00:00
|
|
|
|
ret = mbfl_convert_filter_strcat(filter, (const unsigned char *)"JIS2+" TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
case MBFL_WCSPLANE_WINCP932:
|
2002-11-02 13:38:32 +00:00
|
|
|
|
ret = mbfl_convert_filter_strcat(filter, (const unsigned char *)"W932+" TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
case MBFL_WCSPLANE_8859_1:
|
2002-11-02 13:38:32 +00:00
|
|
|
|
ret = mbfl_convert_filter_strcat(filter, (const unsigned char *)"I8859_1+" TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
default:
|
2002-11-02 13:38:32 +00:00
|
|
|
|
ret = mbfl_convert_filter_strcat(filter, (const unsigned char *)"?+" TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
c &= MBFL_WCSPLANE_MASK;
|
|
|
|
|
} else {
|
2002-11-02 13:38:32 +00:00
|
|
|
|
ret = mbfl_convert_filter_strcat(filter, (const unsigned char *)"BAD+" TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
c &= MBFL_WCSGROUP_MASK;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
if (ret >= 0) {
|
|
|
|
|
m = 0;
|
|
|
|
|
r = 28;
|
|
|
|
|
while (r >= 0) {
|
|
|
|
|
n = (c >> r) & 0xf;
|
|
|
|
|
if (n || m) {
|
|
|
|
|
m = 1;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
ret = (*filter->filter_function)(mbfl_hexchar_table[n], filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (ret < 0) {
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
r -= 4;
|
|
|
|
|
}
|
|
|
|
|
if (m == 0 && ret >= 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
ret = (*filter->filter_function)(mbfl_hexchar_table[0], filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
default:
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
filter->illegal_mode = mode_backup;
|
|
|
|
|
|
|
|
|
|
return ret;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* identify filter
|
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
static void
|
2002-08-02 10:22:31 +00:00
|
|
|
|
mbfl_identify_filter_set_vtbl(mbfl_identify_filter *filter, const struct mbfl_identify_vtbl *vtbl)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (filter && vtbl) {
|
|
|
|
|
filter->filter_ctor = vtbl->filter_ctor;
|
|
|
|
|
filter->filter_dtor = vtbl->filter_dtor;
|
|
|
|
|
filter->filter_function = vtbl->filter_function;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
static const struct mbfl_identify_vtbl *
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_identify_filter_get_vtbl(enum mbfl_no_encoding encoding)
|
|
|
|
|
{
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const struct mbfl_identify_vtbl * vtbl;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
int i;
|
|
|
|
|
|
|
|
|
|
i = 0;
|
|
|
|
|
while ((vtbl = mbfl_identify_filter_list[i++]) != NULL) {
|
|
|
|
|
if (vtbl->encoding == encoding) {
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return vtbl;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static void
|
|
|
|
|
mbfl_identify_filter_select_vtbl(mbfl_identify_filter *filter)
|
|
|
|
|
{
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const struct mbfl_identify_vtbl *vtbl;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
vtbl = mbfl_identify_filter_get_vtbl(filter->encoding->no_encoding);
|
|
|
|
|
if (vtbl == NULL) {
|
|
|
|
|
vtbl = &vtbl_identify_false;
|
|
|
|
|
}
|
|
|
|
|
mbfl_identify_filter_set_vtbl(filter, vtbl);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
mbfl_identify_filter *
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_identify_filter_new(enum mbfl_no_encoding encoding TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
mbfl_identify_filter * filter;
|
|
|
|
|
|
|
|
|
|
/* allocate */
|
|
|
|
|
filter = (mbfl_identify_filter *)mbfl_malloc(sizeof(mbfl_identify_filter));
|
|
|
|
|
if (filter == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* encoding structure */
|
|
|
|
|
filter->encoding = mbfl_no2encoding(encoding);
|
|
|
|
|
if (filter->encoding == NULL) {
|
|
|
|
|
filter->encoding = &mbfl_encoding_pass;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
filter->status = 0;
|
|
|
|
|
filter->flag = 0;
|
|
|
|
|
filter->score = 0;
|
|
|
|
|
|
|
|
|
|
/* setup the function table */
|
|
|
|
|
mbfl_identify_filter_select_vtbl(filter);
|
|
|
|
|
|
|
|
|
|
/* constructor */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*filter->filter_ctor)(filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return filter;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_identify_filter_delete(mbfl_identify_filter *filter TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (filter) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*filter->filter_dtor)(filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_free((void*)filter);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* buffering converter
|
|
|
|
|
*/
|
|
|
|
|
mbfl_buffer_converter *
|
|
|
|
|
mbfl_buffer_converter_new(
|
|
|
|
|
enum mbfl_no_encoding from,
|
|
|
|
|
enum mbfl_no_encoding to,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
int buf_initsz TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
mbfl_buffer_converter *convd;
|
|
|
|
|
|
|
|
|
|
/* allocate */
|
|
|
|
|
convd = (mbfl_buffer_converter*)mbfl_malloc(sizeof (mbfl_buffer_converter));
|
|
|
|
|
if (convd == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* initialize */
|
|
|
|
|
convd->from = mbfl_no2encoding(from);
|
|
|
|
|
convd->to = mbfl_no2encoding(to);
|
|
|
|
|
if (convd->from == NULL) {
|
|
|
|
|
convd->from = &mbfl_encoding_pass;
|
|
|
|
|
}
|
|
|
|
|
if (convd->to == NULL) {
|
|
|
|
|
convd->to = &mbfl_encoding_pass;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* create convert filter */
|
|
|
|
|
convd->filter1 = NULL;
|
|
|
|
|
convd->filter2 = NULL;
|
|
|
|
|
if (mbfl_convert_filter_get_vtbl(convd->from->no_encoding, convd->to->no_encoding) != NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
convd->filter1 = mbfl_convert_filter_new(convd->from->no_encoding, convd->to->no_encoding, mbfl_memory_device_output, 0, &convd->device TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
convd->filter2 = mbfl_convert_filter_new(mbfl_no_encoding_wchar, convd->to->no_encoding, mbfl_memory_device_output, 0, &convd->device TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (convd->filter2 != NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
convd->filter1 = mbfl_convert_filter_new(convd->from->no_encoding, mbfl_no_encoding_wchar, (int (*)(int, void* TSRMLS_DC))convd->filter2->filter_function, NULL, convd->filter2 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (convd->filter1 == NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_delete(convd->filter2 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
if (convd->filter1 == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_init(&convd->device, buf_initsz, buf_initsz/4 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return convd;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_buffer_converter_delete(mbfl_buffer_converter *convd TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (convd != NULL) {
|
|
|
|
|
if (convd->filter1) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_delete(convd->filter1 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
if (convd->filter2) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_delete(convd->filter2 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_clear(&convd->device TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_free((void*)convd);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_buffer_converter_reset(mbfl_buffer_converter *convd TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_reset(&convd->device TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_buffer_converter_illegal_mode(mbfl_buffer_converter *convd, int mode TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (convd != NULL) {
|
|
|
|
|
if (convd->filter2 != NULL) {
|
|
|
|
|
convd->filter2->illegal_mode = mode;
|
|
|
|
|
} else if (convd->filter1 != NULL) {
|
|
|
|
|
convd->filter1->illegal_mode = mode;
|
|
|
|
|
} else {
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return 1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_buffer_converter_illegal_substchar(mbfl_buffer_converter *convd, int substchar TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (convd != NULL) {
|
|
|
|
|
if (convd->filter2 != NULL) {
|
|
|
|
|
convd->filter2->illegal_substchar = substchar;
|
|
|
|
|
} else if (convd->filter1 != NULL) {
|
|
|
|
|
convd->filter1->illegal_substchar = substchar;
|
|
|
|
|
} else {
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return 1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_buffer_converter_strncat(mbfl_buffer_converter *convd, const unsigned char *p, int n TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
mbfl_convert_filter *filter;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
int (*filter_function)(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
if (convd != NULL && p != NULL) {
|
|
|
|
|
filter = convd->filter1;
|
|
|
|
|
if (filter != NULL) {
|
|
|
|
|
filter_function = filter->filter_function;
|
|
|
|
|
while (n > 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
if ((*filter_function)(*p++, filter TSRMLS_CC) < 0) {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return n;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_buffer_converter_feed(mbfl_buffer_converter *convd, mbfl_string *string TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
unsigned char *p;
|
|
|
|
|
mbfl_convert_filter *filter;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
int (*filter_function)(int c, mbfl_convert_filter *filter TSRMLS_DC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
if (convd == NULL || string == NULL) {
|
|
|
|
|
return -1;
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_realloc(&convd->device, convd->device.pos + string->len, string->len/4 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
/* feed data */
|
|
|
|
|
n = string->len;
|
|
|
|
|
p = string->val;
|
|
|
|
|
filter = convd->filter1;
|
|
|
|
|
if (filter != NULL) {
|
|
|
|
|
filter_function = filter->filter_function;
|
|
|
|
|
while (n > 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
if ((*filter_function)(*p++, filter TSRMLS_CC) < 0) {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return -1;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
|
2001-05-09 11:18:11 +00:00
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_buffer_converter_flush(mbfl_buffer_converter *convd TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2001-05-09 11:18:11 +00:00
|
|
|
|
if (convd == NULL) {
|
|
|
|
|
return -1;
|
|
|
|
|
}
|
|
|
|
|
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (convd->filter1 != NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_flush(convd->filter1 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
if (convd->filter2 != NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_flush(convd->filter2 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
2001-05-09 11:18:11 +00:00
|
|
|
|
|
|
|
|
|
return 0;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
mbfl_string *
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_buffer_converter_getbuffer(mbfl_buffer_converter *convd, mbfl_string *result TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2001-05-09 11:18:11 +00:00
|
|
|
|
if (convd != NULL && result != NULL && convd->device.buffer != NULL) {
|
|
|
|
|
result->no_encoding = convd->to->no_encoding;
|
|
|
|
|
result->val = convd->device.buffer;
|
|
|
|
|
result->len = convd->device.pos;
|
|
|
|
|
} else {
|
|
|
|
|
result = NULL;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return result;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
mbfl_string *
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_buffer_converter_result(mbfl_buffer_converter *convd, mbfl_string *result TSRMLS_DC)
|
2001-05-09 11:18:11 +00:00
|
|
|
|
{
|
|
|
|
|
if (convd == NULL || result == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
result->no_encoding = convd->to->no_encoding;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
return mbfl_memory_device_result(&convd->device, result TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
mbfl_string *
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_buffer_converter_feed_result(mbfl_buffer_converter *convd, mbfl_string *string,
|
|
|
|
|
mbfl_string *result TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2001-05-09 11:18:11 +00:00
|
|
|
|
if (convd == NULL || string == NULL || result == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_buffer_converter_feed(convd, string TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (convd->filter1 != NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_flush(convd->filter1 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
if (convd->filter2 != NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_flush(convd->filter2 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
2001-05-09 11:18:11 +00:00
|
|
|
|
result->no_encoding = convd->to->no_encoding;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
return mbfl_memory_device_result(&convd->device, result TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* encoding detector
|
|
|
|
|
*/
|
|
|
|
|
mbfl_encoding_detector *
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_encoding_detector_new(enum mbfl_no_encoding *elist, int eliztsz TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
mbfl_encoding_detector *identd;
|
|
|
|
|
|
|
|
|
|
int i, num;
|
|
|
|
|
mbfl_identify_filter *filter;
|
|
|
|
|
|
|
|
|
|
if (elist == NULL || eliztsz <= 0) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* allocate */
|
|
|
|
|
identd = (mbfl_encoding_detector*)mbfl_malloc(sizeof(mbfl_encoding_detector));
|
|
|
|
|
if (identd == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
identd->filter_list = (mbfl_identify_filter **)mbfl_calloc(eliztsz, sizeof(mbfl_identify_filter *));
|
|
|
|
|
if (identd->filter_list == NULL) {
|
|
|
|
|
mbfl_free(identd);
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* create filters */
|
|
|
|
|
i = 0;
|
|
|
|
|
num = 0;
|
|
|
|
|
while (i < eliztsz) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
filter = mbfl_identify_filter_new(elist[i] TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (filter != NULL) {
|
|
|
|
|
identd->filter_list[num] = filter;
|
|
|
|
|
num++;
|
|
|
|
|
}
|
|
|
|
|
i++;
|
|
|
|
|
}
|
|
|
|
|
identd->filter_list_size = num;
|
|
|
|
|
|
|
|
|
|
return identd;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_encoding_detector_delete(mbfl_encoding_detector *identd TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int i;
|
|
|
|
|
|
|
|
|
|
if (identd != NULL) {
|
|
|
|
|
if (identd->filter_list != NULL) {
|
|
|
|
|
i = identd->filter_list_size;
|
|
|
|
|
while (i > 0) {
|
|
|
|
|
i--;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_identify_filter_delete(identd->filter_list[i] TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
mbfl_free((void *)identd->filter_list);
|
|
|
|
|
}
|
|
|
|
|
mbfl_free((void *)identd);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_encoding_detector_feed(mbfl_encoding_detector *identd, mbfl_string *string TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int i, n, num, bad, res;
|
|
|
|
|
unsigned char *p;
|
|
|
|
|
mbfl_identify_filter *filter;
|
|
|
|
|
|
|
|
|
|
res = 0;
|
|
|
|
|
/* feed data */
|
|
|
|
|
if (identd != NULL && string != NULL && string->val != NULL) {
|
|
|
|
|
num = identd->filter_list_size;
|
|
|
|
|
n = string->len;
|
|
|
|
|
p = string->val;
|
|
|
|
|
while (n > 0) {
|
|
|
|
|
i = 0;
|
|
|
|
|
bad = 0;
|
|
|
|
|
while (i < num) {
|
|
|
|
|
filter = identd->filter_list[i];
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*filter->filter_function)(*p, filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (filter->flag) {
|
|
|
|
|
bad++;
|
|
|
|
|
}
|
|
|
|
|
i++;
|
|
|
|
|
}
|
|
|
|
|
if ((num - 1) <= bad) {
|
|
|
|
|
res = 1;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
p++;
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return res;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
enum mbfl_no_encoding mbfl_encoding_detector_judge(mbfl_encoding_detector *identd TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
mbfl_identify_filter *filter;
|
|
|
|
|
enum mbfl_no_encoding encoding;
|
|
|
|
|
int n;
|
|
|
|
|
|
|
|
|
|
/* judge */
|
|
|
|
|
encoding = mbfl_no_encoding_invalid;
|
|
|
|
|
if (identd != NULL) {
|
|
|
|
|
n = identd->filter_list_size - 1;
|
|
|
|
|
while (n >= 0) {
|
|
|
|
|
filter = identd->filter_list[n];
|
|
|
|
|
if (!filter->flag) {
|
|
|
|
|
encoding = filter->encoding->no_encoding;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return encoding;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* encoding converter
|
|
|
|
|
*/
|
|
|
|
|
mbfl_string *
|
|
|
|
|
mbfl_convert_encoding(
|
|
|
|
|
mbfl_string *string,
|
|
|
|
|
mbfl_string *result,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
enum mbfl_no_encoding toenc TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
unsigned char *p;
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_encoding *encoding;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_memory_device device;
|
|
|
|
|
mbfl_convert_filter *filter1;
|
|
|
|
|
mbfl_convert_filter *filter2;
|
|
|
|
|
|
|
|
|
|
/* initialize */
|
|
|
|
|
encoding = mbfl_no2encoding(toenc);
|
|
|
|
|
if (encoding == NULL || string == NULL || result == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
filter1 = NULL;
|
|
|
|
|
filter2 = NULL;
|
|
|
|
|
if (mbfl_convert_filter_get_vtbl(string->no_encoding, toenc) != NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
filter1 = mbfl_convert_filter_new(string->no_encoding, toenc, mbfl_memory_device_output, 0, &device TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
filter2 = mbfl_convert_filter_new(mbfl_no_encoding_wchar, toenc, mbfl_memory_device_output, 0, &device TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (filter2 != NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
filter1 = mbfl_convert_filter_new(string->no_encoding, mbfl_no_encoding_wchar, (int (*)(int, void* TSRMLS_DC))filter2->filter_function, NULL, filter2 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (filter1 == NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_delete(filter2 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
if (filter1 == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
filter2->illegal_mode = MBFL_OUTPUTFILTER_ILLEGAL_MODE_CHAR;
|
|
|
|
|
filter2->illegal_substchar = 0x3f; /* '?' */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_init(&device, string->len, (string->len >> 2) + 8 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
/* feed data */
|
|
|
|
|
n = string->len;
|
|
|
|
|
p = string->val;
|
|
|
|
|
if (p != NULL) {
|
|
|
|
|
while (n > 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
if ((*filter1->filter_function)(*p++, filter1 TSRMLS_CC) < 0) {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_flush(filter1 TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(filter1 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (filter2 != NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_flush(filter2 TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(filter2 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
return mbfl_memory_device_result(&device, result TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* identify encoding
|
|
|
|
|
*/
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_encoding *
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_identify_encoding(mbfl_string *string, enum mbfl_no_encoding *elist, int eliztsz TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int i, n, num, bad;
|
|
|
|
|
unsigned char *p;
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const struct mbfl_identify_vtbl *vtbl;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_identify_filter *flist, *filter;
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_encoding *encoding;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
/* initialize */
|
|
|
|
|
flist = (mbfl_identify_filter *)mbfl_calloc(eliztsz, sizeof(mbfl_identify_filter));
|
|
|
|
|
if (flist == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
i = 0;
|
|
|
|
|
num = 0;
|
|
|
|
|
if (elist != NULL) {
|
|
|
|
|
while (i < eliztsz) {
|
|
|
|
|
vtbl = mbfl_identify_filter_get_vtbl(elist[i]);
|
|
|
|
|
if (vtbl != NULL) {
|
|
|
|
|
filter = &flist[num];
|
|
|
|
|
mbfl_identify_filter_set_vtbl(filter, vtbl);
|
|
|
|
|
filter->encoding = mbfl_no2encoding(vtbl->encoding);
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*filter->filter_ctor)(filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
num++;
|
|
|
|
|
}
|
|
|
|
|
i++;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* feed data */
|
|
|
|
|
n = string->len;
|
|
|
|
|
p = string->val;
|
|
|
|
|
if (p != NULL) {
|
|
|
|
|
while (n > 0) {
|
|
|
|
|
i = 0;
|
|
|
|
|
bad = 0;
|
|
|
|
|
while (i < num) {
|
|
|
|
|
filter = &flist[i];
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*filter->filter_function)(*p, filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (filter->flag) {
|
|
|
|
|
bad++;
|
|
|
|
|
}
|
|
|
|
|
i++;
|
|
|
|
|
}
|
|
|
|
|
if ((num - 1) <= bad) {
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
p++;
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* judge */
|
|
|
|
|
i = num - 1;
|
|
|
|
|
bad = 1;
|
|
|
|
|
encoding = NULL;
|
|
|
|
|
while (i >= 0) {
|
|
|
|
|
filter = &flist[i];
|
|
|
|
|
if (filter->flag) {
|
|
|
|
|
bad++;
|
|
|
|
|
} else {
|
|
|
|
|
encoding = filter->encoding;
|
|
|
|
|
}
|
|
|
|
|
i--;
|
|
|
|
|
}
|
|
|
|
|
#if 0
|
|
|
|
|
if (bad < num) {
|
|
|
|
|
encoding = NULL;
|
|
|
|
|
}
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
i = 0;
|
|
|
|
|
while (i < num) {
|
|
|
|
|
filter = &flist[i];
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*filter->filter_dtor)(filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
i++;
|
|
|
|
|
}
|
|
|
|
|
mbfl_free((void *)flist);
|
|
|
|
|
|
|
|
|
|
return encoding;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
const char*
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_identify_encoding_name(mbfl_string *string, enum mbfl_no_encoding *elist, int eliztsz TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_encoding *encoding;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
encoding = mbfl_identify_encoding(string, elist, eliztsz TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (encoding != NULL &&
|
|
|
|
|
encoding->no_encoding > mbfl_no_encoding_charset_min &&
|
|
|
|
|
encoding->no_encoding < mbfl_no_encoding_charset_max) {
|
|
|
|
|
return encoding->name;
|
|
|
|
|
} else {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const enum mbfl_no_encoding
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_identify_encoding_no(mbfl_string *string, enum mbfl_no_encoding *elist, int eliztsz TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_encoding *encoding;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
encoding = mbfl_identify_encoding(string, elist, eliztsz TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (encoding != NULL &&
|
|
|
|
|
encoding->no_encoding > mbfl_no_encoding_charset_min &&
|
|
|
|
|
encoding->no_encoding < mbfl_no_encoding_charset_max) {
|
|
|
|
|
return encoding->no_encoding;
|
|
|
|
|
} else {
|
|
|
|
|
return mbfl_no_encoding_invalid;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* strlen
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
filter_count_output(int c, void *data TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
(*(int *)data)++;
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_strlen(mbfl_string *string TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int len, n, m, k;
|
|
|
|
|
unsigned char *p;
|
|
|
|
|
const unsigned char *mbtab;
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_encoding *encoding;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
encoding = mbfl_no2encoding(string->no_encoding);
|
|
|
|
|
if (encoding == NULL || string == NULL) {
|
|
|
|
|
return -1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
len = 0;
|
|
|
|
|
if (encoding->flag & MBFL_ENCTYPE_SBCS) {
|
|
|
|
|
len = string->len;
|
|
|
|
|
} else if (encoding->flag & (MBFL_ENCTYPE_WCS2BE | MBFL_ENCTYPE_WCS2LE)) {
|
|
|
|
|
len = string->len/2;
|
|
|
|
|
} else if (encoding->flag & (MBFL_ENCTYPE_WCS4BE | MBFL_ENCTYPE_WCS4LE)) {
|
|
|
|
|
len = string->len/4;
|
|
|
|
|
} else if (encoding->mblen_table != NULL) {
|
|
|
|
|
mbtab = encoding->mblen_table;
|
|
|
|
|
n = 0;
|
|
|
|
|
p = string->val;
|
|
|
|
|
k = string->len;
|
|
|
|
|
/* count */
|
|
|
|
|
if (p != NULL) {
|
|
|
|
|
while (n < k) {
|
|
|
|
|
m = mbtab[*p];
|
|
|
|
|
n += m;
|
|
|
|
|
p += m;
|
|
|
|
|
len++;
|
|
|
|
|
};
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
/* wchar filter */
|
|
|
|
|
mbfl_convert_filter *filter = mbfl_convert_filter_new(
|
|
|
|
|
string->no_encoding,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
filter_count_output, 0, &len TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (filter == NULL) {
|
|
|
|
|
return -1;
|
|
|
|
|
}
|
|
|
|
|
/* count */
|
|
|
|
|
n = string->len;
|
|
|
|
|
p = string->val;
|
|
|
|
|
if (p != NULL) {
|
|
|
|
|
while (n > 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*filter->filter_function)(*p++, filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_delete(filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return len;
|
|
|
|
|
}
|
|
|
|
|
|
2002-05-08 12:33:44 +00:00
|
|
|
|
#ifdef ZEND_MULTIBYTE
|
|
|
|
|
/*
|
|
|
|
|
* oddlen
|
|
|
|
|
*/
|
|
|
|
|
int
|
|
|
|
|
mbfl_oddlen(mbfl_string *string)
|
|
|
|
|
{
|
|
|
|
|
int len, n, m, k;
|
|
|
|
|
unsigned char *p;
|
|
|
|
|
const unsigned char *mbtab;
|
2002-10-20 02:57:40 +00:00
|
|
|
|
const mbfl_encoding *encoding;
|
2002-05-08 12:33:44 +00:00
|
|
|
|
|
|
|
|
|
encoding = mbfl_no2encoding(string->no_encoding);
|
|
|
|
|
if (encoding == NULL || string == NULL) {
|
|
|
|
|
return -1;
|
|
|
|
|
}
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
2002-05-08 12:33:44 +00:00
|
|
|
|
len = 0;
|
|
|
|
|
if (encoding->flag & MBFL_ENCTYPE_SBCS) {
|
|
|
|
|
return 0;
|
|
|
|
|
} else if (encoding->flag & (MBFL_ENCTYPE_WCS2BE | MBFL_ENCTYPE_WCS2LE)) {
|
|
|
|
|
return len % 2;
|
|
|
|
|
} else if (encoding->flag & (MBFL_ENCTYPE_WCS4BE | MBFL_ENCTYPE_WCS4LE)) {
|
|
|
|
|
return len % 4;
|
|
|
|
|
} else if (encoding->mblen_table != NULL) {
|
|
|
|
|
mbtab = encoding->mblen_table;
|
|
|
|
|
n = 0;
|
|
|
|
|
p = string->val;
|
|
|
|
|
k = string->len;
|
|
|
|
|
/* count */
|
|
|
|
|
if (p != NULL) {
|
|
|
|
|
while (n < k) {
|
|
|
|
|
m = mbtab[*p];
|
|
|
|
|
n += m;
|
|
|
|
|
p += m;
|
|
|
|
|
};
|
|
|
|
|
}
|
|
|
|
|
return n-k;
|
|
|
|
|
} else {
|
|
|
|
|
/* how can i do ? */
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
/* NOT REACHED */
|
|
|
|
|
}
|
|
|
|
|
#endif /* ZEND_MULTIBYTE */
|
|
|
|
|
|
|
|
|
|
|
2001-05-01 01:52:55 +00:00
|
|
|
|
/*
|
|
|
|
|
* strpos
|
|
|
|
|
*/
|
|
|
|
|
struct collector_strpos_data {
|
|
|
|
|
mbfl_convert_filter *next_filter;
|
|
|
|
|
mbfl_wchar_device needle;
|
|
|
|
|
int needle_len;
|
|
|
|
|
int start;
|
|
|
|
|
int output;
|
|
|
|
|
int found_pos;
|
|
|
|
|
int needle_pos;
|
|
|
|
|
int matched_pos;
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
collector_strpos(int c, void* data TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int *p, *h, *m, n;
|
|
|
|
|
struct collector_strpos_data *pc = (struct collector_strpos_data*)data;
|
|
|
|
|
|
|
|
|
|
if (pc->output >= pc->start) {
|
2002-04-30 12:45:14 +00:00
|
|
|
|
if (c == (int)pc->needle.buffer[pc->needle_pos]) {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (pc->needle_pos == 0) {
|
|
|
|
|
pc->found_pos = pc->output; /* found position */
|
|
|
|
|
}
|
|
|
|
|
pc->needle_pos++; /* needle pointer */
|
|
|
|
|
if (pc->needle_pos >= pc->needle_len) {
|
|
|
|
|
pc->matched_pos = pc->found_pos; /* matched position */
|
|
|
|
|
pc->needle_pos--;
|
|
|
|
|
goto retry;
|
|
|
|
|
}
|
|
|
|
|
} else if (pc->needle_pos != 0) {
|
|
|
|
|
retry:
|
2002-11-02 13:38:32 +00:00
|
|
|
|
h = (int *)pc->needle.buffer;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
h++;
|
|
|
|
|
for (;;) {
|
|
|
|
|
pc->found_pos++;
|
|
|
|
|
p = h;
|
|
|
|
|
m = pc->needle.buffer;
|
|
|
|
|
n = pc->needle_pos - 1;
|
|
|
|
|
while (n > 0 && *p == *m) {
|
|
|
|
|
n--;
|
|
|
|
|
p++;
|
|
|
|
|
m++;
|
|
|
|
|
}
|
|
|
|
|
if (n <= 0) {
|
|
|
|
|
if (*m != c) {
|
|
|
|
|
pc->needle_pos = 0;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
} else {
|
|
|
|
|
h++;
|
|
|
|
|
pc->needle_pos--;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
pc->output++;
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
|
|
|
|
mbfl_strpos(
|
|
|
|
|
mbfl_string *haystack,
|
|
|
|
|
mbfl_string *needle,
|
|
|
|
|
int offset,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
int reverse TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n, result;
|
|
|
|
|
unsigned char *p;
|
|
|
|
|
mbfl_convert_filter *filter;
|
|
|
|
|
struct collector_strpos_data pc;
|
|
|
|
|
|
|
|
|
|
if (haystack == NULL || needle == NULL) {
|
|
|
|
|
return -8;
|
|
|
|
|
}
|
|
|
|
|
/* needle is converted into wchar */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_wchar_device_init(&pc.needle TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
filter = mbfl_convert_filter_new(
|
|
|
|
|
needle->no_encoding,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_wchar_device_output, 0, &pc.needle TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (filter == NULL) {
|
|
|
|
|
return -4;
|
|
|
|
|
}
|
|
|
|
|
p = needle->val;
|
|
|
|
|
n = needle->len;
|
|
|
|
|
if (p != NULL) {
|
|
|
|
|
while (n > 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
if ((*filter->filter_function)(*p++, filter TSRMLS_CC) < 0) {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_flush(filter TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pc.needle_len = pc.needle.pos;
|
|
|
|
|
if (pc.needle.buffer == NULL) {
|
|
|
|
|
return -4;
|
|
|
|
|
}
|
|
|
|
|
if (pc.needle_len <= 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_wchar_device_clear(&pc.needle TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return -2;
|
|
|
|
|
}
|
|
|
|
|
/* initialize filter and collector data */
|
|
|
|
|
filter = mbfl_convert_filter_new(
|
|
|
|
|
haystack->no_encoding,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
collector_strpos, 0, &pc TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (filter == NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_wchar_device_clear(&pc.needle TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return -4;
|
|
|
|
|
}
|
|
|
|
|
pc.start = offset;
|
|
|
|
|
pc.output = 0;
|
|
|
|
|
pc.needle_pos = 0;
|
|
|
|
|
pc.found_pos = 0;
|
|
|
|
|
pc.matched_pos = -1;
|
|
|
|
|
|
|
|
|
|
/* feed data */
|
|
|
|
|
p = haystack->val;
|
|
|
|
|
n = haystack->len;
|
|
|
|
|
if (p != NULL) {
|
|
|
|
|
while (n > 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
if ((*filter->filter_function)(*p++, filter TSRMLS_CC) < 0) {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pc.matched_pos = -4;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
if (pc.matched_pos >= 0 && !reverse) {
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_flush(filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
result = pc.matched_pos;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_delete(filter TSRMLS_CC);
|
|
|
|
|
mbfl_wchar_device_clear(&pc.needle TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return result;
|
|
|
|
|
}
|
|
|
|
|
|
2002-11-09 17:05:47 +00:00
|
|
|
|
/*
|
|
|
|
|
* substr_count
|
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
int
|
|
|
|
|
mbfl_substr_count(
|
|
|
|
|
mbfl_string *haystack,
|
|
|
|
|
mbfl_string *needle
|
|
|
|
|
TSRMLS_DC)
|
|
|
|
|
{
|
|
|
|
|
int n, result = 0;
|
|
|
|
|
unsigned char *p;
|
|
|
|
|
mbfl_convert_filter *filter;
|
|
|
|
|
struct collector_strpos_data pc;
|
|
|
|
|
|
|
|
|
|
if (haystack == NULL || needle == NULL) {
|
|
|
|
|
return -8;
|
|
|
|
|
}
|
|
|
|
|
/* needle is converted into wchar */
|
|
|
|
|
mbfl_wchar_device_init(&pc.needle TSRMLS_CC);
|
|
|
|
|
filter = mbfl_convert_filter_new(
|
|
|
|
|
needle->no_encoding,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
mbfl_wchar_device_output, 0, &pc.needle TSRMLS_CC);
|
|
|
|
|
if (filter == NULL) {
|
|
|
|
|
return -4;
|
|
|
|
|
}
|
|
|
|
|
p = needle->val;
|
|
|
|
|
n = needle->len;
|
|
|
|
|
if (p != NULL) {
|
|
|
|
|
while (n > 0) {
|
|
|
|
|
if ((*filter->filter_function)(*p++, filter TSRMLS_CC) < 0) {
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
mbfl_convert_filter_flush(filter TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(filter TSRMLS_CC);
|
|
|
|
|
pc.needle_len = pc.needle.pos;
|
|
|
|
|
if (pc.needle.buffer == NULL) {
|
|
|
|
|
return -4;
|
|
|
|
|
}
|
|
|
|
|
if (pc.needle_len <= 0) {
|
|
|
|
|
mbfl_wchar_device_clear(&pc.needle TSRMLS_CC);
|
|
|
|
|
return -2;
|
|
|
|
|
}
|
|
|
|
|
/* initialize filter and collector data */
|
|
|
|
|
filter = mbfl_convert_filter_new(
|
|
|
|
|
haystack->no_encoding,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
collector_strpos, 0, &pc TSRMLS_CC);
|
|
|
|
|
if (filter == NULL) {
|
|
|
|
|
mbfl_wchar_device_clear(&pc.needle TSRMLS_CC);
|
|
|
|
|
return -4;
|
|
|
|
|
}
|
|
|
|
|
pc.start = 0;
|
|
|
|
|
pc.output = 0;
|
|
|
|
|
pc.needle_pos = 0;
|
|
|
|
|
pc.found_pos = 0;
|
|
|
|
|
pc.matched_pos = -1;
|
|
|
|
|
|
|
|
|
|
/* feed data */
|
|
|
|
|
p = haystack->val;
|
|
|
|
|
n = haystack->len;
|
|
|
|
|
if (p != NULL) {
|
|
|
|
|
while (n > 0) {
|
|
|
|
|
if ((*filter->filter_function)(*p++, filter TSRMLS_CC) < 0) {
|
|
|
|
|
pc.matched_pos = -4;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
if (pc.matched_pos >= 0) {
|
|
|
|
|
++result;
|
|
|
|
|
pc.matched_pos = -1;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
mbfl_convert_filter_flush(filter TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(filter TSRMLS_CC);
|
|
|
|
|
mbfl_wchar_device_clear(&pc.needle TSRMLS_CC);
|
|
|
|
|
|
|
|
|
|
return result;
|
|
|
|
|
}
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* substr
|
|
|
|
|
*/
|
|
|
|
|
struct collector_substr_data {
|
|
|
|
|
mbfl_convert_filter *next_filter;
|
|
|
|
|
int start;
|
|
|
|
|
int stop;
|
|
|
|
|
int output;
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
collector_substr(int c, void* data TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
struct collector_substr_data *pc = (struct collector_substr_data*)data;
|
|
|
|
|
|
|
|
|
|
if (pc->output >= pc->stop) {
|
|
|
|
|
return -1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (pc->output >= pc->start) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->next_filter->filter_function)(c, pc->next_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
pc->output++;
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
mbfl_string *
|
|
|
|
|
mbfl_substr(
|
|
|
|
|
mbfl_string *string,
|
|
|
|
|
mbfl_string *result,
|
|
|
|
|
int from,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
int length TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_encoding *encoding;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
int n, m, k, len, start, end;
|
|
|
|
|
unsigned char *p, *w;
|
|
|
|
|
const unsigned char *mbtab;
|
|
|
|
|
|
|
|
|
|
encoding = mbfl_no2encoding(string->no_encoding);
|
|
|
|
|
if (encoding == NULL || string == NULL || result == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
mbfl_string_init(result);
|
|
|
|
|
result->no_language = string->no_language;
|
|
|
|
|
result->no_encoding = string->no_encoding;
|
|
|
|
|
|
|
|
|
|
if ((encoding->flag & (MBFL_ENCTYPE_SBCS | MBFL_ENCTYPE_WCS2BE | MBFL_ENCTYPE_WCS2LE | MBFL_ENCTYPE_WCS4BE | MBFL_ENCTYPE_WCS4LE)) ||
|
|
|
|
|
encoding->mblen_table != NULL) {
|
|
|
|
|
len = string->len;
|
|
|
|
|
start = from;
|
|
|
|
|
end = from + length;
|
|
|
|
|
if (encoding->flag & (MBFL_ENCTYPE_WCS2BE | MBFL_ENCTYPE_MWC2LE)) {
|
|
|
|
|
start *= 2;
|
|
|
|
|
end = start + length*2;
|
|
|
|
|
} else if (encoding->flag & (MBFL_ENCTYPE_WCS4BE | MBFL_ENCTYPE_MWC4LE)) {
|
|
|
|
|
start *= 4;
|
|
|
|
|
end = start + length*4;
|
|
|
|
|
} else if (encoding->mblen_table != NULL) {
|
|
|
|
|
mbtab = encoding->mblen_table;
|
|
|
|
|
start = 0;
|
|
|
|
|
end = 0;
|
|
|
|
|
n = 0;
|
|
|
|
|
k = 0;
|
|
|
|
|
p = string->val;
|
|
|
|
|
if (p != NULL) {
|
|
|
|
|
/* search start position */
|
2001-05-10 13:12:03 +00:00
|
|
|
|
while (k <= from) {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
start = n;
|
2001-05-10 13:12:03 +00:00
|
|
|
|
if (n >= len) {
|
|
|
|
|
break;
|
|
|
|
|
}
|
2001-05-01 01:52:55 +00:00
|
|
|
|
m = mbtab[*p];
|
|
|
|
|
n += m;
|
|
|
|
|
p += m;
|
|
|
|
|
k++;
|
2001-05-10 13:12:03 +00:00
|
|
|
|
}
|
2001-05-01 01:52:55 +00:00
|
|
|
|
/* detect end position */
|
|
|
|
|
k = 0;
|
|
|
|
|
end = start;
|
2001-05-10 13:12:03 +00:00
|
|
|
|
while (k < length) {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
end = n;
|
2001-05-10 13:12:03 +00:00
|
|
|
|
if (n >= len) {
|
|
|
|
|
break;
|
|
|
|
|
}
|
2001-05-01 01:52:55 +00:00
|
|
|
|
m = mbtab[*p];
|
|
|
|
|
n += m;
|
|
|
|
|
p += m;
|
|
|
|
|
k++;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (start > len) {
|
|
|
|
|
start = len;
|
|
|
|
|
}
|
|
|
|
|
if (start < 0) {
|
|
|
|
|
start = 0;
|
|
|
|
|
}
|
|
|
|
|
if (end > len) {
|
|
|
|
|
end = len;
|
|
|
|
|
}
|
|
|
|
|
if (end < 0) {
|
|
|
|
|
end = 0;
|
|
|
|
|
}
|
|
|
|
|
if (start > end) {
|
|
|
|
|
start = end;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* allocate memory and copy */
|
|
|
|
|
n = end - start;
|
|
|
|
|
result->len = 0;
|
|
|
|
|
result->val = w = (unsigned char*)mbfl_malloc((n + 8)*sizeof(unsigned char));
|
|
|
|
|
if (w != NULL) {
|
2001-05-10 13:12:03 +00:00
|
|
|
|
p = string->val;
|
|
|
|
|
if (p != NULL) {
|
|
|
|
|
p += start;
|
|
|
|
|
result->len = n;
|
|
|
|
|
while (n > 0) {
|
|
|
|
|
*w++ = *p++;
|
|
|
|
|
n--;
|
|
|
|
|
}
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
*w++ = '\0';
|
|
|
|
|
*w++ = '\0';
|
|
|
|
|
*w++ = '\0';
|
|
|
|
|
*w = '\0';
|
|
|
|
|
} else {
|
|
|
|
|
result = NULL;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
mbfl_memory_device device;
|
|
|
|
|
struct collector_substr_data pc;
|
|
|
|
|
mbfl_convert_filter *decoder;
|
|
|
|
|
mbfl_convert_filter *encoder;
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_init(&device, length + 1, 0 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_string_init(result);
|
|
|
|
|
result->no_language = string->no_language;
|
|
|
|
|
result->no_encoding = string->no_encoding;
|
|
|
|
|
/* output code filter */
|
|
|
|
|
decoder = mbfl_convert_filter_new(
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
string->no_encoding,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output, 0, &device TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
/* wchar filter */
|
|
|
|
|
encoder = mbfl_convert_filter_new(
|
|
|
|
|
string->no_encoding,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
collector_substr, 0, &pc TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (decoder == NULL || encoder == NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_delete(encoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
pc.next_filter = decoder;
|
|
|
|
|
pc.start = from;
|
|
|
|
|
pc.stop = from + length;
|
|
|
|
|
pc.output = 0;
|
|
|
|
|
|
|
|
|
|
/* feed data */
|
|
|
|
|
p = string->val;
|
|
|
|
|
n = string->len;
|
|
|
|
|
if (p != NULL) {
|
|
|
|
|
while (n > 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
if ((*encoder->filter_function)(*p++, encoder TSRMLS_CC) < 0) {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_flush(encoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_flush(decoder TSRMLS_CC);
|
|
|
|
|
result = mbfl_memory_device_result(&device, result TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(encoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return result;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* strcut
|
|
|
|
|
*/
|
|
|
|
|
mbfl_string *
|
|
|
|
|
mbfl_strcut(
|
|
|
|
|
mbfl_string *string,
|
|
|
|
|
mbfl_string *result,
|
|
|
|
|
int from,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
int length TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_encoding *encoding;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
int n, m, k, len, start, end;
|
|
|
|
|
unsigned char *p, *w;
|
|
|
|
|
const unsigned char *mbtab;
|
|
|
|
|
mbfl_memory_device device;
|
|
|
|
|
mbfl_convert_filter *encoder, *encoder_tmp, *decoder, *decoder_tmp;
|
|
|
|
|
|
|
|
|
|
encoding = mbfl_no2encoding(string->no_encoding);
|
|
|
|
|
if (encoding == NULL || string == NULL || result == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
mbfl_string_init(result);
|
|
|
|
|
result->no_language = string->no_language;
|
|
|
|
|
result->no_encoding = string->no_encoding;
|
|
|
|
|
|
|
|
|
|
if ((encoding->flag & (MBFL_ENCTYPE_SBCS | MBFL_ENCTYPE_WCS2BE | MBFL_ENCTYPE_WCS2LE | MBFL_ENCTYPE_WCS4BE | MBFL_ENCTYPE_WCS4LE)) ||
|
|
|
|
|
encoding->mblen_table != NULL) {
|
|
|
|
|
len = string->len;
|
|
|
|
|
start = from;
|
|
|
|
|
end = from + length;
|
|
|
|
|
if (encoding->flag & (MBFL_ENCTYPE_WCS2BE | MBFL_ENCTYPE_WCS2LE)) {
|
|
|
|
|
start /= 2;
|
|
|
|
|
start *= 2;
|
|
|
|
|
end = length/2;
|
|
|
|
|
end *= 2;
|
|
|
|
|
end += start;
|
|
|
|
|
} else if (encoding->flag & (MBFL_ENCTYPE_WCS4BE | MBFL_ENCTYPE_WCS4LE)) {
|
|
|
|
|
start /= 4;
|
|
|
|
|
start *= 4;
|
|
|
|
|
end = length/4;
|
|
|
|
|
end *= 4;
|
|
|
|
|
end += start;
|
|
|
|
|
} else if (encoding->mblen_table != NULL) {
|
|
|
|
|
mbtab = encoding->mblen_table;
|
|
|
|
|
start = 0;
|
|
|
|
|
end = 0;
|
|
|
|
|
n = 0;
|
|
|
|
|
p = string->val;
|
|
|
|
|
if (p != NULL) {
|
|
|
|
|
/* search start position */
|
|
|
|
|
for (;;) {
|
|
|
|
|
m = mbtab[*p];
|
|
|
|
|
n += m;
|
|
|
|
|
p += m;
|
|
|
|
|
if (n > from) {
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
start = n;
|
|
|
|
|
}
|
|
|
|
|
/* search end position */
|
|
|
|
|
k = start + length;
|
2002-04-30 12:45:14 +00:00
|
|
|
|
if (k >= (int)string->len) {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
end = string->len;
|
|
|
|
|
} else {
|
|
|
|
|
end = start;
|
|
|
|
|
while (n <= k) {
|
|
|
|
|
end = n;
|
|
|
|
|
m = mbtab[*p];
|
|
|
|
|
n += m;
|
|
|
|
|
p += m;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (start > len) {
|
|
|
|
|
start = len;
|
|
|
|
|
}
|
|
|
|
|
if (start < 0) {
|
|
|
|
|
start = 0;
|
|
|
|
|
}
|
|
|
|
|
if (end > len) {
|
|
|
|
|
end = len;
|
|
|
|
|
}
|
|
|
|
|
if (end < 0) {
|
|
|
|
|
end = 0;
|
|
|
|
|
}
|
|
|
|
|
if (start > end) {
|
|
|
|
|
start = end;
|
|
|
|
|
}
|
|
|
|
|
/* allocate memory and copy string */
|
|
|
|
|
n = end - start;
|
|
|
|
|
result->len = 0;
|
|
|
|
|
result->val = w = (unsigned char*)mbfl_malloc((n + 8)*sizeof(unsigned char));
|
|
|
|
|
if (w != NULL) {
|
|
|
|
|
result->len = n;
|
|
|
|
|
p = &(string->val[start]);
|
|
|
|
|
while (n > 0) {
|
|
|
|
|
*w++ = *p++;
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
*w++ = '\0';
|
|
|
|
|
*w++ = '\0';
|
|
|
|
|
*w++ = '\0';
|
|
|
|
|
*w = '\0';
|
|
|
|
|
} else {
|
|
|
|
|
result = NULL;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
/* wchar filter */
|
|
|
|
|
encoder = mbfl_convert_filter_new(
|
|
|
|
|
string->no_encoding,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filter_output_null, 0, 0 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
encoder_tmp = mbfl_convert_filter_new(
|
|
|
|
|
string->no_encoding,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_filter_output_null, 0, 0 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
/* output code filter */
|
|
|
|
|
decoder = mbfl_convert_filter_new(
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
string->no_encoding,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output, 0, &device TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
decoder_tmp = mbfl_convert_filter_new(
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
string->no_encoding,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output, 0, &device TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (encoder == NULL || encoder_tmp == NULL || decoder == NULL || decoder_tmp == NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_delete(encoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(encoder_tmp TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(decoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(decoder_tmp TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return NULL;
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_init(&device, length + 8, 0 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
k = 0;
|
|
|
|
|
n = 0;
|
|
|
|
|
p = string->val;
|
|
|
|
|
if (p != NULL) {
|
|
|
|
|
/* seartch start position */
|
|
|
|
|
while (n < from) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*encoder->filter_function)(*p++, encoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
n++;
|
|
|
|
|
}
|
|
|
|
|
/* output a little shorter than "length" */
|
|
|
|
|
encoder->output_function = mbfl_filter_output_pipe;
|
|
|
|
|
encoder->data = decoder;
|
|
|
|
|
k = length - 20;
|
|
|
|
|
len = string->len;
|
|
|
|
|
while (n < len && device.pos < k) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*encoder->filter_function)(*p++, encoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
n++;
|
|
|
|
|
}
|
|
|
|
|
/* detect end position */
|
|
|
|
|
for (;;) {
|
|
|
|
|
/* backup current state */
|
|
|
|
|
k = device.pos;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_copy(encoder, encoder_tmp TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_copy(decoder, decoder_tmp TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (n >= len) {
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
/* feed 1byte and flush */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*encoder->filter_function)(*p, encoder TSRMLS_CC);
|
|
|
|
|
(*encoder->filter_flush)(encoder TSRMLS_CC);
|
|
|
|
|
(*decoder->filter_flush)(decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (device.pos > length) {
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
/* restore filter and re-feed data */
|
|
|
|
|
device.pos = k;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_copy(encoder_tmp, encoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_copy(decoder_tmp, decoder TSRMLS_CC);
|
|
|
|
|
(*encoder->filter_function)(*p, encoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
p++;
|
|
|
|
|
n++;
|
|
|
|
|
}
|
|
|
|
|
device.pos = k;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_copy(encoder_tmp, encoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_copy(decoder_tmp, decoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_flush(encoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_flush(decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
result = mbfl_memory_device_result(&device, result TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(encoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(encoder_tmp TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(decoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(decoder_tmp TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return result;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* strwidth
|
|
|
|
|
*/
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
filter_count_width(int c, void* data TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (c >= 0x20) {
|
|
|
|
|
if (c < 0x2000 || (c > 0xff60 && c < 0xffa0)) {
|
|
|
|
|
(*(int *)data)++;
|
|
|
|
|
} else {
|
|
|
|
|
(*(int *)data) += 2;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_strwidth(mbfl_string *string TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int len, n;
|
|
|
|
|
unsigned char *p;
|
|
|
|
|
mbfl_convert_filter *filter;
|
|
|
|
|
|
|
|
|
|
len = 0;
|
|
|
|
|
if (string->len > 0 && string->val != NULL) {
|
|
|
|
|
/* wchar filter */
|
|
|
|
|
filter = mbfl_convert_filter_new(
|
|
|
|
|
string->no_encoding,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
filter_count_width, 0, &len TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (filter == NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_delete(filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return -1;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* feed data */
|
|
|
|
|
p = string->val;
|
|
|
|
|
n = string->len;
|
|
|
|
|
while (n > 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*filter->filter_function)(*p++, filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_flush(filter TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return len;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* strimwidth
|
|
|
|
|
*/
|
|
|
|
|
struct collector_strimwidth_data {
|
|
|
|
|
mbfl_convert_filter *decoder;
|
|
|
|
|
mbfl_convert_filter *decoder_backup;
|
|
|
|
|
mbfl_memory_device device;
|
|
|
|
|
int from;
|
|
|
|
|
int width;
|
|
|
|
|
int outwidth;
|
|
|
|
|
int outchar;
|
|
|
|
|
int status;
|
|
|
|
|
int endpos;
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
collector_strimwidth(int c, void* data TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
struct collector_strimwidth_data *pc = (struct collector_strimwidth_data*)data;
|
|
|
|
|
|
|
|
|
|
switch (pc->status) {
|
|
|
|
|
case 10:
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->decoder->filter_function)(c, pc->decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
default:
|
|
|
|
|
if (pc->outchar >= pc->from) {
|
|
|
|
|
if (c >= 0x20) {
|
|
|
|
|
if (c < 0x2000 || (c > 0xff60 && c < 0xffa0)) {
|
|
|
|
|
pc->outwidth++;
|
|
|
|
|
} else {
|
|
|
|
|
pc->outwidth += 2;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
if (pc->outwidth > pc->width) {
|
|
|
|
|
if (pc->status == 0) {
|
|
|
|
|
pc->endpos = pc->device.pos;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_copy(pc->decoder, pc->decoder_backup TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
pc->status++;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->decoder->filter_function)(c, pc->decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
c = -1;
|
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->decoder->filter_function)(c, pc->decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
pc->outchar++;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
mbfl_string *
|
|
|
|
|
mbfl_strimwidth(
|
|
|
|
|
mbfl_string *string,
|
|
|
|
|
mbfl_string *marker,
|
|
|
|
|
mbfl_string *result,
|
|
|
|
|
int from,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
int width TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
struct collector_strimwidth_data pc;
|
|
|
|
|
mbfl_convert_filter *encoder;
|
|
|
|
|
int n, mkwidth;
|
|
|
|
|
unsigned char *p;
|
|
|
|
|
|
|
|
|
|
if (string == NULL || result == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
mbfl_string_init(result);
|
|
|
|
|
result->no_language = string->no_language;
|
|
|
|
|
result->no_encoding = string->no_encoding;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_init(&pc.device, width, 0 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
/* output code filter */
|
|
|
|
|
pc.decoder = mbfl_convert_filter_new(
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
string->no_encoding,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output, 0, &pc.device TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pc.decoder_backup = mbfl_convert_filter_new(
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
string->no_encoding,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output, 0, &pc.device TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
/* wchar filter */
|
|
|
|
|
encoder = mbfl_convert_filter_new(
|
|
|
|
|
string->no_encoding,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
collector_strimwidth, 0, &pc TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (pc.decoder == NULL || pc.decoder_backup == NULL || encoder == NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_delete(encoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(pc.decoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(pc.decoder_backup TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
mkwidth = 0;
|
|
|
|
|
if (marker) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mkwidth = mbfl_strwidth(marker TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
pc.from = from;
|
|
|
|
|
pc.width = width - mkwidth;
|
|
|
|
|
pc.outwidth = 0;
|
|
|
|
|
pc.outchar = 0;
|
|
|
|
|
pc.status = 0;
|
|
|
|
|
pc.endpos = 0;
|
|
|
|
|
|
|
|
|
|
/* feed data */
|
|
|
|
|
p = string->val;
|
|
|
|
|
n = string->len;
|
|
|
|
|
if (p != NULL) {
|
|
|
|
|
while (n > 0) {
|
2001-08-29 11:29:52 +00:00
|
|
|
|
n--;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
if ((*encoder->filter_function)(*p++, encoder TSRMLS_CC) < 0) {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_flush(encoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (pc.status != 0 && mkwidth > 0) {
|
|
|
|
|
pc.width += mkwidth;
|
|
|
|
|
while (n > 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
if ((*encoder->filter_function)(*p++, encoder TSRMLS_CC) < 0) {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_flush(encoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (pc.status != 1) {
|
|
|
|
|
pc.status = 10;
|
|
|
|
|
pc.device.pos = pc.endpos;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_copy(pc.decoder_backup, pc.decoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_reset(encoder, marker->no_encoding, mbfl_no_encoding_wchar TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
p = marker->val;
|
|
|
|
|
n = marker->len;
|
|
|
|
|
while (n > 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
if ((*encoder->filter_function)(*p++, encoder TSRMLS_CC) < 0) {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_flush(encoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
2001-06-05 14:25:23 +00:00
|
|
|
|
} else if (pc.status != 0) {
|
|
|
|
|
pc.device.pos = pc.endpos;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_copy(pc.decoder_backup, pc.decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_flush(pc.decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
result = mbfl_memory_device_result(&pc.device, result TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(encoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(pc.decoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(pc.decoder_backup TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return result;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* convert Hankaku and Zenkaku
|
|
|
|
|
*/
|
|
|
|
|
struct collector_hantozen_data {
|
|
|
|
|
mbfl_convert_filter *next_filter;
|
|
|
|
|
int mode;
|
|
|
|
|
int status;
|
|
|
|
|
int cache;
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static const unsigned char hankana2zenkata_table[64] = {
|
|
|
|
|
0x00,0x02,0x0C,0x0D,0x01,0xFB,0xF2,0xA1,0xA3,0xA5,
|
|
|
|
|
0xA7,0xA9,0xE3,0xE5,0xE7,0xC3,0xFC,0xA2,0xA4,0xA6,
|
|
|
|
|
0xA8,0xAA,0xAB,0xAD,0xAF,0xB1,0xB3,0xB5,0xB7,0xB9,
|
|
|
|
|
0xBB,0xBD,0xBF,0xC1,0xC4,0xC6,0xC8,0xCA,0xCB,0xCC,
|
|
|
|
|
0xCD,0xCE,0xCF,0xD2,0xD5,0xD8,0xDB,0xDE,0xDF,0xE0,
|
|
|
|
|
0xE1,0xE2,0xE4,0xE6,0xE8,0xE9,0xEA,0xEB,0xEC,0xED,
|
|
|
|
|
0xEF,0xF3,0x9B,0x9C
|
|
|
|
|
};
|
|
|
|
|
static const unsigned char hankana2zenhira_table[64] = {
|
|
|
|
|
0x00,0x02,0x0C,0x0D,0x01,0xFB,0x92,0x41,0x43,0x45,
|
|
|
|
|
0x47,0x49,0x83,0x85,0x87,0x63,0xFC,0x42,0x44,0x46,
|
|
|
|
|
0x48,0x4A,0x4B,0x4D,0x4F,0x51,0x53,0x55,0x57,0x59,
|
|
|
|
|
0x5B,0x5D,0x5F,0x61,0x64,0x66,0x68,0x6A,0x6B,0x6C,
|
|
|
|
|
0x6D,0x6E,0x6F,0x72,0x75,0x78,0x7B,0x7E,0x7F,0x80,
|
|
|
|
|
0x81,0x82,0x84,0x86,0x88,0x89,0x8A,0x8B,0x8C,0x8D,
|
|
|
|
|
0x8F,0x93,0x9B,0x9C
|
|
|
|
|
};
|
|
|
|
|
static const unsigned char zenkana2hankana_table[84][2] = {
|
|
|
|
|
{0x67,0x00},{0x71,0x00},{0x68,0x00},{0x72,0x00},{0x69,0x00},
|
|
|
|
|
{0x73,0x00},{0x6A,0x00},{0x74,0x00},{0x6B,0x00},{0x75,0x00},
|
|
|
|
|
{0x76,0x00},{0x76,0x9E},{0x77,0x00},{0x77,0x9E},{0x78,0x00},
|
|
|
|
|
{0x78,0x9E},{0x79,0x00},{0x79,0x9E},{0x7A,0x00},{0x7A,0x9E},
|
|
|
|
|
{0x7B,0x00},{0x7B,0x9E},{0x7C,0x00},{0x7C,0x9E},{0x7D,0x00},
|
|
|
|
|
{0x7D,0x9E},{0x7E,0x00},{0x7E,0x9E},{0x7F,0x00},{0x7F,0x9E},
|
|
|
|
|
{0x80,0x00},{0x80,0x9E},{0x81,0x00},{0x81,0x9E},{0x6F,0x00},
|
|
|
|
|
{0x82,0x00},{0x82,0x9E},{0x83,0x00},{0x83,0x9E},{0x84,0x00},
|
|
|
|
|
{0x84,0x9E},{0x85,0x00},{0x86,0x00},{0x87,0x00},{0x88,0x00},
|
|
|
|
|
{0x89,0x00},{0x8A,0x00},{0x8A,0x9E},{0x8A,0x9F},{0x8B,0x00},
|
|
|
|
|
{0x8B,0x9E},{0x8B,0x9F},{0x8C,0x00},{0x8C,0x9E},{0x8C,0x9F},
|
|
|
|
|
{0x8D,0x00},{0x8D,0x9E},{0x8D,0x9F},{0x8E,0x00},{0x8E,0x9E},
|
|
|
|
|
{0x8E,0x9F},{0x8F,0x00},{0x90,0x00},{0x91,0x00},{0x92,0x00},
|
|
|
|
|
{0x93,0x00},{0x6C,0x00},{0x94,0x00},{0x6D,0x00},{0x95,0x00},
|
|
|
|
|
{0x6E,0x00},{0x96,0x00},{0x97,0x00},{0x98,0x00},{0x99,0x00},
|
|
|
|
|
{0x9A,0x00},{0x9B,0x00},{0x9C,0x00},{0x9C,0x00},{0x72,0x00},
|
|
|
|
|
{0x74,0x00},{0x66,0x00},{0x9D,0x00},{0x73,0x9E}
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
collector_hantozen(int c, void* data TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int s, mode, n;
|
|
|
|
|
struct collector_hantozen_data *pc = (struct collector_hantozen_data*)data;
|
|
|
|
|
|
|
|
|
|
s = c;
|
|
|
|
|
mode = pc->mode;
|
|
|
|
|
|
|
|
|
|
if (mode & 0xf) { /* hankaku to zenkaku */
|
|
|
|
|
if ((mode & 0x1) && c >= 0x21 && c <= 0x7d && c != 0x22 && c != 0x27 && c != 0x5c) { /* all except <"> <'> <\> <~> */
|
|
|
|
|
s = c + 0xfee0;
|
|
|
|
|
} else if ((mode & 0x2) && ((c >= 0x41 && c <= 0x5a) || (c >= 0x61 && c <= 0x7a))) { /* alpha */
|
|
|
|
|
s = c + 0xfee0;
|
|
|
|
|
} else if ((mode & 0x4) && c >= 0x30 && c <= 0x39) { /* num */
|
|
|
|
|
s = c + 0xfee0;
|
|
|
|
|
} else if ((mode & 0x8) && c == 0x20) { /* spase */
|
|
|
|
|
s = 0x3000;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (mode & 0xf0) { /* zenkaku to hankaku */
|
|
|
|
|
if ((mode & 0x10) && c >= 0xff01 && c <= 0xff5d && c != 0xff02 && c != 0xff07 && c!= 0xff3c) { /* all except <"> <'> <\> <~> */
|
|
|
|
|
s = c - 0xfee0;
|
|
|
|
|
} else if ((mode & 0x20) && ((c >= 0xff21 && c <= 0xff3a) || (c >= 0xff41 && c <= 0xff5a))) { /* alpha */
|
|
|
|
|
s = c - 0xfee0;
|
|
|
|
|
} else if ((mode & 0x40) && (c >= 0xff10 && c <= 0xff19)) { /* num */
|
|
|
|
|
s = c - 0xfee0;
|
|
|
|
|
} else if ((mode & 0x80) && (c == 0x3000)) { /* spase */
|
|
|
|
|
s = 0x20;
|
|
|
|
|
} else if ((mode & 0x10) && (c == 0x2212)) { /* MINUS SIGN */
|
|
|
|
|
s = 0x2d;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (mode & 0x300) { /* hankaku kana to zenkaku kana */
|
|
|
|
|
if ((mode & 0x100) && (mode & 0x800)) { /* hankaku kana to zenkaku katakana and glue voiced sound mark */
|
|
|
|
|
if (c >= 0xff61 && c <= 0xff9f) {
|
|
|
|
|
if (pc->status) {
|
|
|
|
|
n = (pc->cache - 0xff60) & 0x3f;
|
|
|
|
|
if (c == 0xff9e && ((n >= 22 && n <= 36) || (n >= 42 && n <= 46))) {
|
|
|
|
|
pc->status = 0;
|
|
|
|
|
s = 0x3001 + hankana2zenkata_table[n];
|
|
|
|
|
} else if (c == 0xff9e && n == 19) {
|
|
|
|
|
pc->status = 0;
|
|
|
|
|
s = 0x30f4;
|
|
|
|
|
} else if (c == 0xff9f && (n >= 42 && n <= 46)) {
|
|
|
|
|
pc->status = 0;
|
|
|
|
|
s = 0x3002 + hankana2zenkata_table[n];
|
|
|
|
|
} else {
|
|
|
|
|
pc->status = 1;
|
|
|
|
|
pc->cache = c;
|
|
|
|
|
s = 0x3000 + hankana2zenkata_table[n];
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
pc->status = 1;
|
|
|
|
|
pc->cache = c;
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
if (pc->status) {
|
|
|
|
|
n = (pc->cache - 0xff60) & 0x3f;
|
|
|
|
|
pc->status = 0;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->next_filter->filter_function)(0x3000 + hankana2zenkata_table[n], pc->next_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
} else if ((mode & 0x200) && (mode & 0x800)) { /* hankaku kana to zenkaku hirangana and glue voiced sound mark */
|
|
|
|
|
if (c >= 0xff61 && c <= 0xff9f) {
|
|
|
|
|
if (pc->status) {
|
|
|
|
|
n = (pc->cache - 0xff60) & 0x3f;
|
|
|
|
|
if (c == 0xff9e && ((n >= 22 && n <= 36) || (n >= 42 && n <= 46))) {
|
|
|
|
|
pc->status = 0;
|
|
|
|
|
s = 0x3001 + hankana2zenhira_table[n];
|
|
|
|
|
} else if (c == 0xff9f && (n >= 42 && n <= 46)) {
|
|
|
|
|
pc->status = 0;
|
|
|
|
|
s = 0x3002 + hankana2zenhira_table[n];
|
|
|
|
|
} else {
|
|
|
|
|
pc->status = 1;
|
|
|
|
|
pc->cache = c;
|
|
|
|
|
s = 0x3000 + hankana2zenhira_table[n];
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
pc->status = 1;
|
|
|
|
|
pc->cache = c;
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
if (pc->status) {
|
|
|
|
|
n = (pc->cache - 0xff60) & 0x3f;
|
|
|
|
|
pc->status = 0;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->next_filter->filter_function)(0x3000 + hankana2zenhira_table[n], pc->next_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
} else if ((mode & 0x100) && c >= 0xff61 && c <= 0xff9f) { /* hankaku kana to zenkaku katakana */
|
|
|
|
|
s = 0x3000 + hankana2zenkata_table[c - 0xff60];
|
|
|
|
|
} else if ((mode & 0x200) && c >= 0xff61 && c <= 0xff9f) { /* hankaku kana to zenkaku hirangana */
|
|
|
|
|
s = 0x3000 + hankana2zenhira_table[c - 0xff60];
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (mode & 0x3000) { /* Zenkaku kana to hankaku kana */
|
|
|
|
|
if ((mode & 0x1000) && c >= 0x30a1 && c <= 0x30f4) { /* Zenkaku katakana to hankaku kana */
|
|
|
|
|
n = c - 0x30a1;
|
|
|
|
|
if (zenkana2hankana_table[n][1] != 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->next_filter->filter_function)(0xff00 + zenkana2hankana_table[n][0], pc->next_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
s = 0xff00 + zenkana2hankana_table[n][1];
|
|
|
|
|
} else {
|
|
|
|
|
s = 0xff00 + zenkana2hankana_table[n][0];
|
|
|
|
|
}
|
|
|
|
|
} else if ((mode & 0x2000) && c >= 0x3041 && c <= 0x3093) { /* Zenkaku hirangana to hankaku kana */
|
|
|
|
|
n = c - 0x3041;
|
|
|
|
|
if (zenkana2hankana_table[n][1] != 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->next_filter->filter_function)(0xff00 + zenkana2hankana_table[n][0], pc->next_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
s = 0xff00 + zenkana2hankana_table[n][1];
|
|
|
|
|
} else {
|
|
|
|
|
s = 0xff00 + zenkana2hankana_table[n][0];
|
|
|
|
|
}
|
|
|
|
|
} else if (c == 0x3001) {
|
|
|
|
|
s = 0xff64; /* HALFWIDTH IDEOGRAPHIC COMMA */
|
|
|
|
|
} else if (c == 0x3002) {
|
|
|
|
|
s = 0xff61; /* HALFWIDTH IDEOGRAPHIC FULL STOP */
|
|
|
|
|
} else if (c == 0x300c) {
|
|
|
|
|
s = 0xff62; /* HALFWIDTH LEFT CORNER BRACKET */
|
|
|
|
|
} else if (c == 0x300d) {
|
|
|
|
|
s = 0xff63; /* HALFWIDTH RIGHT CORNER BRACKET */
|
|
|
|
|
} else if (c == 0x309b) {
|
|
|
|
|
s = 0xff9e; /* HALFWIDTH KATAKANA VOICED SOUND MARK */
|
|
|
|
|
} else if (c == 0x309c) {
|
|
|
|
|
s = 0xff9f; /* HALFWIDTH KATAKANA SEMI-VOICED SOUND MARK */
|
|
|
|
|
} else if (c == 0x30fc) {
|
|
|
|
|
s = 0xff70; /* HALFWIDTH KATAKANA-HIRAGANA PROLONGED SOUND MARK */
|
|
|
|
|
} else if (c == 0x30fb) {
|
|
|
|
|
s = 0xff65; /* HALFWIDTH KATAKANA MIDDLE DOT */
|
|
|
|
|
}
|
|
|
|
|
} else if (mode & 0x30000) {
|
|
|
|
|
if ((mode & 0x10000) && c >= 0x3041 && c <= 0x3093) { /* Zenkaku hirangana to Zenkaku katakana */
|
|
|
|
|
s = c + 0x60;
|
|
|
|
|
} else if ((mode & 0x20000) && c >= 0x30a1 && c <= 0x30f3) { /* Zenkaku katakana to Zenkaku hirangana */
|
|
|
|
|
s = c - 0x60;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (mode & 0x100000) { /* special ascii to symbol */
|
|
|
|
|
if (c == 0x5c) {
|
|
|
|
|
s = 0xffe5; /* FULLWIDTH YEN SIGN */
|
|
|
|
|
} else if (c == 0xa5) { /* YEN SIGN */
|
|
|
|
|
s = 0xffe5; /* FULLWIDTH YEN SIGN */
|
|
|
|
|
} else if (c == 0x7e) {
|
|
|
|
|
s = 0xffe3; /* FULLWIDTH MACRON */
|
|
|
|
|
} else if (c == 0x203e) { /* OVERLINE */
|
|
|
|
|
s = 0xffe3; /* FULLWIDTH MACRON */
|
|
|
|
|
} else if (c == 0x27) {
|
|
|
|
|
s = 0x2019; /* RIGHT SINGLE QUOTATION MARK */
|
|
|
|
|
} else if (c == 0x22) {
|
|
|
|
|
s = 0x201d; /* RIGHT DOUBLE QUOTATION MARK */
|
|
|
|
|
}
|
|
|
|
|
} else if (mode & 0x200000) { /* special symbol to ascii */
|
|
|
|
|
if (c == 0xffe5) { /* FULLWIDTH YEN SIGN */
|
|
|
|
|
s = 0x5c;
|
|
|
|
|
} else if (c == 0xff3c) { /* FULLWIDTH REVERSE SOLIDUS */
|
|
|
|
|
s = 0x5c;
|
|
|
|
|
} else if (c == 0xffe3) { /* FULLWIDTH MACRON */
|
|
|
|
|
s = 0x7e;
|
|
|
|
|
} else if (c == 0x203e) { /* OVERLINE */
|
|
|
|
|
s = 0x7e;
|
|
|
|
|
} else if (c == 0x2018) { /* LEFT SINGLE QUOTATION MARK*/
|
|
|
|
|
s = 0x27;
|
|
|
|
|
} else if (c == 0x2019) { /* RIGHT SINGLE QUOTATION MARK */
|
|
|
|
|
s = 0x27;
|
|
|
|
|
} else if (c == 0x201c) { /* LEFT DOUBLE QUOTATION MARK */
|
|
|
|
|
s = 0x22;
|
|
|
|
|
} else if (c == 0x201d) { /* RIGHT DOUBLE QUOTATION MARK */
|
|
|
|
|
s = 0x22;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (mode & 0x400000) { /* special ascii to symbol */
|
|
|
|
|
if (c == 0x5c) {
|
|
|
|
|
s = 0xff3c; /* FULLWIDTH REVERSE SOLIDUS */
|
|
|
|
|
} else if (c == 0x7e) {
|
|
|
|
|
s = 0xff5e; /* FULLWIDTH TILDE */
|
|
|
|
|
} else if (c == 0x27) {
|
|
|
|
|
s = 0xff07; /* FULLWIDTH APOSTROPHE */
|
|
|
|
|
} else if (c == 0x22) {
|
|
|
|
|
s = 0xff02; /* FULLWIDTH QUOTATION MARK */
|
|
|
|
|
}
|
|
|
|
|
} else if (mode & 0x800000) { /* special symbol to ascii */
|
|
|
|
|
if (c == 0xff3c) { /* FULLWIDTH REVERSE SOLIDUS */
|
|
|
|
|
s = 0x5c;
|
|
|
|
|
} else if (c == 0xff5e) { /* FULLWIDTH TILDE */
|
|
|
|
|
s = 0x7e;
|
|
|
|
|
} else if (c == 0xff07) { /* FULLWIDTH APOSTROPHE */
|
|
|
|
|
s = 0x27;
|
|
|
|
|
} else if (c == 0xff02) { /* FULLWIDTH QUOTATION MARK */
|
|
|
|
|
s = 0x22;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
return (*pc->next_filter->filter_function)(s, pc->next_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
collector_hantozen_flush(struct collector_hantozen_data *pc TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int ret, n;
|
|
|
|
|
|
|
|
|
|
ret = 0;
|
|
|
|
|
if (pc->status) {
|
|
|
|
|
n = (pc->cache - 0xff60) & 0x3f;
|
|
|
|
|
if (pc->mode & 0x100) { /* hankaku kana to zenkaku katakana */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
ret = (*pc->next_filter->filter_function)(0x3000 + hankana2zenkata_table[n], pc->next_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else if (pc->mode & 0x200) { /* hankaku kana to zenkaku hirangana */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
ret = (*pc->next_filter->filter_function)(0x3000 + hankana2zenhira_table[n], pc->next_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
pc->status = 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return ret;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
mbfl_string *
|
|
|
|
|
mbfl_ja_jp_hantozen(
|
|
|
|
|
mbfl_string *string,
|
|
|
|
|
mbfl_string *result,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
int mode TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
unsigned char *p;
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_encoding *encoding;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_memory_device device;
|
|
|
|
|
struct collector_hantozen_data pc;
|
|
|
|
|
mbfl_convert_filter *decoder;
|
|
|
|
|
mbfl_convert_filter *encoder;
|
|
|
|
|
|
|
|
|
|
/* initialize */
|
|
|
|
|
if (string == NULL || result == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
encoding = mbfl_no2encoding(string->no_encoding);
|
|
|
|
|
if (encoding == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_init(&device, string->len, 0 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_string_init(result);
|
|
|
|
|
result->no_language = string->no_language;
|
|
|
|
|
result->no_encoding = string->no_encoding;
|
|
|
|
|
decoder = mbfl_convert_filter_new(
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
string->no_encoding,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output, 0, &device TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
encoder = mbfl_convert_filter_new(
|
|
|
|
|
string->no_encoding,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
collector_hantozen, 0, &pc TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (decoder == NULL || encoder == NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_delete(encoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
pc.next_filter = decoder;
|
|
|
|
|
pc.mode = mode;
|
|
|
|
|
pc.status = 0;
|
|
|
|
|
pc.cache = 0;
|
|
|
|
|
|
|
|
|
|
/* feed data */
|
|
|
|
|
p = string->val;
|
|
|
|
|
n = string->len;
|
|
|
|
|
if (p != NULL) {
|
|
|
|
|
while (n > 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
if ((*encoder->filter_function)(*p++, encoder TSRMLS_CC) < 0) {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_flush(encoder TSRMLS_CC);
|
|
|
|
|
collector_hantozen_flush(&pc TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_flush(decoder TSRMLS_CC);
|
|
|
|
|
result = mbfl_memory_device_result(&device, result TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(encoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return result;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* MIME header encode
|
|
|
|
|
*/
|
|
|
|
|
struct mime_header_encoder_data {
|
|
|
|
|
mbfl_convert_filter *conv1_filter;
|
|
|
|
|
mbfl_convert_filter *block_filter;
|
|
|
|
|
mbfl_convert_filter *conv2_filter;
|
|
|
|
|
mbfl_convert_filter *conv2_filter_backup;
|
|
|
|
|
mbfl_convert_filter *encod_filter;
|
|
|
|
|
mbfl_convert_filter *encod_filter_backup;
|
|
|
|
|
mbfl_memory_device outdev;
|
|
|
|
|
mbfl_memory_device tmpdev;
|
|
|
|
|
int status1;
|
|
|
|
|
int status2;
|
|
|
|
|
int prevpos;
|
|
|
|
|
int linehead;
|
|
|
|
|
int firstindent;
|
|
|
|
|
int encnamelen;
|
|
|
|
|
int lwsplen;
|
|
|
|
|
char encname[128];
|
|
|
|
|
char lwsp[16];
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mime_header_encoder_block_collector(int c, void *data TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
struct mime_header_encoder_data *pe = (struct mime_header_encoder_data *)data;
|
|
|
|
|
|
|
|
|
|
switch (pe->status2) {
|
|
|
|
|
case 1: /* encoded word */
|
|
|
|
|
pe->prevpos = pe->outdev.pos;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_copy(pe->conv2_filter, pe->conv2_filter_backup TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_copy(pe->encod_filter, pe->encod_filter_backup TSRMLS_CC);
|
|
|
|
|
(*pe->conv2_filter->filter_function)(c, pe->conv2_filter TSRMLS_CC);
|
|
|
|
|
(*pe->conv2_filter->filter_flush)(pe->conv2_filter TSRMLS_CC);
|
|
|
|
|
(*pe->encod_filter->filter_flush)(pe->encod_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
n = pe->outdev.pos - pe->linehead + pe->firstindent;
|
|
|
|
|
pe->outdev.pos = pe->prevpos;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_copy(pe->conv2_filter_backup, pe->conv2_filter TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_copy(pe->encod_filter_backup, pe->encod_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (n >= 74) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pe->conv2_filter->filter_flush)(pe->conv2_filter TSRMLS_CC);
|
|
|
|
|
(*pe->encod_filter->filter_flush)(pe->encod_filter TSRMLS_CC);
|
|
|
|
|
mbfl_memory_device_strncat(&pe->outdev, "\x3f\x3d", 2 TSRMLS_CC); /* ?= */
|
|
|
|
|
mbfl_memory_device_strncat(&pe->outdev, pe->lwsp, pe->lwsplen TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pe->linehead = pe->outdev.pos;
|
|
|
|
|
pe->firstindent = 0;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_strncat(&pe->outdev, pe->encname, pe->encnamelen TSRMLS_CC);
|
|
|
|
|
c = (*pe->conv2_filter->filter_function)(c, pe->conv2_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
c = (*pe->conv2_filter->filter_function)(c, pe->conv2_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
default:
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_strncat(&pe->outdev, pe->encname, pe->encnamelen TSRMLS_CC);
|
|
|
|
|
c = (*pe->conv2_filter->filter_function)(c, pe->conv2_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pe->status2 = 1;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mime_header_encoder_collector(int c, void *data TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
struct mime_header_encoder_data *pe = (struct mime_header_encoder_data *)data;
|
|
|
|
|
|
|
|
|
|
switch (pe->status1) {
|
|
|
|
|
case 11: /* encoded word */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pe->block_filter->filter_function)(c, pe->block_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
default: /* ASCII */
|
|
|
|
|
if (c >= 0x21 && c < 0x7f) { /* ASCII exclude SPACE and CTLs */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output(c, &pe->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pe->status1 = 1;
|
|
|
|
|
} else if (pe->status1 == 0 && c == 0x20) { /* repeat SPACE */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output(c, &pe->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
if (pe->tmpdev.pos < 74 && c == 0x20) {
|
|
|
|
|
n = pe->outdev.pos - pe->linehead + pe->tmpdev.pos + pe->firstindent;
|
|
|
|
|
if (n > 74) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_strncat(&pe->outdev, pe->lwsp, pe->lwsplen TSRMLS_CC); /* LWSP */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pe->linehead = pe->outdev.pos;
|
|
|
|
|
pe->firstindent = 0;
|
|
|
|
|
} else if (pe->outdev.pos > 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output(0x20, &pe->outdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_devcat(&pe->outdev, &pe->tmpdev TSRMLS_CC);
|
|
|
|
|
mbfl_memory_device_reset(&pe->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pe->status1 = 0;
|
|
|
|
|
} else {
|
|
|
|
|
n = pe->outdev.pos - pe->linehead + pe->encnamelen + pe->firstindent;
|
|
|
|
|
if (n > 60) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_strncat(&pe->outdev, pe->lwsp, pe->lwsplen TSRMLS_CC); /* LWSP */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pe->linehead = pe->outdev.pos;
|
|
|
|
|
pe->firstindent = 0;
|
|
|
|
|
} else if (pe->outdev.pos > 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output(0x20, &pe->outdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_devcat(pe->block_filter, &pe->tmpdev TSRMLS_CC);
|
|
|
|
|
mbfl_memory_device_reset(&pe->tmpdev TSRMLS_CC);
|
|
|
|
|
(*pe->block_filter->filter_function)(c, pe->block_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pe->status1 = 11;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
mbfl_string *
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mime_header_encoder_result(struct mime_header_encoder_data *pe, mbfl_string *result TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (pe->status1 >= 10) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pe->conv2_filter->filter_flush)(pe->conv2_filter TSRMLS_CC);
|
|
|
|
|
(*pe->encod_filter->filter_flush)(pe->encod_filter TSRMLS_CC);
|
|
|
|
|
mbfl_memory_device_strncat(&pe->outdev, "\x3f\x3d", 2 TSRMLS_CC); /* ?= */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else if (pe->tmpdev.pos > 0) {
|
|
|
|
|
if (pe->outdev.pos > 0) {
|
|
|
|
|
if ((pe->outdev.pos - pe->linehead + pe->tmpdev.pos) > 74) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_strncat(&pe->outdev, pe->lwsp, pe->lwsplen TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output(0x20, &pe->outdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_devcat(&pe->outdev, &pe->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_reset(&pe->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pe->prevpos = 0;
|
|
|
|
|
pe->linehead = 0;
|
|
|
|
|
pe->status1 = 0;
|
|
|
|
|
pe->status2 = 0;
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
return mbfl_memory_device_result(&pe->outdev, result TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
struct mime_header_encoder_data*
|
|
|
|
|
mime_header_encoder_new(
|
|
|
|
|
enum mbfl_no_encoding incode,
|
|
|
|
|
enum mbfl_no_encoding outcode,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
enum mbfl_no_encoding transenc TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
const char *s;
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_encoding *outencoding;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
struct mime_header_encoder_data *pe;
|
|
|
|
|
|
|
|
|
|
/* get output encoding and check MIME charset name */
|
|
|
|
|
outencoding = mbfl_no2encoding(outcode);
|
|
|
|
|
if (outencoding == NULL || outencoding->mime_name == NULL || outencoding->mime_name[0] == '\0') {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
pe = (struct mime_header_encoder_data*)mbfl_malloc(sizeof(struct mime_header_encoder_data));
|
|
|
|
|
if (pe == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_init(&pe->outdev, 0, 0 TSRMLS_CC);
|
|
|
|
|
mbfl_memory_device_init(&pe->tmpdev, 0, 0 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pe->prevpos = 0;
|
|
|
|
|
pe->linehead = 0;
|
|
|
|
|
pe->firstindent = 0;
|
|
|
|
|
pe->status1 = 0;
|
|
|
|
|
pe->status2 = 0;
|
|
|
|
|
|
|
|
|
|
/* make the encoding description string exp. "=?ISO-2022-JP?B?" */
|
|
|
|
|
n = 0;
|
|
|
|
|
pe->encname[n++] = 0x3d;
|
|
|
|
|
pe->encname[n++] = 0x3f;
|
|
|
|
|
s = outencoding->mime_name;
|
|
|
|
|
while (*s) {
|
|
|
|
|
pe->encname[n++] = *s++;
|
|
|
|
|
}
|
|
|
|
|
pe->encname[n++] = 0x3f;
|
|
|
|
|
if (transenc == mbfl_no_encoding_qprint) {
|
|
|
|
|
pe->encname[n++] = 0x51;
|
|
|
|
|
} else {
|
|
|
|
|
pe->encname[n++] = 0x42;
|
|
|
|
|
transenc = mbfl_no_encoding_base64;
|
|
|
|
|
}
|
|
|
|
|
pe->encname[n++] = 0x3f;
|
|
|
|
|
pe->encname[n] = '\0';
|
|
|
|
|
pe->encnamelen = n;
|
|
|
|
|
|
|
|
|
|
n = 0;
|
|
|
|
|
pe->lwsp[n++] = 0x0d;
|
|
|
|
|
pe->lwsp[n++] = 0x0a;
|
|
|
|
|
pe->lwsp[n++] = 0x20;
|
|
|
|
|
pe->lwsp[n] = '\0';
|
|
|
|
|
pe->lwsplen = n;
|
|
|
|
|
|
|
|
|
|
/* transfer encode filter */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
pe->encod_filter = mbfl_convert_filter_new(outcode, transenc, mbfl_memory_device_output, 0, &(pe->outdev) TSRMLS_CC);
|
|
|
|
|
pe->encod_filter_backup = mbfl_convert_filter_new(outcode, transenc, mbfl_memory_device_output, 0, &(pe->outdev) TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
/* Output code filter */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
pe->conv2_filter = mbfl_convert_filter_new(mbfl_no_encoding_wchar, outcode, mbfl_filter_output_pipe, 0, pe->encod_filter TSRMLS_CC);
|
|
|
|
|
pe->conv2_filter_backup = mbfl_convert_filter_new(mbfl_no_encoding_wchar, outcode, mbfl_filter_output_pipe, 0, pe->encod_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
/* encoded block filter */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
pe->block_filter = mbfl_convert_filter_new(mbfl_no_encoding_wchar, mbfl_no_encoding_wchar, mime_header_encoder_block_collector, 0, pe TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
/* Input code filter */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
pe->conv1_filter = mbfl_convert_filter_new(incode, mbfl_no_encoding_wchar, mime_header_encoder_collector, 0, pe TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
if (pe->encod_filter == NULL ||
|
|
|
|
|
pe->encod_filter_backup == NULL ||
|
|
|
|
|
pe->conv2_filter == NULL ||
|
|
|
|
|
pe->conv2_filter_backup == NULL ||
|
|
|
|
|
pe->conv1_filter == NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mime_header_encoder_delete(pe TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (transenc == mbfl_no_encoding_qprint) {
|
|
|
|
|
pe->encod_filter->status |= MBFL_QPRINT_STS_MIME_HEADER;
|
|
|
|
|
pe->encod_filter_backup->status |= MBFL_QPRINT_STS_MIME_HEADER;
|
|
|
|
|
} else {
|
|
|
|
|
pe->encod_filter->status |= MBFL_BASE64_STS_MIME_HEADER;
|
|
|
|
|
pe->encod_filter_backup->status |= MBFL_BASE64_STS_MIME_HEADER;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return pe;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mime_header_encoder_delete(struct mime_header_encoder_data *pe TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (pe) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_delete(pe->conv1_filter TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(pe->block_filter TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(pe->conv2_filter TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(pe->conv2_filter_backup TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(pe->encod_filter TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(pe->encod_filter_backup TSRMLS_CC);
|
|
|
|
|
mbfl_memory_device_clear(&pe->outdev TSRMLS_CC);
|
|
|
|
|
mbfl_memory_device_clear(&pe->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_free((void*)pe);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mime_header_encoder_feed(int c, struct mime_header_encoder_data *pe TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2002-04-10 12:47:41 +00:00
|
|
|
|
return (*pe->conv1_filter->filter_function)(c, pe->conv1_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
mbfl_string *
|
|
|
|
|
mbfl_mime_header_encode(
|
|
|
|
|
mbfl_string *string,
|
|
|
|
|
mbfl_string *result,
|
|
|
|
|
enum mbfl_no_encoding outcode,
|
|
|
|
|
enum mbfl_no_encoding encoding,
|
|
|
|
|
const char *linefeed,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
int indent TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
unsigned char *p;
|
|
|
|
|
struct mime_header_encoder_data *pe;
|
|
|
|
|
|
|
|
|
|
mbfl_string_init(result);
|
|
|
|
|
result->no_language = string->no_language;
|
|
|
|
|
result->no_encoding = mbfl_no_encoding_ascii;
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
pe = mime_header_encoder_new(string->no_encoding, outcode, encoding TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (pe == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (linefeed != NULL) {
|
|
|
|
|
n = 0;
|
|
|
|
|
while (*linefeed && n < 8) {
|
|
|
|
|
pe->lwsp[n++] = *linefeed++;
|
|
|
|
|
}
|
|
|
|
|
pe->lwsp[n++] = 0x20;
|
|
|
|
|
pe->lwsp[n] = '\0';
|
|
|
|
|
pe->lwsplen = n;
|
|
|
|
|
}
|
|
|
|
|
if (indent > 0 && indent < 74) {
|
|
|
|
|
pe->firstindent = indent;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
n = string->len;
|
|
|
|
|
p = string->val;
|
|
|
|
|
while (n > 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pe->conv1_filter->filter_function)(*p++, pe->conv1_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
result = mime_header_encoder_result(pe, result TSRMLS_CC);
|
|
|
|
|
mime_header_encoder_delete(pe TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return result;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* MIME header decode
|
|
|
|
|
*/
|
|
|
|
|
struct mime_header_decoder_data {
|
|
|
|
|
mbfl_convert_filter *deco_filter;
|
|
|
|
|
mbfl_convert_filter *conv1_filter;
|
|
|
|
|
mbfl_convert_filter *conv2_filter;
|
|
|
|
|
mbfl_memory_device outdev;
|
|
|
|
|
mbfl_memory_device tmpdev;
|
|
|
|
|
int cspos;
|
|
|
|
|
int status;
|
|
|
|
|
enum mbfl_no_encoding encoding;
|
|
|
|
|
enum mbfl_no_encoding incode;
|
|
|
|
|
enum mbfl_no_encoding outcode;
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mime_header_decoder_collector(int c, void* data TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2002-08-02 10:22:31 +00:00
|
|
|
|
const mbfl_encoding *encoding;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
struct mime_header_decoder_data *pd = (struct mime_header_decoder_data*)data;
|
|
|
|
|
|
|
|
|
|
switch (pd->status) {
|
|
|
|
|
case 1:
|
|
|
|
|
if (c == 0x3f) { /* ? */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output(c, &pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pd->cspos = pd->tmpdev.pos;
|
|
|
|
|
pd->status = 2;
|
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_devcat(pd->conv1_filter, &pd->tmpdev TSRMLS_CC);
|
|
|
|
|
mbfl_memory_device_reset(&pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (c == 0x3d) { /* = */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output(c, &pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else if (c == 0x0d || c == 0x0a) { /* CR or LF */
|
|
|
|
|
pd->status = 9;
|
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pd->conv1_filter->filter_function)(c, pd->conv1_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pd->status = 0;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
case 2: /* store charset string */
|
|
|
|
|
if (c == 0x3f) { /* ? */
|
|
|
|
|
/* identify charset */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output('\0', &pd->tmpdev TSRMLS_CC);
|
2002-11-02 13:38:32 +00:00
|
|
|
|
encoding = mbfl_name2encoding((const char *)&pd->tmpdev.buffer[pd->cspos]);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (encoding != NULL) {
|
|
|
|
|
pd->incode = encoding->no_encoding;
|
|
|
|
|
pd->status = 3;
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_unput(&pd->tmpdev TSRMLS_CC);
|
|
|
|
|
mbfl_memory_device_output(c, &pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output(c, &pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (pd->tmpdev.pos > 100) { /* too long charset string */
|
|
|
|
|
pd->status = 0;
|
|
|
|
|
} else if (c == 0x0d || c == 0x0a) { /* CR or LF */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_unput(&pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pd->status = 9;
|
|
|
|
|
}
|
|
|
|
|
if (pd->status != 2) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_devcat(pd->conv1_filter, &pd->tmpdev TSRMLS_CC);
|
|
|
|
|
mbfl_memory_device_reset(&pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
case 3: /* identify encoding */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output(c, &pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (c == 0x42 || c == 0x62) { /* 'B' or 'b' */
|
|
|
|
|
pd->encoding = mbfl_no_encoding_base64;
|
|
|
|
|
pd->status = 4;
|
|
|
|
|
} else if (c == 0x51 || c == 0x71) { /* 'Q' or 'q' */
|
|
|
|
|
pd->encoding = mbfl_no_encoding_qprint;
|
|
|
|
|
pd->status = 4;
|
|
|
|
|
} else {
|
|
|
|
|
if (c == 0x0d || c == 0x0a) { /* CR or LF */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_unput(&pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pd->status = 9;
|
|
|
|
|
} else {
|
|
|
|
|
pd->status = 0;
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_devcat(pd->conv1_filter, &pd->tmpdev TSRMLS_CC);
|
|
|
|
|
mbfl_memory_device_reset(&pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
case 4: /* reset filter */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output(c, &pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (c == 0x3f) { /* ? */
|
|
|
|
|
/* charset convert filter */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_reset(pd->conv1_filter, pd->incode, mbfl_no_encoding_wchar TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
/* decode filter */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_reset(pd->deco_filter, pd->encoding, mbfl_no_encoding_8bit TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pd->status = 5;
|
|
|
|
|
} else {
|
|
|
|
|
if (c == 0x0d || c == 0x0a) { /* CR or LF */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_unput(&pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pd->status = 9;
|
|
|
|
|
} else {
|
|
|
|
|
pd->status = 0;
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_devcat(pd->conv1_filter, &pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_reset(&pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
case 5: /* encoded block */
|
|
|
|
|
if (c == 0x3f) { /* ? */
|
|
|
|
|
pd->status = 6;
|
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pd->deco_filter->filter_function)(c, pd->deco_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
case 6: /* check end position */
|
|
|
|
|
if (c == 0x3d) { /* = */
|
|
|
|
|
/* flush and reset filter */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pd->deco_filter->filter_flush)(pd->deco_filter TSRMLS_CC);
|
|
|
|
|
(*pd->conv1_filter->filter_flush)(pd->conv1_filter TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_reset(pd->conv1_filter, mbfl_no_encoding_ascii, mbfl_no_encoding_wchar TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pd->status = 7;
|
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pd->deco_filter->filter_function)(0x3f, pd->deco_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (c != 0x3f) { /* ? */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pd->deco_filter->filter_function)(c, pd->deco_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pd->status = 5;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
case 7: /* after encoded block */
|
|
|
|
|
if (c == 0x0d || c == 0x0a) { /* CR LF */
|
|
|
|
|
pd->status = 8;
|
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output(c, &pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (c == 0x3d) { /* = */
|
|
|
|
|
pd->status = 1;
|
|
|
|
|
} else if (c != 0x20 && c != 0x09) { /* not space */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_devcat(pd->conv1_filter, &pd->tmpdev TSRMLS_CC);
|
|
|
|
|
mbfl_memory_device_reset(&pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pd->status = 0;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
case 8: /* folding */
|
|
|
|
|
case 9: /* folding */
|
|
|
|
|
if (c != 0x0d && c != 0x0a && c != 0x20 && c != 0x09) {
|
|
|
|
|
if (c == 0x3d) { /* = */
|
|
|
|
|
if (pd->status == 8) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output(0x20, &pd->tmpdev TSRMLS_CC); /* SPACE */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pd->conv1_filter->filter_function)(0x20, pd->conv1_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output(c, &pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pd->status = 1;
|
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output(0x20, &pd->tmpdev TSRMLS_CC);
|
|
|
|
|
mbfl_memory_device_output(c, &pd->tmpdev TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_devcat(pd->conv1_filter, &pd->tmpdev TSRMLS_CC);
|
|
|
|
|
mbfl_memory_device_reset(&pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pd->status = 0;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
default: /* non encoded block */
|
|
|
|
|
if (c == 0x0d || c == 0x0a) { /* CR LF */
|
|
|
|
|
pd->status = 9;
|
|
|
|
|
} else if (c == 0x3d) { /* = */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output(c, &pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pd->status = 1;
|
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pd->conv1_filter->filter_function)(c, pd->conv1_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
mbfl_string *
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mime_header_decoder_result(struct mime_header_decoder_data *pd, mbfl_string *result TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
switch (pd->status) {
|
|
|
|
|
case 1:
|
|
|
|
|
case 2:
|
|
|
|
|
case 3:
|
|
|
|
|
case 4:
|
|
|
|
|
case 7:
|
|
|
|
|
case 8:
|
|
|
|
|
case 9:
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_devcat(pd->conv1_filter, &pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
case 5:
|
|
|
|
|
case 6:
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pd->deco_filter->filter_flush)(pd->deco_filter TSRMLS_CC);
|
|
|
|
|
(*pd->conv1_filter->filter_flush)(pd->conv1_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pd->conv2_filter->filter_flush)(pd->conv2_filter TSRMLS_CC);
|
|
|
|
|
mbfl_memory_device_reset(&pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pd->status = 0;
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
return mbfl_memory_device_result(&pd->outdev, result TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
struct mime_header_decoder_data*
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mime_header_decoder_new(enum mbfl_no_encoding outcode TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
struct mime_header_decoder_data *pd;
|
|
|
|
|
|
|
|
|
|
pd = (struct mime_header_decoder_data*)mbfl_malloc(sizeof(struct mime_header_decoder_data));
|
|
|
|
|
if (pd == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_init(&pd->outdev, 0, 0 TSRMLS_CC);
|
|
|
|
|
mbfl_memory_device_init(&pd->tmpdev, 0, 0 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
pd->cspos = 0;
|
|
|
|
|
pd->status = 0;
|
|
|
|
|
pd->encoding = mbfl_no_encoding_pass;
|
|
|
|
|
pd->incode = mbfl_no_encoding_ascii;
|
|
|
|
|
pd->outcode = outcode;
|
|
|
|
|
/* charset convert filter */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
pd->conv2_filter = mbfl_convert_filter_new(mbfl_no_encoding_wchar, pd->outcode, mbfl_memory_device_output, 0, &pd->outdev TSRMLS_CC);
|
|
|
|
|
pd->conv1_filter = mbfl_convert_filter_new(pd->incode, mbfl_no_encoding_wchar, mbfl_filter_output_pipe, 0, pd->conv2_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
/* decode filter */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
pd->deco_filter = mbfl_convert_filter_new(pd->encoding, mbfl_no_encoding_8bit, mbfl_filter_output_pipe, 0, pd->conv1_filter TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
if (pd->conv1_filter == NULL || pd->conv2_filter == NULL || pd->deco_filter == NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mime_header_decoder_delete(pd TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return pd;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mime_header_decoder_delete(struct mime_header_decoder_data *pd TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
if (pd) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_delete(pd->conv2_filter TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(pd->conv1_filter TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(pd->deco_filter TSRMLS_CC);
|
|
|
|
|
mbfl_memory_device_clear(&pd->outdev TSRMLS_CC);
|
|
|
|
|
mbfl_memory_device_clear(&pd->tmpdev TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
mbfl_free((void*)pd);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mime_header_decoder_feed(int c, struct mime_header_decoder_data *pd TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
2002-04-10 12:47:41 +00:00
|
|
|
|
return mime_header_decoder_collector(c, pd TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
mbfl_string *
|
|
|
|
|
mbfl_mime_header_decode(
|
|
|
|
|
mbfl_string *string,
|
|
|
|
|
mbfl_string *result,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
enum mbfl_no_encoding outcode TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
int n;
|
|
|
|
|
unsigned char *p;
|
|
|
|
|
struct mime_header_decoder_data *pd;
|
|
|
|
|
|
|
|
|
|
mbfl_string_init(result);
|
|
|
|
|
result->no_language = string->no_language;
|
|
|
|
|
result->no_encoding = outcode;
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
pd = mime_header_decoder_new(outcode TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (pd == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* feed data */
|
|
|
|
|
n = string->len;
|
|
|
|
|
p = string->val;
|
|
|
|
|
while (n > 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mime_header_decoder_collector(*p++, pd TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
|
2002-04-10 12:47:41 +00:00
|
|
|
|
result = mime_header_decoder_result(pd, result TSRMLS_CC);
|
|
|
|
|
mime_header_decoder_delete(pd TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return result;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
* convert HTML numeric entity
|
|
|
|
|
*/
|
|
|
|
|
struct collector_htmlnumericentity_data {
|
|
|
|
|
mbfl_convert_filter *decoder;
|
|
|
|
|
int status;
|
|
|
|
|
int cache;
|
|
|
|
|
int digit;
|
|
|
|
|
int *convmap;
|
|
|
|
|
int mapsize;
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
collector_encode_htmlnumericentity(int c, void *data TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
struct collector_htmlnumericentity_data *pc = (struct collector_htmlnumericentity_data *)data;
|
|
|
|
|
int f, n, s, r, d, size, *mapelm;
|
|
|
|
|
|
|
|
|
|
size = pc->mapsize;
|
|
|
|
|
f = 0;
|
|
|
|
|
n = 0;
|
|
|
|
|
while (n < size) {
|
|
|
|
|
mapelm = &(pc->convmap[n*4]);
|
|
|
|
|
if (c >= mapelm[0] && c <= mapelm[1]) {
|
|
|
|
|
s = (c + mapelm[2]) & mapelm[3];
|
2001-05-06 22:06:10 +00:00
|
|
|
|
if (s >= 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->decoder->filter_function)(0x26, pc->decoder TSRMLS_CC); /* '&' */
|
|
|
|
|
(*pc->decoder->filter_function)(0x23, pc->decoder TSRMLS_CC); /* '#' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
r = 100000000;
|
|
|
|
|
s %= r;
|
|
|
|
|
while (r > 0) {
|
|
|
|
|
d = s/r;
|
|
|
|
|
if (d || f) {
|
|
|
|
|
f = 1;
|
|
|
|
|
s %= r;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->decoder->filter_function)(mbfl_hexchar_table[d], pc->decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
r /= 10;
|
|
|
|
|
}
|
2001-05-06 22:06:10 +00:00
|
|
|
|
if (!f) {
|
|
|
|
|
f = 1;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->decoder->filter_function)(mbfl_hexchar_table[0], pc->decoder TSRMLS_CC);
|
2001-05-06 22:06:10 +00:00
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->decoder->filter_function)(0x3b, pc->decoder TSRMLS_CC); /* ';' */
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
if (f) {
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n++;
|
|
|
|
|
}
|
|
|
|
|
if (!f) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->decoder->filter_function)(c, pc->decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static int
|
2002-04-10 12:47:41 +00:00
|
|
|
|
collector_decode_htmlnumericentity(int c, void *data TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
struct collector_htmlnumericentity_data *pc = (struct collector_htmlnumericentity_data *)data;
|
|
|
|
|
int f, n, s, r, d, size, *mapelm;
|
|
|
|
|
|
|
|
|
|
switch (pc->status) {
|
|
|
|
|
case 1:
|
|
|
|
|
if (c == 0x23) { /* '#' */
|
|
|
|
|
pc->status = 2;
|
|
|
|
|
} else {
|
|
|
|
|
pc->status = 0;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->decoder->filter_function)(0x26, pc->decoder TSRMLS_CC); /* '&' */
|
|
|
|
|
(*pc->decoder->filter_function)(c, pc->decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
case 2:
|
|
|
|
|
if (c >= 0x30 && c <= 0x39) { /* '0' - '9' */
|
|
|
|
|
pc->cache = c - 0x30;
|
|
|
|
|
pc->status = 3;
|
|
|
|
|
pc->digit = 1;
|
|
|
|
|
} else {
|
|
|
|
|
pc->status = 0;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->decoder->filter_function)(0x26, pc->decoder TSRMLS_CC); /* '&' */
|
|
|
|
|
(*pc->decoder->filter_function)(0x23, pc->decoder TSRMLS_CC); /* '#' */
|
|
|
|
|
(*pc->decoder->filter_function)(c, pc->decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
case 3:
|
|
|
|
|
s = 0;
|
|
|
|
|
f = 0;
|
|
|
|
|
if (c >= 0x30 && c <= 0x39) { /* '0' - '9' */
|
|
|
|
|
if (pc->digit > 9) {
|
|
|
|
|
pc->status = 0;
|
|
|
|
|
s = pc->cache;
|
|
|
|
|
f = 1;
|
|
|
|
|
} else {
|
|
|
|
|
s = pc->cache*10 + c - 0x30;
|
|
|
|
|
pc->cache = s;
|
|
|
|
|
pc->digit++;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
pc->status = 0;
|
|
|
|
|
s = pc->cache;
|
|
|
|
|
f = 1;
|
|
|
|
|
n = 0;
|
|
|
|
|
size = pc->mapsize;
|
|
|
|
|
while (n < size) {
|
|
|
|
|
mapelm = &(pc->convmap[n*4]);
|
|
|
|
|
d = s - mapelm[2];
|
|
|
|
|
if (d >= mapelm[0] && d <= mapelm[1]) {
|
|
|
|
|
f = 0;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->decoder->filter_function)(d, pc->decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
if (c != 0x3b) { /* ';' */
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->decoder->filter_function)(c, pc->decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n++;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
if (f) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->decoder->filter_function)(0x26, pc->decoder TSRMLS_CC); /* '&' */
|
|
|
|
|
(*pc->decoder->filter_function)(0x23, pc->decoder TSRMLS_CC); /* '#' */
|
2001-05-06 22:06:10 +00:00
|
|
|
|
r = 1;
|
|
|
|
|
n = pc->digit;
|
|
|
|
|
while (n > 0) {
|
|
|
|
|
r *= 10;
|
|
|
|
|
n--;
|
|
|
|
|
}
|
2001-05-01 01:52:55 +00:00
|
|
|
|
s %= r;
|
2001-05-06 22:06:10 +00:00
|
|
|
|
r /= 10;
|
2001-05-01 01:52:55 +00:00
|
|
|
|
while (r > 0) {
|
|
|
|
|
d = s/r;
|
|
|
|
|
s %= r;
|
2001-05-06 22:06:10 +00:00
|
|
|
|
r /= 10;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->decoder->filter_function)(mbfl_hexchar_table[d], pc->decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->decoder->filter_function)(c, pc->decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
default:
|
|
|
|
|
if (c == 0x26) { /* '&' */
|
|
|
|
|
pc->status = 1;
|
|
|
|
|
} else {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
(*pc->decoder->filter_function)(c, pc->decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return c;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
mbfl_string *
|
|
|
|
|
mbfl_html_numeric_entity(
|
|
|
|
|
mbfl_string *string,
|
|
|
|
|
mbfl_string *result,
|
|
|
|
|
int *convmap,
|
|
|
|
|
int mapsize,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
int type TSRMLS_DC)
|
2001-05-01 01:52:55 +00:00
|
|
|
|
{
|
|
|
|
|
struct collector_htmlnumericentity_data pc;
|
|
|
|
|
mbfl_memory_device device;
|
|
|
|
|
mbfl_convert_filter *encoder;
|
|
|
|
|
int n;
|
|
|
|
|
unsigned char *p;
|
|
|
|
|
|
|
|
|
|
if (string == NULL || result == NULL) {
|
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
mbfl_string_init(result);
|
|
|
|
|
result->no_language = string->no_language;
|
|
|
|
|
result->no_encoding = string->no_encoding;
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_init(&device, string->len, 0 TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
/* output code filter */
|
|
|
|
|
pc.decoder = mbfl_convert_filter_new(
|
|
|
|
|
mbfl_no_encoding_wchar,
|
|
|
|
|
string->no_encoding,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_memory_device_output, 0, &device TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
/* wchar filter */
|
|
|
|
|
if (type == 0) {
|
|
|
|
|
encoder = mbfl_convert_filter_new(
|
|
|
|
|
string->no_encoding,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
collector_encode_htmlnumericentity, 0, &pc TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
} else {
|
|
|
|
|
encoder = mbfl_convert_filter_new(
|
|
|
|
|
string->no_encoding,
|
|
|
|
|
mbfl_no_encoding_wchar,
|
2002-04-10 12:47:41 +00:00
|
|
|
|
collector_decode_htmlnumericentity, 0, &pc TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
}
|
|
|
|
|
if (pc.decoder == NULL || encoder == NULL) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_delete(encoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(pc.decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
return NULL;
|
|
|
|
|
}
|
|
|
|
|
pc.status = 0;
|
|
|
|
|
pc.cache = 0;
|
|
|
|
|
pc.digit = 0;
|
|
|
|
|
pc.convmap = convmap;
|
|
|
|
|
pc.mapsize = mapsize;
|
|
|
|
|
|
|
|
|
|
/* feed data */
|
|
|
|
|
p = string->val;
|
|
|
|
|
n = string->len;
|
|
|
|
|
if (p != NULL) {
|
|
|
|
|
while (n > 0) {
|
2002-04-10 12:47:41 +00:00
|
|
|
|
if ((*encoder->filter_function)(*p++, encoder TSRMLS_CC) < 0) {
|
2001-05-01 01:52:55 +00:00
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
n--;
|
|
|
|
|
}
|
|
|
|
|
}
|
2002-04-10 12:47:41 +00:00
|
|
|
|
mbfl_convert_filter_flush(encoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_flush(pc.decoder TSRMLS_CC);
|
|
|
|
|
result = mbfl_memory_device_result(&device, result TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(encoder TSRMLS_CC);
|
|
|
|
|
mbfl_convert_filter_delete(pc.decoder TSRMLS_CC);
|
2001-05-01 01:52:55 +00:00
|
|
|
|
|
|
|
|
|
return result;
|
2002-03-13 00:29:53 +00:00
|
|
|
|
}
|
2002-04-30 12:00:42 +00:00
|
|
|
|
|
2002-10-06 09:36:26 +00:00
|
|
|
|
#endif /* HAVE_MBSTRING */
|
|
|
|
|
|
2002-04-30 12:00:42 +00:00
|
|
|
|
/*
|
|
|
|
|
* Local variables:
|
|
|
|
|
* tab-width: 4
|
|
|
|
|
* c-basic-offset: 4
|
|
|
|
|
* End:
|
|
|
|
|
*/
|