r17939 - in /branches/upstream/libmime-charset-perl/current: Changes Charset-ja_JP.pod Charset.pm Charset/JA_JP.pod MANIFEST META.yml README
rmayorga-guest at users.alioth.debian.org
rmayorga-guest at users.alioth.debian.org
Mon Mar 24 05:33:21 UTC 2008
Author: rmayorga-guest
Date: Mon Mar 24 05:33:16 2008
New Revision: 17939
URL: http://svn.debian.org/wsvn/?sc=1&rev=17939
Log:
[svn-upgrade] Integrating new upstream version, libmime-charset-perl (1.002)
Added:
branches/upstream/libmime-charset-perl/current/Charset/JA_JP.pod
Removed:
branches/upstream/libmime-charset-perl/current/Charset-ja_JP.pod
Modified:
branches/upstream/libmime-charset-perl/current/Changes
branches/upstream/libmime-charset-perl/current/Charset.pm
branches/upstream/libmime-charset-perl/current/MANIFEST
branches/upstream/libmime-charset-perl/current/META.yml
branches/upstream/libmime-charset-perl/current/README
Modified: branches/upstream/libmime-charset-perl/current/Changes
URL: http://svn.debian.org/wsvn/branches/upstream/libmime-charset-perl/current/Changes?rev=17939&op=diff
==============================================================================
--- branches/upstream/libmime-charset-perl/current/Changes (original)
+++ branches/upstream/libmime-charset-perl/current/Changes Mon Mar 24 05:33:16 2008
@@ -1,3 +1,9 @@
+2008-03-20 Hatuka*nezumi - IKEDA Soji <hatuka at nezumi.nu>
+ * Release 1.002.
+ * New method undecode().
+ * encoder(): added argument to set instance.
+ * Cleanup PODs.
+
2008-03-15 Hatuka*nezumi - IKEDA Soji <hatuka at nezumi.nu>
* Release 1.001.
Modified: branches/upstream/libmime-charset-perl/current/Charset.pm
URL: http://svn.debian.org/wsvn/branches/upstream/libmime-charset-perl/current/Charset.pm?rev=17939&op=diff
==============================================================================
--- branches/upstream/libmime-charset-perl/current/Charset.pm (original)
+++ branches/upstream/libmime-charset-perl/current/Charset.pm Mon Mar 24 05:33:16 2008
@@ -121,7 +121,7 @@
}
}
-$VERSION = '1.001';
+$VERSION = '1.002';
######## Private Attributes ########
@@ -375,7 +375,7 @@
=item canonical_charset CHARSET
-Get canonical name for charset CHARSET.
+Get canonical name for charset.
=cut
@@ -391,23 +391,6 @@
$self->{InputCharset};
}
-=item $charset->decode(STRING [,CHECK])
-
-Decode STRING to Unicode.
-
-B<Note>:
-When Unicode/multibyte support is disabled (see L<"USE_ENCODE">),
-this function will die.
-
-=cut
-
-sub decode($$$;) {
- my $self = shift;
- my $s = shift;
- my $check = shift || 0;
- $self->{Decoder}->decode($s, $check);
-}
-
=item $charset->decoder
Get L<"Encode::Encoding"> object to decode strings by charset.
@@ -419,39 +402,23 @@
$self->{Decoder};
}
-=item $charset->encode(STRING [,CHECK])
-
-Encode STRING (Unicode or non-Unicode) using compatible charset recommended
-to be used for messages on Internet (if this module know it).
-Note that string will be decoded then encoded even if compatible charset
-was equal to original charset.
-
-B<Note>:
-When Unicode/multibyte support is disabled (see L<"USE_ENCODE">),
-this function will die.
-
-=cut
-
-sub encode($$$;) {
- my $self = shift;
- my $s = shift;
- my $check = shift || 0;
-
- unless (is_utf8($s) or $s =~ /[^\x00-\xFF]/) {
- $s = $self->{Decoder}->decode($s, ($check & 0x1)? FB_CROAK(): 0);
- }
- $self->{Encoder}->encode($s, $check);
-}
-
-=item $charset->encoder
+=item $charset->encoder([CHARSET])
Get L<"Encode::Encoding"> object to encode Unicode string using compatible
charset recommended to be used for messages on Internet.
=cut
-sub encoder($) {
- my $self = shift;
+sub encoder($$;) {
+ my $self = shift;
+ my $charset = shift;
+ if ($charset) {
+ $charset = MIME::Charset->new($charset) unless ref $charset;
+ $self->{OutputCharset} = $charset->{InputCharset};
+ $self->{Encoder} = $charset->{Decoder};
+ #XXX$self->{BodyEncoding} = $charset->{BodyEncoding};
+ #XXX$self->{HeaderEncoding} = $charset->{HeaderEncoding};
+ }
$self->{Encoder};
}
@@ -578,6 +545,47 @@
$enc = 'BASE64';
}
return ($encoded, $cset, $enc);
+}
+
+=item $charset->decode(STRING [,CHECK])
+
+Decode STRING to Unicode.
+
+B<Note>:
+When Unicode/multibyte support is disabled (see L<"USE_ENCODE">),
+this function will die.
+
+=cut
+
+sub decode($$$;) {
+ my $self = shift;
+ my $s = shift;
+ my $check = shift || 0;
+ $self->{Decoder}->decode($s, $check);
+}
+
+=item $charset->encode(STRING [,CHECK])
+
+Encode STRING (Unicode or non-Unicode) using compatible charset recommended
+to be used for messages on Internet (if this module knows it).
+Note that string will be decoded then encoded even if compatible charset
+was equal to original charset.
+
+B<Note>:
+When Unicode/multibyte support is disabled (see L<"USE_ENCODE">),
+this function will die.
+
+=cut
+
+sub encode($$$;) {
+ my $self = shift;
+ my $s = shift;
+ my $check = shift || 0;
+
+ unless (is_utf8($s) or $s =~ /[^\x00-\xFF]/) {
+ $s = $self->{Decoder}->decode($s, ($check & 0x1)? FB_CROAK(): 0);
+ }
+ $self->{Encoder}->encode($s, $check);
}
=item $charset->encoded_header_len(STRING [, ENCODING])
@@ -839,6 +847,24 @@
return $DEFAULT_CHARSET;
}
+=item $charset->undecode(STRING [,CHECK])
+
+Encode Unicode string STRING to byte string by input charset of $charset.
+This is equivalent to C<< $charset->decoder->encode() >>.
+
+B<Note>:
+When Unicode/multibyte support is disabled (see L<"USE_ENCODE">),
+this function will die.
+
+=cut
+
+sub undecode($$$;) {
+ my $self = shift;
+ my $s = shift;
+ my $check = shift || 0;
+ $self->{Decoder}->encode($s, $check);
+}
+
=head2 Manipulating Module Defaults
=over 4
Added: branches/upstream/libmime-charset-perl/current/Charset/JA_JP.pod
URL: http://svn.debian.org/wsvn/branches/upstream/libmime-charset-perl/current/Charset/JA_JP.pod?rev=17939&op=file
==============================================================================
--- branches/upstream/libmime-charset-perl/current/Charset/JA_JP.pod (added)
+++ branches/upstream/libmime-charset-perl/current/Charset/JA_JP.pod Mon Mar 24 05:33:16 2008
@@ -1,0 +1,474 @@
+=encoding utf-8
+
+=head1 NAME
+
+MIME::Charset::JA_JP - MIME のためのキャラクタセット情報
+
+=head1 SYNOPSIS
+
+ use MIME::Charset;
+
+ $charset = MIME::Charset->new("euc-jp");
+
+キャラクタセット情報の取得:
+
+ $benc = $charset->body_encoding; # 例 "Q"
+ $cset = $charset->canonical_charset; # 例 "US-ASCII"
+ $henc = $charset->header_encoding; # 例 "S"
+ $cset = $charset->output_charset; # 例 "ISO-2022-JP"
+
+テキストデータの変換:
+
+ ($text, $charset, $encoding) =
+ $charset->header_encode(
+ "\xc9\xc2\xc5\xaa\xc0\xde\xc3\xef\xc5\xaa".
+ "\xc7\xd1\xca\xaa\xbd\xd0\xce\xcf\xb4\xef");
+ # ...例ãˆã° (<converted>, "ISO-2022-JP", "B") ã‚’è¿”ã™
+
+ ($text, $charset, $encoding) =
+ $charset->body_encode(
+ "Collectioneur path\xe9tiquement ".
+ "\xe9clectique de d\xe9chets");
+ # ...例ãˆã° (<original>, "ISO-8859-1", "QUOTED-PRINTABLE") ã‚’è¿”ã™
+
+ $len = $charset->encoded_header_len(
+ "Perl\xe8\xa8\x80\xe8\xaa\x9e", "b"); # 例 28
+
+モジュール既定値の操作:
+
+ use MIME::Charset;
+
+ MIME::Charset::alias("csEUCKR", "euc-kr");
+ MIME::Charset::default("iso-8859-1");
+ MIME::Charset::fallback("us-ascii");
+
+非OOP関数 (近い将来に廃止):
+
+ use MIME::Charset qw(:info);
+
+ $benc = body_encoding("iso-8859-2"); # "Q"
+ $cset = canonical_charset("ANSI X3.4-1968"); # "US-ASCII"
+ $henc = header_encoding("utf-8"); # "S"
+ $cset = output_charset("shift_jis"); # "ISO-2022-JP"
+
+ use MIME::Charset qw(:trans);
+
+ ($text, $charset, $encoding) =
+ header_encode(
+ "\xc9\xc2\xc5\xaa\xc0\xde\xc3\xef\xc5\xaa".
+ "\xc7\xd1\xca\xaa\xbd\xd0\xce\xcf\xb4\xef",
+ "euc-jp");
+ # ...(<変æ›ã•れãŸãƒ†ã‚スト>, "ISO-2022-JP", "B") ã‚’è¿”ã™ã€‚
+
+ ($text, $charset, $encoding) =
+ body_encode(
+ "Collectioneur path\xe9tiquement ".
+ "\xe9clectique de d\xe9chets",
+ "latin1");
+ # ...(<å
ƒã®ãƒ†ã‚スト>, "ISO-8859-1", "QUOTED-PRINTABLE") ã‚’è¿”ã™ã€‚
+
+ $len = encoded_header_len(
+ "Perl\xe8\xa8\x80\xe8\xaa\x9e", "b", "utf-8"); # 28
+
+=head1 DESCRIPTION
+
+MIME::Charset ã¯ã€ã‚¤ãƒ³ã‚¿ãƒ¼ãƒãƒƒãƒˆä¸Šã§ã® MIME
+メッセージã«ç”¨ã„ã‚‹ã‚ãƒ£ãƒ©ã‚¯ã‚¿ã‚»ãƒƒãƒˆã®æƒ
å ±ã‚’æä¾›ã™ã‚‹ã€‚
+
+=head2 定義
+
+B<ã‚ャラクタセット> ã¨ã¯ã€MIME ã§ã® ``character set'' ã®ã“ã¨ã§ã€
+オクテットã®åˆ—ã‚’æ–‡å—ã®åˆ—ã«å¤‰æ›ã™ã‚‹æ–¹æ³•を指ã™ã€‚
+ã“れã¯ã€ISO/IEC ã«ãŠã‘ã‚‹ ``符å·åŒ–æ–‡å—集åˆ'' (CCS) ã¨
+``æ–‡å—符åˆåŒ–法'' (CES) ã®ä¸¡æ–¹ã®æ¦‚念をåŒ
å«ã™ã‚‹
+(ã“ã®å®šç¾©ã¯ä¸æ£ç¢ºã‹ã‚‚ã—れã¾ã›ã‚“。
+よりæ£ç¢ºãªå®šç¾©ã‚’ã”å˜ã˜ã®æ–¹ã”指å—ãã ã•ã„)。
+
+B<エンコーディング> ã¨ã¯ã€MIME ã§ã®ãれã®ã“ã¨ã§ã€
+メッセージ本体やメッセージヘッダ本体をå°å—å¯èƒ½ãª
+US-ASCII æ–‡å—ã®åˆ—ã¨ã—ã¦è¡¨ç¾ã™ã‚‹æ–¹æ³•を指ã™ã€‚
+
+=over 4
+
+
+=cut
+
+=head2 コンストラクタ
+
+=item $charset = MIME::Charset->new([CHARSET [, OPTS]])
+
+ã‚ャラクタセットオブジェクトを作æˆã—ã¦è¿”ã™ã€‚
+
+OPTS ã«ã¯ä»¥ä¸‹ã®å¯¾ã‚’指定ã§ãる。
+B<NOTE>:
+Unicode/マルãƒãƒã‚¤ãƒˆå¯¾å¿œãŒæœ‰åйã«ãªã£ã¦ã„ãªã„ã¨ã (L<"USE_ENCODE"> å‚ç
§) ã¯ã€
+変æ›ã‚’行ã‚ãªã„ã®ã§ã€ä»¥ä¸‹ã®ã‚ªãƒ—ションã¯åŠ¹æžœã‚’æŒãŸãªã„。
+
+=over 4
+
+=item Mapping => MAPTYPE
+
+ã‚ャラクタセットåã«å¯¾ã—ã¦å®Ÿéš›ã«ä½¿ã†ãƒžãƒƒãƒ”ãƒ³ã‚°ã®æ‹¡å¼µã‚’ã™ã‚‹ã‹ã©ã†ã‹ã€‚
+C<"EXTENDED"> ã¯æ‹¡å¼µãƒžãƒƒãƒ”ングを使ã†ã€‚
+C<"STANDARD"> ã¯æ¨™æº–化ã•れã¦ã„る厳密ãªãƒžãƒƒãƒ”ングを使ã†ã€‚
+既定㯠C<"EXTENDED">。
+
+=back
+
+=cut
+
+=head2 キャラクタセット情報の取得
+
+=item $charset->body_encoding
+
+=item body_encoding CHARSET
+
+CHARSET ã®ãƒ¡ãƒƒã‚»ãƒ¼ã‚¸æœ¬ä½“ã§æŽ¨å¥¨ã•れるä¼é€ã‚¨ãƒ³ã‚³ãƒ¼ãƒ‡ã‚£ãƒ³ã‚°ã‚’å–å¾—ã™ã‚‹ã€‚
+
+返値㯠C<"B"> (BASE64)ã€C<"Q"> (QUOTED-PRINTABLE)ã€
+C<undef> (ä¼é€ã‚¨ãƒ³ã‚³ãƒ¼ãƒ‰ã—ãªãã¦ã‚ˆã„ --- 7BIT ã‹ 8BIT)
+ã®ã„ãšã‚Œã‹ã€‚ã“れã¯ãƒ¡ãƒƒã‚»ãƒ¼ã‚¸ãƒ˜ãƒƒãƒ€ã®ã‚¨ãƒ³ã‚³ãƒ¼ãƒ‡ã‚£ãƒ³ã‚°ã¨ã¯é•ã†ã“ã¨ã‚‚ã‚る。
+
+=cut
+
+=item $charset->as_string
+
+=item canonical_charset CHARSET
+
+ã‚ãƒ£ãƒ©ã‚¯ã‚¿ã‚»ãƒƒãƒˆã®æ£è¦ã®åå‰ã‚’å–å¾—ã™ã‚‹ã€‚
+
+=cut
+
+=item $charset->decoder
+
+ã‚ャラクタセットをデコードã™ã‚‹ã®ã«ä½¿ã†
+L<"Encode::Encoding"> オブジェクトを返ã™ã€‚
+
+=cut
+
+=item $charset->encoder([CHARSET])
+
+インターãƒãƒƒãƒˆä¸Šã® MIME
+メッセージã§ä½¿ã†ã“ã¨ã‚’推奨ã•れる互æ›ã‚ャラクタセットã§ã‚¨ãƒ³ã‚³ãƒ¼ãƒ‰ã™ã‚‹ã®ã«ä½¿ã†
+L<"Encode::Encoding"> オブジェクトを返ã™ã€‚
+
+=cut
+
+=item $charset->header_encoding
+
+=item header_encoding CHARSET
+
+CHARSET ã®ãƒ¡ãƒƒã‚»ãƒ¼ã‚¸ãƒ˜ãƒƒãƒ€ã§æŽ¨å¥¨ã•れるエンコーディング法をå–å¾—ã™ã‚‹ã€‚
+
+返値㯠C<"B">ã€C<"Q">ã€C<"S"> (ã©ã¡ã‚‰ã‹çŸããªã‚‹ã»ã†)ã€
+C<undef> (エンコードã—ãªãã¦ã‚ˆã„)
+ã®ã„ãšã‚Œã‹ã€‚ã“れã¯ãƒ¡ãƒƒã‚»ãƒ¼ã‚¸æœ¬ä½“ã®ã‚¨ãƒ³ã‚³ãƒ¼ãƒ‡ã‚£ãƒ³ã‚°ã¨ã¯é•ã†ã“ã¨ã‚‚ã‚る。
+
+
+=cut
+
+=item $charset->output_charset
+
+=item output_charset CHARSET
+
+指定ã—㟠CHARSET ã¨äº’æ›ã§ã€ã‚¤ãƒ³ã‚¿ãƒ¼ãƒãƒƒãƒˆä¸Šã®
+MIME メッセージã§ä½¿ã†ã“ã¨ã‚’推奨ã•れるã‚ャラクタセットåã‚’
+(当モジュールãŒçŸ¥ã£ã¦ã„れã°) å–å¾—ã™ã‚‹ã€‚
+
+Unicode/マルãƒãƒã‚¤ãƒˆå¯¾å¿œãŒæœ‰åйã«ãªã£ã¦ã„ãªã„ã¨ã (L<"USE_ENCODE"> å‚ç
§) ã¯ã€
+ã“ã®é–¢æ•°ã¯å˜ã« L<"canonical_charset"> ã®çµæžœã‚’è¿”ã™ã€‚
+
+
+=cut
+
+=head2 テキストデータの変換
+
+=item $charset->body_encode(STRING [, OPTS])
+
+=item body_encode STRING, CHARSET [, OPTS]
+
+STRING ã‚’ (å¿
è¦ãªã‚‰) 変æ›ã—ãŸãƒ‡ãƒ¼ã‚¿ã¨ã€
+ãƒ¡ãƒƒã‚»ãƒ¼ã‚¸æœ¬ä½“ã§æŽ¨å¥¨ã•れるä¼é€ã‚¨ãƒ³ã‚³ãƒ¼ãƒ‡ã‚£ãƒ³ã‚°ã‚’å–å¾—ã™ã‚‹ã€‚
+CHARSET 㯠STRING を符å·åŒ–ã—ã¦ã„ã‚‹ã‚ャラクタセット。
+
+OPTS ã«ã¯ä»¥ä¸‹ã®å¯¾ã‚’指定ã§ãる。
+B<NOTE>:
+Unicode/マルãƒãƒã‚¤ãƒˆå¯¾å¿œãŒæœ‰åйã«ãªã£ã¦ã„ãªã„ã¨ã (L<"USE_ENCODE"> å‚ç
§) ã¯ã€
+変æ›ã‚’行ã‚ãªã„ã®ã§ã€ä»¥ä¸‹ã®ã‚ªãƒ—ションã¯åŠ¹æžœã‚’æŒãŸãªã„。
+
+=over 4
+
+=item Replacement => REPLACEMENT
+
+ã‚¨ãƒ©ãƒ¼å‡¦ç†æ³•ã®æŒ‡å®šã€‚L<"エラー処ç†"> å‚ç
§ã€‚
+
+=item Detect7bit => YESNO
+
+CHARSET ãŒãªã„ã¨ãã€7ビットã®ã‚ャラクタセットを自動èªè˜ã—よã†ã¨ã™ã‚‹ã€‚
+既定㯠C<"YES">。
+
+=back
+
+3è¦ç´ ã®ãƒªã‚¹ãƒˆ (I<変æ›ãšã¿ã®æ–‡å—列>, I<出力ã®ã‚ャラクタセット>,
+I<ä¼é€ã‚¨ãƒ³ã‚³ãƒ¼ãƒ‡ã‚£ãƒ³ã‚°>) ãŒè¿”る。
+I<ä¼é€ã‚¨ãƒ³ã‚³ãƒ¼ãƒ‡ã‚£ãƒ³ã‚°> 㯠C<"BASE64">ã€C<"QUOTED-PRINTABLE">ã€
+C<"7BIT">ã€C<"8BIT"> ã®ã„ãšã‚Œã‹ã€‚I<出力ã®ã‚ャラクタセット> ãŒæ±ºå®šã§ããšã€
+I<変æ›ãšã¿ã®æ–‡å—列> ㌠ASCII以外ã®ãƒã‚¤ãƒˆã‚’å«ã‚€ã¨ãã¯ã€
+I<出力ã®ã‚ャラクタセット> 㯠C<undef>ã€I<ä¼é€ã‚¨ãƒ³ã‚³ãƒ¼ãƒ‡ã‚£ãƒ³ã‚°> 㯠C<"BASE64">
+ã¨ãªã‚‹ã€‚
+I<出力ã®ã‚ャラクタセット> ㌠C<"US-ASCII">
+ã¨ãªã‚‹ã®ã¯ã€æ–‡å—列㌠ASCII以外ã®ãƒã‚¤ãƒˆã‚’å«ã¾ãªã„ã¨ãã«é™ã‚‹ã€‚
+
+
+=cut
+
+=item $charset->decode(STRING [,CHECK])
+
+STRING ã‚’ Unicode æ–‡å—列ã«ãƒ‡ã‚³ãƒ¼ãƒ‰ã™ã‚‹ã€‚
+
+B<NOTE>:
+Unicode/マルãƒãƒã‚¤ãƒˆå¯¾å¿œãŒæœ‰åйã«ãªã£ã¦ã„ãªã„ã¨ã (L<"USE_ENCODE"> å‚ç
§) ã¯ã€
+ã“ã®æ©Ÿèƒ½ã‚’実行ã™ã‚‹ã¨æ»ã¬ã€‚
+
+=cut
+
+=item $charset->encode(STRING [, CHECK])
+
+STRING (Unicode æ–‡å—列ã¾ãŸã¯æ™®é€šã®æ–‡å—列) ã‚’ã€
+å
ƒã®ã‚ャラクタセットã¨äº’æ›ã§ã‚¤ãƒ³ã‚¿ãƒ¼ãƒãƒƒãƒˆä¸Šã®
+MIME メッセージã§ä½¿ã†ã“ã¨ã‚’推奨ã•れるã‚ャラクタセットを
+(当モジュールãŒçŸ¥ã£ã¦ã„れã°) 使ã£ã¦ã€ã‚¨ãƒ³ã‚³ãƒ¼ãƒ‰ã™ã‚‹ã€‚
+å
ƒã®ã‚ャラクタセットã¨äº’æ›ã‚ャラクタセットãŒåŒã˜ã§ã‚‚ã€
+æ–‡å—列をデコードã—ã¦ã‹ã‚‰ã‚¨ãƒ³ã‚³ãƒ¼ãƒ‰ã™ã‚‹ã“ã¨ã«æ³¨æ„。
+
+B<NOTE>:
+Unicode/マルãƒãƒã‚¤ãƒˆå¯¾å¿œãŒæœ‰åйã«ãªã£ã¦ã„ãªã„ã¨ã (L<"USE_ENCODE"> å‚ç
§) ã¯ã€
+ã“ã®æ©Ÿèƒ½ã‚’実行ã™ã‚‹ã¨æ»ã¬ã€‚
+
+=cut
+
+=item $charset->encoded_header_len(STRING [,ENCODING])
+
+=item encoded_header_len STRING, ENCODING, CHARSET
+
+STRING をメッセージヘッダã¨ã—ã¦ã‚¨ãƒ³ã‚³ãƒ¼ãƒ‰ã—ãŸã¨ãã®é•·ã•
+(行折りã¯ã—ãªã„ã¨ã—ã¦) ã‚’å–å¾—ã™ã‚‹ã€‚
+
+ENCODING 㯠C<"B">ã€C<"Q">ã€C<"S">
+(C<"B"> 㨠C<"Q"> ã®ã†ã¡çŸããªã‚‹ã»ã†) ã®ã„ãšã‚Œã‹ã€‚
+
+
+=cut
+
+=item $charset->header_encode(STRING [, OPTS])
+
+=item header_encode STRING, CHARSET [, OPTS]
+
+STRING ã‚’ (å¿
è¦ãªã‚‰) 変æ›ã—ãŸãƒ‡ãƒ¼ã‚¿ã¨ã€
+ãƒ¡ãƒƒã‚»ãƒ¼ã‚¸ãƒ˜ãƒƒãƒ€ã§æŽ¨å¥¨ã•れるエンコーディング法をå–å¾—ã™ã‚‹ã€‚
+CHARSET 㯠STRING を符å·åŒ–ã—ã¦ã„ã‚‹ã‚ャラクタセット。
+
+OPTS ã«ã¯ä»¥ä¸‹ã®å¯¾ã‚’指定ã§ãる。
+B<NOTE>:
+Unicode/マルãƒãƒã‚¤ãƒˆå¯¾å¿œãŒæœ‰åйã«ãªã£ã¦ã„ãªã„ã¨ã (L<"USE_ENCODE"> å‚ç
§) ã¯ã€
+変æ›ã‚’行ã‚ãªã„ã®ã§ã€ä»¥ä¸‹ã®ã‚ªãƒ—ションã¯åŠ¹æžœã‚’æŒãŸãªã„。
+
+=over 4
+
+=item Replacement => REPLACEMENT
+
+ã‚¨ãƒ©ãƒ¼å‡¦ç†æ³•ã®æŒ‡å®šã€‚L<"エラー処ç†"> å‚ç
§ã€‚
+
+=item Detect7bit => YESNO
+
+CHARSET ãŒãªã„ã¨ãã€7ビットã®ã‚ャラクタセットを自動èªè˜ã—よã†ã¨ã™ã‚‹ã€‚
+既定㯠C<"YES">。
+
+=back
+
+3è¦ç´ ã®ãƒªã‚¹ãƒˆ (I<変æ›ãšã¿ã®æ–‡å—列>, I<出力ã®ã‚ャラクタセット>,
+I<エンコーディング法>) ãŒè¿”る。
+I<エンコーディング法> 㯠C<"B">ã€C<"Q">ã€C<undef> (エンコードã—ãªãã¦ã‚ˆã„)
+ã®ã„ãšã‚Œã‹ã€‚
+I<出力ã®ã‚ャラクタセット> ãŒæ±ºå®šã§ããšã€I<変æ›ãšã¿ã®æ–‡å—列>
+㌠ASCII以外ã®ãƒã‚¤ãƒˆã‚’å«ã‚€ã¨ãã¯ã€I<出力ã®ã‚ャラクタセット> 㯠C<"8BIT">
+(ã“れã¯ã‚ャラクタセットã®åå‰ã§ã¯I<ãªã>ã€ã‚¨ãƒ³ã‚³ãƒ¼ãƒ‰ä¸å¯èƒ½ãªãƒ‡ãƒ¼ã‚¿ã‚’表ã™ç‰¹æ®Šå€¤)
+ã§ I<エンコーディング法> 㯠C<undef> (エンコードã™ã‚‹ã¹ãã§ã¯ãªã„) ã¨ãªã‚‹ã€‚
+I<出力ã®ã‚ャラクタセット> ㌠C<"US-ASCII">
+ã¨ãªã‚‹ã®ã¯ã€æ–‡å—列㌠ASCII以外ã®ãƒã‚¤ãƒˆã‚’å«ã¾ãªã„ã¨ãã«é™ã‚‹ã€‚
+
+=back
+
+
+=cut
+
+=item $charset->undecode(STRING [,CHECK])
+
+Unicode 文字列 STRING を、
+$charset の入力キャラクタセットを使って文字列に変換する。
+これは C<< $charset->decoder->encode() >> と同等である。
+
+B<NOTE>:
+Unicode/マルãƒãƒã‚¤ãƒˆå¯¾å¿œãŒæœ‰åйã«ãªã£ã¦ã„ãªã„ã¨ã (L<"USE_ENCODE"> å‚ç
§) ã¯ã€
+ã“ã®æ©Ÿèƒ½ã‚’実行ã™ã‚‹ã¨æ»ã¬ã€‚
+
+=cut
+
+=head2 モジュール既定値の操作
+
+=over 4
+
+=item alias ALIAS [, CHARSET]
+
+L<"canonical_charset"> ã§æ£è¦åを決定ã™ã‚‹ãŸã‚ã®ã‚ャラクタセットã®åˆ¥åã‚’å–å¾—/è¨å®šã™ã‚‹ã€‚
+
+CHARSET ãŒã‚ã£ã¦å½ã§ãªã„ã¨ãã€ALIAS ㌠CHARSET ã®åˆ¥åã«ç™»éŒ²ã•れる。
+ã•ã‚‚ãªã‘れã°ã€åˆ¥åã«å¤‰æ›´ã¯ãªã„。ã„ãšã‚Œã®å ´åˆã§ã‚‚ã€
+ç¾åœ¨ ALIAS ãŒç™»éŒ²ã•れã¦ã„ã‚‹ã‚ャラクタセットを返ã™ã€‚
+
+
+=cut
+
+=item default [CHARSET]
+
+既定ã‚ャラクタセットをå–å¾—/è¨å®šã™ã‚‹ã€‚
+
+B<既定ã‚ャラクタセット>ã¨ã¯ã€
+当モジュールã§ã€å‡¦ç†ã®ãŸã‚ã®ã‚ャラクタセットãŒä¸æ˜Žãªã¨ãã«ç”¨ã„ã‚‹ã‚ャラクタセット。
+当モジュールを利用ã™ã‚‹ãƒ¢ã‚¸ãƒ¥ãƒ¼ãƒ«ã§ã¯ã€
+処ç†ã®ãŸã‚ã®ã‚ャラクタセットãŒä¸æ˜Žãªã¨ãã‚„æš—é»™ã®æ—¢å®šå€¤ãŒå¿
è¦ãªã¨ãã€
+ã“ã®ã‚ャラクタセットを使ã†ã“ã¨ã‚’推奨ã™ã‚‹ã€‚
+ã“ã‚Œã¯æ—¢å®šã§ã¯ C<"US-ASCII">。
+
+CHARSET ãŒã‚ã£ã¦å½ã§ãªã‘れã°ã€ãれを既定ã‚ャラクタセットã«è¨å®šã™ã‚‹ã€‚
+ã•ã‚‚ãªã‘れã°ã€æ—¢å®šã‚ャラクタセットã¯å¤‰ã‚らãªã„。ã„ãšã‚Œã®å ´åˆã§ã‚‚ã€
+ç¾åœ¨ã®æ—¢å®šã‚ャラクタセットを返ã™ã€‚
+
+B<NOTE>: 既定ã‚ャラクタセットã¯å¤‰æ›´ã™ã‚‹I<ã¹ãã§ã¯ãªã„>。
+
+
+=cut
+
+=item fallback [CHARSET]
+
+予備ã‚ャラクタセットをå–å¾—/è¨å®šã™ã‚‹ã€‚
+
+B<予備ã‚ャラクタセット>ã¨ã¯ã€
+当モジュールã§ã€æŒ‡å®šã•れãŸã‚ャラクタセットã§ã®å¤‰æ›ãŒå¤±æ•—ã—ã€
+ã‚¨ãƒ©ãƒ¼å‡¦ç†æ³•ã« C<"FALLBACK"> ãŒæŒ‡å®šã•れã¦ã„ãŸã¨ãã«ç”¨ã„ã‚‹ã‚ャラクタセット。
+当モジュールを利用ã™ã‚‹ãƒ¢ã‚¸ãƒ¥ãƒ¼ãƒ«ã§ã¯ã€
+ã‚ャラクタセット変æ›ãŒå¤±æ•—ã™ã‚‹ã¨ãã«æœ€çµ‚手段ã¨ã—ã¦ã“ã®ã‚ャラクタセットを使ã£ã¦ã‚‚よã„。
+ã“ã‚Œã¯æ—¢å®šã§ã¯ C<"UTF-8">。
+
+CHARSET ãŒã‚ã£ã¦å½ã§ãªã‘れã°ã€ãれを予備ã‚ャラクタセットã«è¨å®šã™ã‚‹ã€‚
+CHARSET ㌠C<"NONE"> ã§ã‚れã°ã€äºˆå‚™ã‚ャラクタセットを未定ã«ã™ã‚‹ã€‚
+ã•ã‚‚ãªã‘れã°ã€äºˆå‚™ã‚ャラクタセットã¯å¤‰ã‚らãªã„。ã„ãšã‚Œã®å ´åˆã§ã‚‚ã€
+ç¾åœ¨ã®äºˆå‚™ã‚ャラクタセットを返ã™ã€‚
+
+B<NOTE>: 予備ã‚ャラクタセット㫠C<"US-ASCII"> を指定ã™ã‚‹ä¾¡å€¤ã¯I<ã‚ã‚‹>。
+変æ›ã®çµæžœã¯ã€ã‚ャラクタセットæƒ
å ±ãŒãªã„ã¨ãã‚‚å¯èªã¨ãªã‚‹ã€‚
+
+
+=cut
+
+=item recommended CHARSET [, HEADERENC, BODYENC [, ENCCHARSET]]
+
+ã‚ャラクタセットã®ç‰¹æ€§ã‚’å–å¾—/è¨å®šã™ã‚‹ã€‚
+
+å¿
é ˆã§ãªã„引数ãŒã‚ã£ã¦ãã®ã©ã‚Œã‹ãŒå½ã§ãªã‘れã°ã€
+ãã®å¼•æ•°ã§ CHARSET ã®ç‰¹æ€§ã‚’è¨å®šã™ã‚‹ã€‚ã•ã‚‚ãªã‘れã°ã€ç‰¹æ€§ã¯å¤‰ã‚らãªã„。
+ã„ãšã‚Œã®å ´åˆã§ã‚‚ã€CHARSET ã®ç¾åœ¨ã®ç‰¹æ€§ã‚’ 3 è¦ç´ ã®ãƒªã‚¹ãƒˆ
+(HEADERENC, BODYENC, ENCCHARSET) ã¨ã—ã¦è¿”ã™ã€‚
+
+HEADERENC ã¯ãƒ¡ãƒƒã‚»ãƒ¼ã‚¸ãƒ˜ãƒƒãƒ€ã§æŽ¨å¥¨ã•れるエンコーディング法。
+C<"B">ã€C<"Q">ã€C<"S"> (ã©ã¡ã‚‰ã‹çŸããªã‚‹ã»ã†)ã€
+C<undef> (エンコードã—ãªãã¦ã‚ˆã„) を指定ã§ãる。
+
+BODYENC ã¯ãƒ¡ãƒƒã‚»ãƒ¼ã‚¸æœ¬ä½“ã§æŽ¨å¥¨ã•れるä¼é€ã‚¨ãƒ³ã‚³ãƒ¼ãƒ‡ã‚£ãƒ³ã‚°ã€‚
+C<"B">ã€C<"Q">ã€C<undef> (ä¼é€ã‚¨ãƒ³ã‚³ãƒ¼ãƒ‰ã—ãªãã¦ã‚ˆã„) を指定ã§ãる。
+
+ENCCHARSET ã¯ã€æŒ‡å®šã—㟠CHARSET ã¨äº’æ›ã§ã€ã‚¤ãƒ³ã‚¿ãƒ¼ãƒãƒƒãƒˆä¸Šã®
+MIME メッセージã§ä½¿ã†ã“ã¨ã‚’推奨ã•れるã‚ャラクタセットå。
+変æ›ãŒå¿
è¦ãªã„ (ã¾ãŸã¯å½“モジュールãŒé©å½“ãªã‚ャラクタセットを知らãªã„) ã¨ãã¯ã€
+ENCCHARSET 㯠C<undef>。
+
+B<NOTE>: ã“ã®é–¢æ•°ã®ä»Šå¾Œã®ç‰ˆã§ã¯ã€ã»ã‹ã«ã‚‚å¿
é ˆã§ãªã„引数をã¨ã‚Œã‚‹ã‚ˆã†ã«ãªã‚‹ã‹ã‚‚ã—れãªã„
+(ãŸã¨ãˆã°ã€æ–‡å—å¹
ã€è¡Œåˆ†å‰²ã®æŒ™å‹•ãªã©ã«ã¤ã„ã¦ã®å±žæ€§)。
+ãã®ãŸã‚ã€è¿”値ã®å½¢å¼ã‚‚変ã‚ã‚‹ã‹ã‚‚ã—れãªã„。個ã€
ã®ç‰¹æ€§ã‚’å–å¾—ã™ã‚‹ã«ã¯
+L<"header_encoding">ã€L<"body_encoding">ã€L<"output_charset"> を使ã£ã¦ã»ã—ã„。
+
+
+=cut
+
+=head2 定数
+
+=item USE_ENCODE
+
+Unicode/マルãƒãƒã‚¤ãƒˆå¯¾å¿œãƒ•ラグ。
+Unicode ã¨ãƒžãƒ«ãƒãƒã‚¤ãƒˆã¸ã®å¯¾å¿œãŒæœ‰åйã«ãªã£ã¦ã„ã‚‹ã¨ãã¯ã€ç©ºã§ãªã„æ–‡å—列ãŒè¨å®šã•れã¦ã„る。
+ç¾åœ¨ã€ã“ã®ãƒ•ラグ㯠Perl 5.8.1 以é™ã§ç©ºã§ãªãã€ãれより以å‰ã® Perl ã§ã¯ç©ºã®æ–‡å—列。
+
+=head2 エラー処ç†
+
+L<"body_encode"> 㨠L<"header_encode"> ã®
+C<Replacement> オプションã«ã¯ä»¥ä¸‹ã®ã‚‚ã®ã‚’指定ã§ãã‚‹:
+
+=item C<"DEFAULT">
+
+䏿£ãªæ–‡å—ã‚’ç½®ãæ›ãˆæ–‡å—ã§ç½®ãæ›ãˆã‚‹ã€‚
+UCM ã«åŸºã¥ãエンコーダをæŒã¤ã‚ャラクタセットã§ã¯ <subchar> を使ã†ã€‚
+
+=item C<"FALLBACK">
+
+I<予備ã‚ャラクタセット> を使ã£ã¦ C<"DEFAULT"> æ–¹å¼ã‚’ã‚„ã£ã¦ã¿ã‚‹
+(L<"fallback"> å‚ç
§)。
+予備ã‚ãƒ£ãƒ©ã‚¯ã‚¿ã‚»ãƒƒãƒˆãŒæœªå®šã§å¤‰æ›ãŒã‚¨ãƒ©ãƒ¼ã‚’èµ·ã“ã—ãŸã¨ãã¯ã€
+コードã¯ã‚¨ãƒ©ãƒ¼ãƒ¡ãƒƒã‚»ãƒ¼ã‚¸ã‚’出力ã—ã¦æ»ã¬ã€‚
+
+=item C<"CROAK">
+
+コードã¯ã‚¨ãƒ©ãƒ¼ãƒ¡ãƒƒã‚»ãƒ¼ã‚¸ã‚’出力ã—ã¦ã™ãæ»ã¬ã€‚
+ã—ãŸãŒã£ã¦ã€æœ¬å½“ã«ã‚¨ãƒ©ãƒ¼ã§æ»ãªã›ãŸããªã‘れã°
+eval{} ã§è‡´å‘½çš„エラーをå—ã‘æ¢ã‚ãªã‘れã°ã„ã‘ãªã„。
+C<"STRICT"> ã§ã‚‚åŒã˜ã€‚
+
+=item C<"PERLQQ">
+
+=item C<"HTMLCREF">
+
+=item C<"XMLCREF">
+
+L<Encode> モジュールã§å®šç¾©ã—ã¦ã„ã‚‹
+C<FB_PERLQQ>ã€C<FB_HTMLCREF>ã€C<FB_XMLCREF>
+ã®æ–¹å¼ã‚’使ã†ã€‚
+
+=back
+
+ã‚¨ãƒ©ãƒ¼å‡¦ç†æ³•ãŒæŒ‡å®šã•れãªã„ã‹ã€ä¸Šè¨˜ä»¥å¤–ã®ã‚¨ãƒ©ãƒ¼å‡¦ç†æ³•ãŒæŒ‡å®šã•れãŸã¨ãã¯ã€
+C<"DEFAULT"> ã¨ã¿ãªã™ã€‚
+
+=head2 設定ファイル
+
+オプションã®ãƒ‘ラメタã®çµ„ã¿è¾¼ã¿æ—¢å®šå€¤ã¯ã€è¨å®šãƒ•ァイル
+F<MIME/Charset/Defaults.pm> ã§å¤‰æ›´ã™ã‚‹ã“ã¨ãŒã§ãる。
+詳ã—ã㯠F<MIME/Charset/Defaults.pm.sample> ã‚’èªã‚“ã§ã»ã—ã„。
+
+=head1 VERSION
+
+$VERSION 変数を見ã¦ã»ã—ã„。
+
+ã“ã®ãƒ¢ã‚¸ãƒ¥ãƒ¼ãƒ«ã®é–‹ç™ºç‰ˆãŒ
+L<http://hatuka.nezumi.nu/repos/MIME-Charset/> ã«ã‚る。
+
+=head1 SEE ALSO
+
+Multipurpose Internet Mail Extensions (MIME).
+
+=head1 AUTHORS
+
+Copyright (C) 2006-2008 Hatuka*nezumi - IKEDA Soji <hatuka(at)nezumi.nu>.
+
+All rights reserved. This program is free software; you can redistribute
+it and/or modify it under the same terms as Perl itself.
+
+
+=cut
Modified: branches/upstream/libmime-charset-perl/current/MANIFEST
URL: http://svn.debian.org/wsvn/branches/upstream/libmime-charset-perl/current/MANIFEST?rev=17939&op=diff
==============================================================================
--- branches/upstream/libmime-charset-perl/current/MANIFEST (original)
+++ branches/upstream/libmime-charset-perl/current/MANIFEST Mon Mar 24 05:33:16 2008
@@ -1,9 +1,9 @@
ARTISTIC
Changes
Charset.pm
-Charset-ja_JP.pod
Charset/_Compat.pm
Charset/Defaults.pm.sample
+Charset/JA_JP.pod
GPL
Makefile.PL
MANIFEST This list of files
Modified: branches/upstream/libmime-charset-perl/current/META.yml
URL: http://svn.debian.org/wsvn/branches/upstream/libmime-charset-perl/current/META.yml?rev=17939&op=diff
==============================================================================
--- branches/upstream/libmime-charset-perl/current/META.yml (original)
+++ branches/upstream/libmime-charset-perl/current/META.yml Mon Mar 24 05:33:16 2008
@@ -1,7 +1,7 @@
# http://module-build.sourceforge.net/META-spec.html
#XXXXXXX This is a prototype!!! It will change in the future!!! XXXXX#
name: MIME-Charset
-version: 1.001
+version: 1.002
version_from: Charset.pm
installdirs: site
requires:
Modified: branches/upstream/libmime-charset-perl/current/README
URL: http://svn.debian.org/wsvn/branches/upstream/libmime-charset-perl/current/README?rev=17939&op=diff
==============================================================================
--- branches/upstream/libmime-charset-perl/current/README (original)
+++ branches/upstream/libmime-charset-perl/current/README Mon Mar 24 05:33:16 2008
@@ -70,7 +70,7 @@
MIME::Charset provides informations about character sets used for MIME
messages on Internet.
- DEFINITIONS
+ Definitions
The charset is ``character set'' used in MIME to refer to a method of
converting a sequence of octets into a sequence of characters. It
includes both concepts of ``coded character set'' (CCS) and ``character
@@ -80,11 +80,20 @@
body part or a header body as sequence(s) of printable US-ASCII
characters.
- CONSTRUCTOR
- $charset = MIME::Charset->new(CHARSET)
- Create charset object from CHARSET.
-
- GETTING INFORMATIONS OF CHARSETS
+ Constructor
+ $charset = MIME::Charset->new([CHARSET [, OPTS]])
+ Create charset object.
+
+ OPTS may accept following key-value pairs. NOTE: When
+ Unicode/multibyte support is disabled (see "USE_ENCODE"), conversion
+ will not be performed. So these options do not have any effects.
+
+ Mapping => MAPTYPE
+ Specify extended mappings actually used for charset names.
+ "EXTENDED" uses extended mappings. "STANDARD" uses standardized
+ strict mappings. Default is "EXTENDED".
+
+ Getting Informations of Charsets
$charset->body_encoding
body_encoding CHARSET
Get recommended transfer-encoding of CHARSET for message body.
@@ -93,9 +102,16 @@
or "undef" (might not be transfer-encoded; either 7BIT or 8BIT).
This may not be same as encoding for message header.
- $charset->canonical_charset
+ $charset->as_string
canonical_charset CHARSET
- Get canonical name for charset CHARSET.
+ Get canonical name for charset.
+
+ $charset->decoder
+ Get "Encode::Encoding" object to decode strings by charset.
+
+ $charset->encoder([CHARSET])
+ Get "Encode::Encoding" object to encode Unicode string using
+ compatible charset recommended to be used for messages on Internet.
$charset->header_encoding
header_encoding CHARSET
@@ -114,7 +130,7 @@
When Unicode/multibyte support is disabled (see "USE_ENCODE"), this
function will simply return the result of "canonical_charset".
- TRANSLATING TEXT DATA
+ Translating Text Data
$charset->body_encode(STRING [, OPTS])
body_encode STRING, CHARSET [, OPTS]
Get converted (if needed) data of STRING and recommended
@@ -140,6 +156,21 @@
*transfer-encoding* will be "BASE64". *Charset for output* will be
"US-ASCII" if and only if string does not contain any non-ASCII
bytes.
+
+ $charset->decode(STRING [,CHECK])
+ Decode STRING to Unicode.
+
+ Note: When Unicode/multibyte support is disabled (see "USE_ENCODE"),
+ this function will die.
+
+ $charset->encode(STRING [,CHECK])
+ Encode STRING (Unicode or non-Unicode) using compatible charset
+ recommended to be used for messages on Internet (if this module
+ knows it). Note that string will be decoded then encoded even if
+ compatible charset was equal to original charset.
+
+ Note: When Unicode/multibyte support is disabled (see "USE_ENCODE"),
+ this function will die.
$charset->encoded_header_len(STRING [, ENCODING])
encoded_header_len STRING, ENCODING, CHARSET
@@ -175,7 +206,14 @@
be "US-ASCII" if and only if string does not contain any non-ASCII
bytes.
- MANIPULATING MODULE DEFAULTS
+ $charset->undecode(STRING [,CHECK])
+ Encode Unicode string STRING to byte string by input charset of
+ $charset. This is equivalent to "$charset->decoder->encode()".
+
+ Note: When Unicode/multibyte support is disabled (see "USE_ENCODE"),
+ this function will die.
+
+ Manipulating Module Defaults
alias ALIAS [, CHARSET]
Get/set charset alias for canonical names determined by
"canonical_charset".
@@ -242,14 +280,14 @@
changed. Use "header_encoding", "body_encoding" or "output_charset"
to get particular profile.
- CONSTANTS
+ Constants
USE_ENCODE
- Unicode/multibyte support flag. Non-null string will be set when
+ Unicode/multibyte support flag. Non-empty string will be set when
Unicode and multibyte support is enabled. Currently, this flag will
- be non-null on Perl 5.8.1 or later and null string on earlier
+ be non-empty on Perl 5.8.1 or later and empty string on earlier
versions of Perl.
- ERROR HANDLING
+ Error Handling
"body_encode" and "header_encode" accept following "Replacement"
options:
@@ -276,6 +314,11 @@
If error handling scheme is not specified or unknown scheme is
specified, "DEFAULT" will be assumed.
+ Configuration File
+ Built-in defaults for option parameters can be overridden by
+ configuration file: MIME/Charset/Defaults.pm. For more details read
+ MIME/Charset/Defaults.pm.sample.
+
VERSION
Consult $VERSION variable.
More information about the Pkg-perl-cvs-commits
mailing list