r55530 - in /branches/upstream/libhtml-parser-perl/current: Changes META.yml Parser.pm hparser.c lib/HTML/Entities.pm lib/HTML/HeadParser.pm t/entities.t
carnil-guest at users.alioth.debian.org
carnil-guest at users.alioth.debian.org
Tue Apr 6 19:02:17 UTC 2010
Author: carnil-guest
Date: Tue Apr 6 19:01:44 2010
New Revision: 55530
URL: http://svn.debian.org/wsvn/pkg-perl/?sc=1&rev=55530
Log:
[svn-upgrade] Integrating new upstream version, libhtml-parser-perl (3.65)
Modified:
branches/upstream/libhtml-parser-perl/current/Changes
branches/upstream/libhtml-parser-perl/current/META.yml
branches/upstream/libhtml-parser-perl/current/Parser.pm
branches/upstream/libhtml-parser-perl/current/hparser.c
branches/upstream/libhtml-parser-perl/current/lib/HTML/Entities.pm
branches/upstream/libhtml-parser-perl/current/lib/HTML/HeadParser.pm
branches/upstream/libhtml-parser-perl/current/t/entities.t
Modified: branches/upstream/libhtml-parser-perl/current/Changes
URL: http://svn.debian.org/wsvn/pkg-perl/branches/upstream/libhtml-parser-perl/current/Changes?rev=55530&op=diff
==============================================================================
--- branches/upstream/libhtml-parser-perl/current/Changes (original)
+++ branches/upstream/libhtml-parser-perl/current/Changes Tue Apr 6 19:01:44 2010
@@ -1,3 +1,16 @@
+_______________________________________________________________________________
+2010-04-04 Release 3.65
+
+Gisle Aas (1):
+ Eliminate buggy entities_decode_old
+
+Salvatore Bonaccorso (1):
+ Fixed endianness typo [RT#50811]
+
+Ville Skyttä (1):
+ Documentation fixes.
+
+
_______________________________________________________________________________
2009-10-25 Release 3.64
Modified: branches/upstream/libhtml-parser-perl/current/META.yml
URL: http://svn.debian.org/wsvn/pkg-perl/branches/upstream/libhtml-parser-perl/current/META.yml?rev=55530&op=diff
==============================================================================
--- branches/upstream/libhtml-parser-perl/current/META.yml (original)
+++ branches/upstream/libhtml-parser-perl/current/META.yml Tue Apr 6 19:01:44 2010
@@ -1,6 +1,6 @@
--- #YAML:1.0
name: HTML-Parser
-version: 3.64
+version: 3.65
abstract: HTML parser class
author:
- Gisle Aas <gisle at activestate.com>
@@ -22,7 +22,7 @@
directory:
- t
- inc
-generated_by: ExtUtils::MakeMaker version 6.55_02
+generated_by: ExtUtils::MakeMaker version 6.56
meta-spec:
url: http://module-build.sourceforge.net/META-spec-v1.4.html
version: 1.4
Modified: branches/upstream/libhtml-parser-perl/current/Parser.pm
URL: http://svn.debian.org/wsvn/pkg-perl/branches/upstream/libhtml-parser-perl/current/Parser.pm?rev=55530&op=diff
==============================================================================
--- branches/upstream/libhtml-parser-perl/current/Parser.pm (original)
+++ branches/upstream/libhtml-parser-perl/current/Parser.pm Tue Apr 6 19:01:44 2010
@@ -9,7 +9,7 @@
use strict;
use vars qw($VERSION @ISA);
-$VERSION = "3.64";
+$VERSION = "3.65";
require HTML::Entities;
@@ -891,7 +891,7 @@
Example:
<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01//EN"
- "http://www.w3.org/TR/html40/strict.dtd">
+ "http://www.w3.org/TR/html4/strict.dtd">
DTDs inside <!DOCTYPE ...> will confuse HTML::Parser.
@@ -954,7 +954,7 @@
=head2 Unicode
-The C<HTML::Parser> can parse Unicode strings when running under
+C<HTML::Parser> can parse Unicode strings when running under
perl-5.8 or better. If Unicode is passed to $p->parse() then chunks
of Unicode will be reported to the handlers. The offset and length
argspecs will also report their position in terms of characters.
@@ -1224,10 +1224,10 @@
L<HTML::TreeBuilder> (part of the I<HTML-Tree> distribution)
-http://www.w3.org/TR/html4
+L<http://www.w3.org/TR/html4/>
More information about marked sections and processing instructions may
-be found at C<http://www.sgml.u-net.com/book/sgml-8.htm>.
+be found at L<http://www.is-thought.co.uk/book/sgml-8.htm>.
=head1 COPYRIGHT
Modified: branches/upstream/libhtml-parser-perl/current/hparser.c
URL: http://svn.debian.org/wsvn/pkg-perl/branches/upstream/libhtml-parser-perl/current/hparser.c?rev=55530&op=diff
==============================================================================
--- branches/upstream/libhtml-parser-perl/current/hparser.c (original)
+++ branches/upstream/libhtml-parser-perl/current/hparser.c Tue Apr 6 19:01:44 2010
@@ -1847,7 +1847,7 @@
warn("Parsing of undecoded UTF-8 will give garbage when decoding entities");
}
if (utf8 && len >= 2 && strnEQ(beg, "\xFF\xFE", 2)) {
- warn("Parsing string decoded with wrong endianess");
+ warn("Parsing string decoded with wrong endianness");
}
#endif
if (!utf8 && len >= 4 &&
Modified: branches/upstream/libhtml-parser-perl/current/lib/HTML/Entities.pm
URL: http://svn.debian.org/wsvn/pkg-perl/branches/upstream/libhtml-parser-perl/current/lib/HTML/Entities.pm?rev=55530&op=diff
==============================================================================
--- branches/upstream/libhtml-parser-perl/current/lib/HTML/Entities.pm (original)
+++ branches/upstream/libhtml-parser-perl/current/lib/HTML/Entities.pm Tue Apr 6 19:01:44 2010
@@ -434,23 +434,6 @@
my %subst; # compiled encoding regexps
-sub decode_entities_old
-{
- my $array;
- if (defined wantarray) {
- $array = [@_]; # copy
- } else {
- $array = \@_; # modify in-place
- }
- my $c;
- for (@$array) {
- s/(&\#(\d+);?)/$2 < 256 ? chr($2) : $1/eg;
- s/(&\#[xX]([0-9a-fA-F]+);?)/$c = hex($2); $c < 256 ? chr($c) : $1/eg;
- s/(&(\w+);?)/$entity2char{$2} || $1/eg;
- }
- wantarray ? @$array : $array->[0];
-}
-
sub encode_entities
{
return undef unless defined $_[0];
Modified: branches/upstream/libhtml-parser-perl/current/lib/HTML/HeadParser.pm
URL: http://svn.debian.org/wsvn/pkg-perl/branches/upstream/libhtml-parser-perl/current/lib/HTML/HeadParser.pm?rev=55530&op=diff
==============================================================================
--- branches/upstream/libhtml-parser-perl/current/lib/HTML/HeadParser.pm (original)
+++ branches/upstream/libhtml-parser-perl/current/lib/HTML/HeadParser.pm Tue Apr 6 19:01:44 2010
@@ -178,7 +178,10 @@
# <!ENTITY % head.content "TITLE & BASE?">
# <!ELEMENT HEAD O O (%head.content;) +(%head.misc;)>
#
-# Added in HTML 5 as of WD-html5-20090423: noscript, command
+# From HTML 5 as of WD-html5-20090825:
+#
+# One or more elements of metadata content, [...]
+# => base, command, link, meta, noscript, script, style, title
sub start
{
Modified: branches/upstream/libhtml-parser-perl/current/t/entities.t
URL: http://svn.debian.org/wsvn/pkg-perl/branches/upstream/libhtml-parser-perl/current/t/entities.t?rev=55530&op=diff
==============================================================================
--- branches/upstream/libhtml-parser-perl/current/t/entities.t (original)
+++ branches/upstream/libhtml-parser-perl/current/t/entities.t Tue Apr 6 19:01:44 2010
@@ -1,6 +1,6 @@
use HTML::Entities qw(decode_entities encode_entities encode_entities_numeric);
-use Test::More tests => 17;
+use Test::More tests => 18;
$a = "Våre norske tegn bør æres";
@@ -73,6 +73,8 @@
is(decode_entities("Attention Home&#959;&#969;n&#1257;rs...1&#1109;t T&#1110;&#1084;e E&#957;&#1257;&#1075;"),
"Attention Home\x{3BF}\x{3C9}n\x{4E9}rs...1\x{455}t T\x{456}\x{43C}e E\x{3BD}\x{4E9}\x{433}");
+is(decode_entities("{&#38;amp;&#x26;amp;&amp; also &#x42f;&#339;}"),
+ "{&amp;&amp;& also \x{42F}\x{153}}");
__END__
# Quoted from rfc1866.txt
More information about the Pkg-perl-cvs-commits
mailing list