[DRE-commits] [SCM] bsfilter.git branch, master, updated. debian/1%1.0.17-2-15-g15ef7f6
Taku YASUI
tach at debian.org
Sun Jun 17 15:49:50 UTC 2012
The following commit has been merged into the master branch:
commit a6181296af9a55cdea0f9c7e8d27d28ee4023d5f
Author: Taku YASUI <tach at debian.org>
Date: Sun Jun 17 22:20:36 2012 +0900
Add debian/patches/010_disable_chasen to disable the chasen tokenizer.
diff --git a/debian/changelog b/debian/changelog
index 3b0cd17..6ac9c23 100644
--- a/debian/changelog
+++ b/debian/changelog
@@ -5,6 +5,7 @@ bsfilter (1:1.0.17-3) UNRELEASED; urgency=low
* debian/copyright: Convert to the Debian copyright format version 1.0.
* debian/docs: Add HTML document to the package.
* debian/rules: Add to run test suite.
+ * Add debian/patches/010_disable_chasen not to use chasen.
-- Taku YASUI <tach at debian.org> Sun, 17 Jun 2012 21:54:15 +0900
diff --git a/debian/patches/debian-changes-1:1.0.17-1 b/debian/patches/000_debian-changes-1:1.0.17-1
similarity index 100%
rename from debian/patches/debian-changes-1:1.0.17-1
rename to debian/patches/000_debian-changes-1:1.0.17-1
diff --git a/debian/patches/010_disable_chasen b/debian/patches/010_disable_chasen
new file mode 100644
index 0000000..7902124
--- /dev/null
+++ b/debian/patches/010_disable_chasen
@@ -0,0 +1,112 @@
+--- a/bsfilter/bsfilter
++++ b/bsfilter/bsfilter
+@@ -1,4 +1,4 @@
+-#! /usr/bin/env ruby
++#! /usr/bin/ruby1.8
+ ## -*-Ruby-*- $Id: bsfilter,v 1.86 2010/11/20 10:07:45 nabeken Exp $
+ ## Copyright (C) 2003, 2004, 2005, 2006 NABEYA Kenichi
+ ##
+@@ -1057,9 +1057,6 @@
+ else
+ @m = MeCab::Tagger.new([$0, "-Ochasen"])
+ end
+- when "chasen"
+- Chasen.getopt("-F", '%H %m\n', "-j")
+- @method = Proc::new {|s| chasen(s)}
+ when "kakasi"
+ @method = Proc::new {|s| kakasi(s)}
+ else
+@@ -1123,31 +1120,6 @@
+ return array
+ end
+
+- def chasen(str)
+- str = str.gsub(/[\x00-\x7f]/, ' ')
+- if (str =~ /\A +\z/)
+- return []
+- end
+- array = Array::new
+- Chasen.sparse(str).split("\n").each do |hinshi_token|
+- if (hinshi_token =~ /(.*) (.*)/)
+- hinshi = $1
+- token = $2
+- if (hinshi == "\xcc\xbe\xbb\xec")
+- if ((token =~ Reg_kanji_katakana) || (token.length > 2))
+- array.push(token)
+- end
+- else
+- token.gsub!(Reg_not_kanji_katakana, '')
+- if ((token =~ Reg_kanji) || (token.length > 2))
+- array.push(token)
+- end
+- end
+- end
+- end
+- return array
+- end
+-
+ def block(str)
+ tokens = str.scan(Reg_kanji)
+ tokens.concat(str.scan(Reg_katakana))
+@@ -1960,7 +1932,7 @@
+ specify the name of database type
+ "sdbm" by default
+
+- --jtokenizer|-j bigram|block|mecab|chasen|kakasi
++ --jtokenizer|-j bigram|block|mecab|kakasi
+ specify algorithm of a tokenizer for Japanese language
+ "bigram" by default
+
+@@ -3144,8 +3116,6 @@
+ when "block"
+ when "mecab"
+ require 'MeCab'
+- when "chasen"
+- require 'chasen.o'
+ when "kakasi"
+ require 'kakasi'
+ else
+--- a/test/test.rb
++++ b/test/test.rb
+@@ -217,14 +217,9 @@
+ @bsfilter2.setup($default_options + ["--jtokenizer", "bigram"])
+ @bsfilter2.use_dummyfh
+
+- @bsfilter3 = Bsfilter::new
+- @bsfilter3.setup($default_options + ["--jtokenizer", "chasen"])
+- @bsfilter3.use_dummyfh
+-
+ @bsfilter0.run(@files)
+ @bsfilter1.run(@files)
+ @bsfilter2.run(@files)
+- @bsfilter3.run(@files)
+
+ assert_equal(1, @bsfilter0.count_message(/tokenizer ja body Ä«´é/), "@bsfilter0 2letters")
+ assert_equal(0, @bsfilter0.count_message(/tokenizer ja body ¸þÆü°ª/), "@bsfilter0 3letters")
+@@ -234,9 +229,6 @@
+
+ assert_equal(1, @bsfilter2.count_message(/tokenizer ja body Ä«´é/), "@bsfilter2 2letters")
+ assert_equal(0, @bsfilter2.count_message(/tokenizer ja body ¸þÆü°ª/), "@bsfilter2 3letters")
+-
+- assert_equal(1, @bsfilter3.count_message(/tokenizer ja body Ä«´é/), "@bsfilter3 2letters")
+- assert_equal(1, @bsfilter3.count_message(/tokenizer ja body ¸þÆü°ª/), "@bsfilter3 3letters")
+ end
+
+ def teardown
+@@ -325,16 +317,6 @@
+ end
+ @bsfilter.use_dummyfh
+ @bsfilter.run(@files)
+- assert_equal(1, @bsfilter.count_message(/tokenizer ja body Ä«´é/), "2 letters")
+- assert_equal(1, @bsfilter.count_message(/tokenizer ja body ¸þÆü°ª/), "3 letters")
+- end
+-
+- def test_chasen
+- assert_nothing_raised('Warning: ignore this test if chasen is NOT installed') do
+- @bsfilter.setup($default_options + ["--jtokenizer", "chasen"])
+- end
+- @bsfilter.use_dummyfh
+- @bsfilter.run(@files)
+ assert_equal(1, @bsfilter.count_message(/tokenizer ja body Ä«´é/), "2 letters")
+ assert_equal(1, @bsfilter.count_message(/tokenizer ja body ¸þÆü°ª/), "3 letters")
+ end
diff --git a/debian/patches/series b/debian/patches/series
index 29ff1be..778ff65 100644
--- a/debian/patches/series
+++ b/debian/patches/series
@@ -1 +1,2 @@
-debian-changes-1:1.0.17-1
+000_debian-changes-1:1.0.17-1
+010_disable_chasen
--
bsfilter.git
More information about the Pkg-ruby-extras-commits
mailing list