From 1f7c763124bf7f059eafdbaa4da485e06fd7ec21 Mon Sep 17 00:00:00 2001 From: piaolingxue Date: Wed, 26 Mar 2014 10:51:05 +0800 Subject: [PATCH] update wiki, and build script --- README.org | 20 +++++++++++++++++++ bin/build.sh | 6 ++++++ .../analysis/jieba/JiebaSegmenterTest.java | 2 +- 3 files changed, 27 insertions(+), 1 deletion(-) create mode 100755 bin/build.sh diff --git a/README.org b/README.org index 578e4cb..7923f04 100644 --- a/README.org +++ b/README.org @@ -11,8 +11,17 @@ ** 支持分词模式 - Search模式,用于对用户查询词分词 - Index模式,用于对索引文档分词 + +** 特性 + - 支持多种分词模式 + - 全角统一转成半角 + - 用户词典功能 + - conf 目录有整理的搜狗细胞词库 + - 支持词性标注(感谢 [[https://github.com/linkerlin][@linkerlin]] 的贡献) + * 如何获取 + - 当前稳定版本 #+BEGIN_SRC xml com.huaban @@ -21,6 +30,17 @@ #+END_SRC + - 当前快照版本 + - 支持词性标注 [[https://github.com/huaban/jieba-analysis/pull/4][#4]] + - 修复以'-'连接词分词错误问题 [[https://github.com/huaban/jieba-analysis/issues/3][#3]] + #+BEGIN_SRC xml + + com.huaban + jieba-analysis + 1.0.0-SNAPSHOT + + #+END_SRC + * 如何使用 - Demo diff --git a/bin/build.sh b/bin/build.sh new file mode 100755 index 0000000..786850e --- /dev/null +++ b/bin/build.sh @@ -0,0 +1,6 @@ +#!/bin/bash + +ROOT=`dirname $0` +cd $ROOT/.. +mvn package install -DcreateChecksum=true -DskipTests + diff --git a/src/test/java/com/huaban/analysis/jieba/JiebaSegmenterTest.java b/src/test/java/com/huaban/analysis/jieba/JiebaSegmenterTest.java index efe6a56..9a947d9 100644 --- a/src/test/java/com/huaban/analysis/jieba/JiebaSegmenterTest.java +++ b/src/test/java/com/huaban/analysis/jieba/JiebaSegmenterTest.java @@ -145,7 +145,7 @@ public void testCutForIndex() { public void testBugSentence() { String[] bugs = new String[] { - "utf-8", + "UTF-8", "iphone5", "鲜芋仙 3", "RT @laoshipukong : 27日,",