about summary refs log tree commit diff stats
path: root/textproc/scws
diff options
context:
space:
mode:
author tz <tz@FreeBSD.org> 2017-07-17 18:16:04 +0800
committer tz <tz@FreeBSD.org> 2017-07-17 18:16:04 +0800
commit bb110a423cf7cc5090713301453c3dd4d8d8d29b (patch)
tree 071bac40e8f1c75bdd32863df5e5fd3c54f24d37 /textproc/scws
parent 4b0e5ef02d24cf7fb1e164d4ad1cfabeb3a7b81e (diff)
download freebsd-ports-gnome-bb110a423cf7cc5090713301453c3dd4d8d8d29b.tar.gz
freebsd-ports-gnome-bb110a423cf7cc5090713301453c3dd4d8d8d29b.tar.zst
freebsd-ports-gnome-bb110a423cf7cc5090713301453c3dd4d8d8d29b.zip
New port: textproc/scws
SCWS (Simple Chinese Word Segmentation) is a frequency-dictionary-based Chinese word segmentation engine that can cut a whole section of Chinese text into words. A word is the smallest unit of morpheme in Chinese, but in Chinese words are not separated by spaces, so word segmentation is an important step in Chinese language processing. SCWS is written in C without other dependencies and accepts GBK and UTF-8 encodings for both Simplified Chinese (zh_CN) and Traditional Chinese (such as zh_TW). WWW: http://www.xunsearch.com/scws/index.php PR: 219132 Submitted by: Jov <amutu@amutu.com>
Diffstat (limited to 'textproc/scws')
-rw-r--r-- textproc/scws/Makefile 23
-rw-r--r-- textproc/scws/distinfo 3
-rw-r--r-- textproc/scws/pkg-descr 9
-rw-r--r-- textproc/scws/pkg-plist 19
4 files changed, 54 insertions, 0 deletions
diff --git a/textproc/scws/Makefile b/textproc/scws/Makefile
new file mode 100644
index 000000000000..a743b9016f98
--- /dev/null
+++ b/textproc/scws/Makefile
@@ -0,0 +1,23 @@
+# Created by: Jov <amutu@amutu.com>
+# $FreeBSD$
+
+PORTNAME= scws
+PORTVERSION= 1.2.3
+CATEGORIES= textproc
+MASTER_SITES= http://www.xunsearch.com/scws/down/
+
+MAINTAINER= amutu@amutu.com
+COMMENT= Simple Chinese word segmentation program and lib
+
+LICENSE= BSD2CLAUSE
+
+GNU_CONFIGURE= yes
+USES= gmake libtool:keepla tar:bzip2
+USE_LDCONFIG= yes
+
+CONFIGURE_ARGS= --sysconfdir=${PREFIX}/etc/scws \
+ --with-pic
+
+INSTALL_TARGET=install-strip
+
+.include <bsd.port.mk>
diff --git a/textproc/scws/distinfo b/textproc/scws/distinfo
new file mode 100644
index 000000000000..21f12bce846d
--- /dev/null
+++ b/textproc/scws/distinfo
@@ -0,0 +1,3 @@
+TIMESTAMP = 1494223276
+SHA256 (scws-1.2.3.tar.bz2) = 60d50ac3dc42cff3c0b16cb1cfee47d8cb8c8baa142a58bc62854477b81f1af5
+SIZE (scws-1.2.3.tar.bz2) = 485903
diff --git a/textproc/scws/pkg-descr b/textproc/scws/pkg-descr
new file mode 100644
index 000000000000..5f677364e24d
--- /dev/null
+++ b/textproc/scws/pkg-descr
@@ -0,0 +1,9 @@
+SCWS (Simple Chinese Word Segmentation) is a frequency-dictionary-based Chinese
+word segmentation engine that can cut a whole section of Chinese text into
+words. A word is the smallest unit of morpheme in Chinese, but in Chinese words
+are not separated by spaces, so word segmentation is an important step in
+Chinese language processing. SCWS is written in C without other dependencies
+and accepts GBK and UTF-8 encodings for both Simplified Chinese (zh_CN) and
+Traditional Chinese (such as zh_TW).
+
+WWW: http://www.xunsearch.com/scws/index.php
diff --git a/textproc/scws/pkg-plist b/textproc/scws/pkg-plist
new file mode 100644
index 000000000000..e7ac8bfbd039
--- /dev/null
+++ b/textproc/scws/pkg-plist
@@ -0,0 +1,19 @@
+bin/scws
+bin/scws-gen-dict
+%%ETCDIR%%/rules.ini
+%%ETCDIR%%/rules.utf8.ini
+%%ETCDIR%%/rules_cht.utf8.ini
+include/scws/charset.h
+include/scws/crc32.h
+include/scws/darray.h
+include/scws/pool.h
+include/scws/rule.h
+include/scws/scws.h
+include/scws/version.h
+include/scws/xdb.h
+include/scws/xdict.h
+include/scws/xtree.h
+lib/libscws.la
+lib/libscws.so
+lib/libscws.so.1
+lib/libscws.so.1.1.0