about | summary | refs | log | tree | commit | diff
path: root/textproc/rubygem-whatlanguage
diff options
context:
space:
mode:
author: Joseph Mingrone <jrm@FreeBSD.org> 2017-04-26 19:33:45 +0000
committer: Joseph Mingrone <jrm@FreeBSD.org> 2017-04-26 19:33:45 +0000
commit: 8a4e16c9ca603cf81bd8c3919d21ebdb0ebf5fa2 (patch)
tree: 93c676982f746bf79a3592048ffb4c6530d5573a /textproc/rubygem-whatlanguage
parent: 2250b4a2bf8ee587b747bfd174e4482c9568f215 (diff)
download: ports-8a4e16c9ca603cf81bd8c3919d21ebdb0ebf5fa2.tar.gz
ports-8a4e16c9ca603cf81bd8c3919d21ebdb0ebf5fa2.zip
Notes
Diffstat (limited to 'textproc/rubygem-whatlanguage')
-rw-r--r-- textproc/rubygem-whatlanguage/Makefile 19
-rw-r--r-- textproc/rubygem-whatlanguage/distinfo 3
-rw-r--r-- textproc/rubygem-whatlanguage/pkg-descr 10
3 files changed, 32 insertions, 0 deletions
diff --git a/textproc/rubygem-whatlanguage/Makefile b/textproc/rubygem-whatlanguage/Makefile
new file mode 100644
index 000000000000..faf74dc4f3e8
--- /dev/null
+++ b/textproc/rubygem-whatlanguage/Makefile
@@ -0,0 +1,19 @@
+# $FreeBSD$
+
+PORTNAME= whatlanguage
+PORTVERSION= 1.0.6
+CATEGORIES= textproc rubygems
+MASTER_SITES= RG
+
+MAINTAINER= jrm@FreeBSD.org
+COMMENT= Natural language detection for text samples
+
+LICENSE= MIT
+LICENSE_FILE= ${WRKSRC}/LICENSE.txt
+
+NO_ARCH= yes
+
+USE_RUBY= yes
+USES= gem
+
+.include <bsd.port.mk>
diff --git a/textproc/rubygem-whatlanguage/distinfo b/textproc/rubygem-whatlanguage/distinfo
new file mode 100644
index 000000000000..033f982ad8ec
--- /dev/null
+++ b/textproc/rubygem-whatlanguage/distinfo
@@ -0,0 +1,3 @@
+TIMESTAMP = 1493234905
+SHA256 (rubygem/whatlanguage-1.0.6.gem) = 2f3410f4c2cc50eb582640e01b2d18c478fc7a95a3d1bcfc5d8ea05a1f68fd69
+SIZE (rubygem/whatlanguage-1.0.6.gem) = 2982400
diff --git a/textproc/rubygem-whatlanguage/pkg-descr b/textproc/rubygem-whatlanguage/pkg-descr
new file mode 100644
index 000000000000..37c247cd1265
--- /dev/null
+++ b/textproc/rubygem-whatlanguage/pkg-descr
@@ -0,0 +1,10 @@
+WhatLanguage, written in pure-Ruby, detects the human language of supplied text.
+It uses Bloom filters, so it is fast and memory efficient. It works well on
+text of over 10 words in length (e.g. blog posts or comments) and very poorly on
+short or Twitter-esque text.
+
+It works with Arabic, Dutch, English, Farsi, Finnish, French, German, Greek,
+Hebrew, Hungarian, Italian, Korean, Norwegian, Pinyin, Polish, Portuguese,
+Russian, Spanish, and Swedish out of the box.
+
+WWW: https://github.com/peterc/whatlanguage