From 8a4e16c9ca603cf81bd8c3919d21ebdb0ebf5fa2 Mon Sep 17 00:00:00 2001
From: Joseph Mingrone
Date: Wed, 26 Apr 2017 19:33:45 +0000
Subject: textproc/rubygem-whatlanguage: Natural language detection for text
 samples

Adding textproc/rubygem-whatlanguage, because it is a dependency for the
upcoming port, net-im/mastodon.

Approved by:	swills (mentor, implicit)
---
 textproc/Makefile                       |  1 +
 textproc/rubygem-whatlanguage/Makefile  | 19 +++++++++++++++++++
 textproc/rubygem-whatlanguage/distinfo  |  3 +++
 textproc/rubygem-whatlanguage/pkg-descr | 10 ++++++++++
 4 files changed, 33 insertions(+)
 create mode 100644 textproc/rubygem-whatlanguage/Makefile
 create mode 100644 textproc/rubygem-whatlanguage/distinfo
 create mode 100644 textproc/rubygem-whatlanguage/pkg-descr

(limited to 'textproc')

diff --git a/textproc/Makefile b/textproc/Makefile
index 7f3a65c81980..f977386338ef 100644
--- a/textproc/Makefile
+++ b/textproc/Makefile
@@ -1563,6 +1563,7 @@
     SUBDIR += rubygem-unf
     SUBDIR += rubygem-unf_ext
     SUBDIR += rubygem-version_sorter
+    SUBDIR += rubygem-whatlanguage
     SUBDIR += rubygem-wikicloth
     SUBDIR += rubygem-xml-simple
     SUBDIR += rubygem-ya2yaml
diff --git a/textproc/rubygem-whatlanguage/Makefile b/textproc/rubygem-whatlanguage/Makefile
new file mode 100644
index 000000000000..faf74dc4f3e8
--- /dev/null
+++ b/textproc/rubygem-whatlanguage/Makefile
@@ -0,0 +1,19 @@
+# $FreeBSD$
+
+PORTNAME=	whatlanguage
+PORTVERSION=	1.0.6
+CATEGORIES=	textproc rubygems
+MASTER_SITES=	RG
+
+MAINTAINER=	jrm@FreeBSD.org
+COMMENT=	Natural language detection for text samples
+
+LICENSE=	MIT
+LICENSE_FILE=	${WRKSRC}/LICENSE.txt
+
+NO_ARCH=	yes
+
+USE_RUBY=	yes
+USES=		gem
+
+.include <bsd.port.mk>
diff --git a/textproc/rubygem-whatlanguage/distinfo b/textproc/rubygem-whatlanguage/distinfo
new file mode 100644
index 000000000000..033f982ad8ec
--- /dev/null
+++ b/textproc/rubygem-whatlanguage/distinfo
@@ -0,0 +1,3 @@
+TIMESTAMP = 1493234905
+SHA256 (rubygem/whatlanguage-1.0.6.gem) = 2f3410f4c2cc50eb582640e01b2d18c478fc7a95a3d1bcfc5d8ea05a1f68fd69
+SIZE (rubygem/whatlanguage-1.0.6.gem) = 2982400
diff --git a/textproc/rubygem-whatlanguage/pkg-descr b/textproc/rubygem-whatlanguage/pkg-descr
new file mode 100644
index 000000000000..37c247cd1265
--- /dev/null
+++ b/textproc/rubygem-whatlanguage/pkg-descr
@@ -0,0 +1,10 @@
+WhatLanguage, written in pure-Ruby, detects the human language of supplied text.
+It uses Bloom filters, so it is fast and memory efficient.  It works well on
+text of over 10 words in length (e.g. blog posts or comments) and very poorly on
+short or Twitter-esque text.
+
+It works with Arabic, Dutch, English, Farsi, Finnish, French, German, Greek,
+Hebrew, Hungarian, Italian, Korean, Norwegian, Pinyin, Polish, Portuguese,
+Russian, Spanish, and Swedish out of the box.
+
+WWW: https://github.com/peterc/whatlanguage
-- 
cgit v1.2.3