diff --git a/postagger/postagger.sh b/postagger/postagger.sh
new file mode 100644
index 0000000000..96426573f3
--- /dev/null
+++ b/postagger/postagger.sh
@@ -0,0 +1,44 @@
+#!/bin/sh
+##
+## postagger -- wrapper for running the Stanford POS tagger (MaxentTagger)
+##
+## Usage: postagger MODEL-NAME|MODEL-FILE [-textFile TEXT-FILE]
+##
+## The model argument is either the path of an existing file or the
+## name of a model found as @l_prefix@/share/postagger/NAME.tagger.
+## All remaining arguments are passed through to the tagger unchanged.
+##
+
+# determine Java environment
+export JAVA_PLATFORM="sun-jdk"
+eval "$(@l_prefix@/bin/java-toolkit -e)"
+
+# sanity check arguments: the model plus at most the two words of the
+# optional "-textFile TEXT-FILE" pair (i.e. one to three arguments)
+if [ $# -lt 1 ] || [ $# -gt 3 ]; then
+    echo "Usage: postagger MODEL-NAME|MODEL-FILE [-textFile TEXT-FILE]" 1>&2
+    exit 1
+fi
+model="$1"
+shift
+
+# determine model: use the argument as-is if it names an existing file,
+# otherwise look for a model of that name in the model directory
+if [ ! -f "$model" ]; then
+    if [ -f "@l_prefix@/share/postagger/$model.tagger" ]; then
+        model="@l_prefix@/share/postagger/$model.tagger"
+    else
+        echo "No such model: $model" 1>&2
+        exit 1
+    fi
+fi
+
+# pass-through execution (exec replaces this shell with the Java process)
+# NOTE(review): the trailing ":" in the class path looks like an empty
+# entry (presumably the current directory) -- confirm this is intended
+exec @l_prefix@/bin/java \
+    -mx5g -cp "@l_prefix@/lib/postagger/stanford-postagger.jar:" \
+    edu.stanford.nlp.tagger.maxent.MaxentTagger \
+    -model "$model" \
+    "$@"
+
diff --git a/postagger/postagger.spec b/postagger/postagger.spec
new file mode 100644
index 0000000000..4799c2e389
--- /dev/null
+++ b/postagger/postagger.spec
@@ -0,0 +1,90 @@
+##
+## postagger.spec -- OpenPKG RPM Package Specification
+## Copyright (c) 2000-2018 OpenPKG Project
+##
+## Permission to use, copy, modify, and distribute this software for
+## any purpose with or without fee is hereby granted, provided that
+## the above copyright notice and this permission notice appear in all
+## copies.
+##
+## THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
+## WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+## MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
+## IN NO EVENT SHALL THE AUTHORS AND COPYRIGHT HOLDERS AND THEIR
+## CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+## SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+## LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
+## USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
+## ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
+## OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
+## OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
+## SUCH DAMAGE.
+##
+
+# package version (V_base is the package version, V_date names the upstream archive)
+%define V_base 3.9.1
+%define V_date 2018-02-27
+
+# package information
+Name: postagger
+Summary: Stanford Part-Of-Speech (POS) Tagging
+URL: https://nlp.stanford.edu/software/tagger.shtml
+Vendor: Stanford University
+Packager: OpenPKG Project
+Distribution: OpenPKG Community
+Class: EVAL
+Group: Algorithm
+License: GPL
+Version: %{V_base}
+Release: 20180311
+
+# list of sources (upstream distribution archive and the wrapper script)
+Source0: https://nlp.stanford.edu/software/stanford-postagger-full-%{V_date}.zip
+Source1: postagger.sh
+
+# build information (build-time and install-time requirements)
+BuildPreReq: OpenPKG, openpkg >= 20160101
+PreReq: OpenPKG, openpkg >= 20160101
+
+%description
+    Stanford Part-Of-Speech Tagger (POS Tagger) is a piece of software
+    that reads text in some language and assigns parts of speech to each
+    word (and other token), such as noun, verb, adjective, etc.
+
+%track
+    prog postagger = {
+        version = %{V_date}
+        url = https://nlp.stanford.edu/software/tagger.shtml
+        regex = stanford-postagger-full-(\d+-\d+-\d+)\.zip
+    }
+
+%prep
+    %setup -q -n stanford-postagger-full-%{V_date}
+
+%build
+
+%install
+    # create installation hierarchy (bin, lib/postagger, share/postagger) below the build root
+    %{l_shtool} mkdir -f -p -m 755 \
+        $RPM_BUILD_ROOT%{l_prefix}/bin \
+        $RPM_BUILD_ROOT%{l_prefix}/lib/postagger \
+        $RPM_BUILD_ROOT%{l_prefix}/share/postagger
+
+    # install package: wrapper script as bin/postagger, the tagger JAR, and all files under models/
+    %{l_shtool} install -c -m 755 %{l_value -s -a} \
+        %{SOURCE postagger.sh} \
+        $RPM_BUILD_ROOT%{l_prefix}/bin/postagger
+    %{l_shtool} install -c -m 644 \
+        stanford-postagger.jar \
+        $RPM_BUILD_ROOT%{l_prefix}/lib/postagger/
+    %{l_shtool} install -c -m 644 \
+        models/* \
+        $RPM_BUILD_ROOT%{l_prefix}/share/postagger/
+
+    # determine installation files (list is written to "files" and read by the files section below)
+    %{l_rpmtool} files -v -ofiles -r$RPM_BUILD_ROOT %{l_files_std}
+
+%files -f files
+
+%clean
+