-
Notifications
You must be signed in to change notification settings - Fork 7
/
Description.props
41 lines (28 loc) · 1.87 KB
/
Description.props
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
# Description file for SCStemmers
# Package name (required)
PackageName=SCStemmers
# Version (required)
Version=1.1.1
# Date
Date=2018-10-16
# Title (required)
Title=A collection of stemmers for Serbian and Croatian.
Category=Preprocessing
# Author (required)
Author=Vuk Batanovic <vuk.batanovic@student.etf.bg.ac.rs>
# Maintainer (required)
Maintainer=Vuk Batanovic <vuk.batanovic@student.etf.bg.ac.rs>
# License (required)
License=GPL 3.0
# Description (required)
Description=This package contains Java implementations of three previously published stemmers for Serbian - two of them by Keselj and Sipka, one by Milosevic - and one for Croatian by Ljubesic and Pandzic. All stemmers require the input text to be in UTF-8. The stemmers accept text in both the Cyrillic and Latin scripts as input, and give the output in the Latin script. Performance comparisons between the stemmers (on the task of sentiment analysis) can be found in the paper "Reliable Baselines for Sentiment Analysis in Resource-Limited Languages: The Serbian Movie Review Dataset," Vuk Batanovic, Bosko Nikolic, Milan Milosavljevic, in Proceedings of the 10th International Conference on Language Resources and Evaluation (LREC 2016), pp. 2688-2696, Portoroz, Slovenia (2016). See the webpage for the list of reference papers and more information.
# Package URL for obtaining the package archive (required)
PackageURL=https://github.com/vukbatanovic/SCStemmers/releases/download/v1.1.1/SCStemmers_1.1.1.zip
# URL for further information
URL=https://github.com/vukbatanovic/SCStemmers/
# Dependencies
Depends=weka (>=3.7.12)
# Special instructions to be displayed on installation of this package
MessageToDisplayOnInstallation=This package requires running Weka with the (-Dfile.encoding=utf-8) option,\n\
or changing the line (fileEncoding=Cp1252) to (fileEncoding=utf-8) in the weka.ini file.\n\
Files should also be in UTF-8 format.