Skip to content

Commit

Permalink
bump version
Browse files Browse the repository at this point in the history
  • Loading branch information
jiemakel committed Jun 7, 2016
1 parent eccc65f commit 2f5bc54
Show file tree
Hide file tree
Showing 3 changed files with 12 additions and 10 deletions.
8 changes: 5 additions & 3 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,7 @@ Lexical Analysis Command-Line Tool for lemmatizing, lexical analysis and languag

Program help:
```
las 1.4.1
las 1.4.5
Usage: las [lemmatize|analyze|inflect|recognize|identify] [options] [<file>...]
Command: lemmatize
Expand All @@ -13,19 +13,21 @@ Command: analyze
Command: inflect
(locales: de, en, fi, fr, it, liv, mdf, mhr, mrj, myv, sme, sv, tr, udm)
Command: recognize
report recognition rate (locales: de, en, fi, fr, it, liv, mdf, mhr, mrj, myv, sme, sv, tr, udm, la)
report word recognition rate (locales: de, en, fi, fr, it, liv, mdf, mhr, mrj, myv, sme, sv, tr, udm, la)
Command: identify
identify language (locales: zh-TW, fi, no, hr, ta, ar, fr, is, lv, eu, mt, bn, dk, uk, pa, ga, br, so, pt, cs, fr, gl, sr, zh-CN, mrj, el, it, ca, vi, tl, nl, bg, ko, liv, it, mk, oc, et, af, de, ru, yi, cy, en, udm, ur, mdf, myv, sme, ru, ht, ml, th, id, sq, sv, de, sv, tr, da, en, gu, he, es, kn, sk, es, hi, te, mr, an, sw, be, pt, nl, ja, ast, fi, ro, mhr, ne, lt, no, km, sl, fa, ms, hu, pl, la, tr)
--locale <value>
possible locales
--forms <value>
inflection forms for inflect/analyze
--segment
segment compound words?
segment baseforms?
--no-guess
Don't guess baseforms for unknown words?
--no-segment-guessed
Don't guess segmentation information for guessed words (speeds up processing significantly)?
--process-by <value>
Analysis unit when processing files (file, paragraph, line)?
--max-edit-distance <value>
Maximum edit distance for error-correcting unidentified words (default 0)?
--no-pretty
Expand Down
4 changes: 2 additions & 2 deletions build.sbt
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@ version := "1.4.2"
scalaVersion := "2.11.8"

libraryDependencies ++= Seq(
"fi.seco" % "lexicalanalysis" % "1.4.4",
"fi.seco" % "lexicalanalysis" % "1.4.5",
"com.optimaize.languagedetector" % "language-detector" % "0.5",
"com.github.scopt" %% "scopt" % "3.4.0",
"com.typesafe.play" %% "play-json" % "2.5.3",
Expand All @@ -24,6 +24,6 @@ assemblyMergeStrategy in assembly := {
oldStrategy(x)
}

assemblyOption in assembly := (assemblyOption in assembly).value.copy(prependShellScript = Some(Seq("#!/usr/bin/env sh", """exec java -jar "$0" "$@"""")))
assemblyOption in assembly := (assemblyOption in assembly).value.copy(prependShellScript = Some(Seq("#!/usr/bin/env sh", """exec java -jar -Xmx4G "$0" "$@"""")))

assemblyJarName in assembly := "las"
10 changes: 5 additions & 5 deletions src/main/scala/LASCommandLineTool.scala
Original file line number Diff line number Diff line change
Expand Up @@ -31,10 +31,10 @@ object LASCommandLineTool {
lazy val compoundlas = new CompoundLexicalAnalysisService(combinedlas, snowballlas)

object LanguageDetector extends LazyLogging {
val languageProfiles = new LanguageProfileReader().readAllBuiltIn()
val supportedLanguages = languageProfiles.map(_.getLocale.toString())
val detector = LanguageDetectorBuilder.create(NgramExtractors.standard()).withProfiles(languageProfiles).build()
val textObjectFactory = CommonTextObjectFactories.forDetectingOnLargeText()
lazy val languageProfiles = new LanguageProfileReader().readAllBuiltIn()
lazy val supportedLanguages = languageProfiles.map(_.getLocale.toString())
lazy val detector = LanguageDetectorBuilder.create(NgramExtractors.standard()).withProfiles(languageProfiles).build()
lazy val textObjectFactory = CommonTextObjectFactories.forDetectingOnLargeText()
def apply(text: String) = detector.getProbabilities(textObjectFactory.forText(text))
}

Expand All @@ -54,7 +54,7 @@ object LASCommandLineTool {

def main(args: Array[String]) = {
val parser = new scopt.OptionParser[Config]("las") {
head("las", "1.4.2")
head("las", "1.4.5")
cmd("lemmatize") action { (_, c) =>
c.copy(action = Action.Lemmatize)
} text (s"(locales: ${compoundlas.getSupportedBaseformLocales.mkString(", ")})")
Expand Down

0 comments on commit 2f5bc54

Please sign in to comment.