Skip to content

Commit

Permalink
Add vdr module
Browse files — browse the repository at this point in the history
  • Loading branch information
phuonglh committed May 15, 2020
1 parent 0ab2540 commit c5005d5
Show file tree
Hide file tree
Showing 18 changed files with 42,899 additions and 12 deletions.
26 changes: 14 additions & 12 deletions build.sbt
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,8 @@ lazy val commonSettings = Seq(
libraryDependencies ++= Seq(
"org.apache.spark" %% "spark-core" % sparkVersion % "provided",
"org.apache.spark" %% "spark-sql" % sparkVersion % "provided",
"org.apache.spark" %% "spark-mllib" % sparkVersion % "provided"
"org.apache.spark" %% "spark-mllib" % sparkVersion % "provided",
"com.github.scopt" %% "scopt" % "3.7.1",
)
)

Expand All @@ -32,10 +33,7 @@ lazy val tag = (project in file("tag"))
.settings(
commonSettings,
mainClass in assembly := Some("vlp.tag.Tagger"),
assemblyJarName in assembly := "tag.jar",
libraryDependencies ++= Seq(
"com.github.scopt" %% "scopt" % "3.7.1"
)
assemblyJarName in assembly := "tag.jar"
)

// transition-based dependency parsing module
Expand All @@ -46,7 +44,6 @@ lazy val tdp = (project in file("tdp"))
mainClass in assembly := Some("vlp.tdp.Parser"),
assemblyJarName in assembly := "tdp.jar",
libraryDependencies ++= Seq(
"com.github.scopt" %% "scopt" % "3.7.1",
"com.github.fommil.netlib" % "all" % "1.1.2" pomOnly()
)
)
Expand All @@ -69,10 +66,7 @@ lazy val tpm = (project in file("tpm"))
.settings(
commonSettings,
mainClass in assembly := Some("vlp.tpm.LDA"),
assemblyJarName in assembly := "tpm.jar",
libraryDependencies ++= Seq(
"com.github.scopt" %% "scopt" % "3.7.1"
)
assemblyJarName in assembly := "tpm.jar"
)

// text classification module
Expand All @@ -83,7 +77,6 @@ lazy val tcl = (project in file("tcl"))
mainClass in assembly := Some("vlp.tcl.Classifier"),
assemblyJarName in assembly := "tcl.jar",
libraryDependencies ++= Seq(
"com.github.scopt" %% "scopt" % "3.7.1",
"com.github.fommil.netlib" % "all" % "1.1.2" pomOnly()
)
)
Expand All @@ -95,7 +88,6 @@ lazy val idx = (project in file("idx"))
mainClass in assembly := Some("vlp.idx.NewsIndexer"),
assemblyJarName in assembly := "idx.jar",
libraryDependencies ++= Seq(
"com.github.scopt" %% "scopt" % "3.7.1",
"mysql" % "mysql-connector-java" % "8.0.16",
"org.elasticsearch.client" % "elasticsearch-rest-high-level-client" % "7.1.1",
"de.l3s.boilerpipe" % "boilerpipe" % "1.1.0",
Expand All @@ -104,3 +96,13 @@ lazy val idx = (project in file("idx"))
"org.glassfish" % "javax.json" % "1.1.4"
)
)

// Vietnamese diacritics restoration module.
// All library dependencies come from commonSettings; this module declares no
// dependencies of its own. Add a `libraryDependencies ++= Seq(...)` entry here
// only when a module-specific dependency is actually needed.
lazy val vdr = (project in file("vdr"))
  .settings(
    commonSettings,
    // Entry point and file name of the fat JAR built by sbt-assembly.
    mainClass in assembly := Some("vlp.vdr.Restorer"),
    assemblyJarName in assembly := "vdr.jar"
  )
Binary file added dat/txt/vlsp.txt.tar.gz
Binary file not shown.
Loading

0 comments on commit c5005d5

Please sign in to comment.