commit embeddings data, not binary jar
Browse files
build.sh
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
#! /bin/bash
|
| 2 |
+
|
| 3 |
+
## download embeddings.txt
|
| 4 |
+
# dvc pull embeddings.txt.dvc
|
| 5 |
+
## or copy it out of a previous build
|
| 6 |
+
# unzip -j binary/graphseg.jar embeddings.txt
|
| 7 |
+
|
| 8 |
+
cp embeddings.txt source/res/
|
| 9 |
+
|
| 10 |
+
cd source
|
| 11 |
+
mvn package
|
| 12 |
+
mv target/graphseg-0.0.1-SNAPSHOT-jar-with-dependencies.jar ../binary/graphseg.jar
|
| 13 |
+
|
binary/graphseg.jar → embeddings.txt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:18870b0a7516e4a72b44d3c226c242d2d846008967d8ce40b94c723a94d1a32b
|
| 3 |
+
size 693432828
|
source/src/edu/uma/nlp/graphseg/preprocessing/StanfordAnnotator.java
CHANGED
|
@@ -37,7 +37,8 @@ public class StanfordAnnotator implements IAnnotator {
|
|
| 37 |
{
|
| 38 |
Properties props = new Properties();
|
| 39 |
props.setProperty("annotators", stanfordAnnotatorsString);
|
| 40 |
-
|
|
|
|
| 41 |
StanfordCoreNLP pipeline = new StanfordCoreNLP(props);
|
| 42 |
|
| 43 |
edu.stanford.nlp.pipeline.Annotation docAnnotation = new edu.stanford.nlp.pipeline.Annotation(((Document)textUnit).getText());
|
|
|
|
| 37 |
{
|
| 38 |
Properties props = new Properties();
|
| 39 |
props.setProperty("annotators", stanfordAnnotatorsString);
|
| 40 |
+
props.setProperty("ssplit.eolonly", "true");
|
| 41 |
+
|
| 42 |
StanfordCoreNLP pipeline = new StanfordCoreNLP(props);
|
| 43 |
|
| 44 |
edu.stanford.nlp.pipeline.Annotation docAnnotation = new edu.stanford.nlp.pipeline.Annotation(((Document)textUnit).getText());
|