commit embeddings data, not binary jar
Browse files
build.sh
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
#! /bin/bash
|
2 |
+
|
3 |
+
## download embeddings.txt
|
4 |
+
# dvc pull embeddings.txt.dvc
|
5 |
+
## or copy it out of a previous build
|
6 |
+
# unzip -j binary/graphseg.jar embeddings.txt
|
7 |
+
|
8 |
+
cp embeddings.txt source/res/
|
9 |
+
|
10 |
+
cd source
|
11 |
+
mvn package
|
12 |
+
mv target/graphseg-0.0.1-SNAPSHOT-jar-with-dependencies.jar ../binary/graphseg.jar
|
13 |
+
|
binary/graphseg.jar → embeddings.txt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18870b0a7516e4a72b44d3c226c242d2d846008967d8ce40b94c723a94d1a32b
|
3 |
+
size 693432828
|
source/src/edu/uma/nlp/graphseg/preprocessing/StanfordAnnotator.java
CHANGED
@@ -37,7 +37,8 @@ public class StanfordAnnotator implements IAnnotator {
|
|
37 |
{
|
38 |
Properties props = new Properties();
|
39 |
props.setProperty("annotators", stanfordAnnotatorsString);
|
40 |
-
|
|
|
41 |
StanfordCoreNLP pipeline = new StanfordCoreNLP(props);
|
42 |
|
43 |
edu.stanford.nlp.pipeline.Annotation docAnnotation = new edu.stanford.nlp.pipeline.Annotation(((Document)textUnit).getText());
|
|
|
37 |
{
|
38 |
Properties props = new Properties();
|
39 |
props.setProperty("annotators", stanfordAnnotatorsString);
|
40 |
+
props.setProperty("ssplit.eolonly", "true");
|
41 |
+
|
42 |
StanfordCoreNLP pipeline = new StanfordCoreNLP(props);
|
43 |
|
44 |
edu.stanford.nlp.pipeline.Annotation docAnnotation = new edu.stanford.nlp.pipeline.Annotation(((Document)textUnit).getText());
|