lucio committed on
Commit
9074cf1
1 Parent(s): fe40a1e

commit embeddings data, not binary jar

Browse files
build.sh ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #! /bin/bash
2
+
3
+ ## download embeddings.txt
4
+ # dvc pull embeddings.txt.dvc
5
+ ## or copy it out of a previous build
6
+ # unzip -j binary/graphseg.jar embeddings.txt
7
+
8
+ cp embeddings.txt source/res/
9
+
10
+ cd source
11
+ mvn package
12
+ mv target/graphseg-0.0.1-SNAPSHOT-jar-with-dependencies.jar ../binary/graphseg.jar
13
+
binary/graphseg.jar → embeddings.txt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8933d43d10f8ba885d4df38b3b0a2d1bf7796f7d367b7f9fef6f3925801987c5
3
- size 616819715
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18870b0a7516e4a72b44d3c226c242d2d846008967d8ce40b94c723a94d1a32b
3
+ size 693432828
source/src/edu/uma/nlp/graphseg/preprocessing/StanfordAnnotator.java CHANGED
@@ -37,7 +37,8 @@ public class StanfordAnnotator implements IAnnotator {
37
  {
38
  Properties props = new Properties();
39
  props.setProperty("annotators", stanfordAnnotatorsString);
40
-
 
41
  StanfordCoreNLP pipeline = new StanfordCoreNLP(props);
42
 
43
  edu.stanford.nlp.pipeline.Annotation docAnnotation = new edu.stanford.nlp.pipeline.Annotation(((Document)textUnit).getText());
 
37
  {
38
  Properties props = new Properties();
39
  props.setProperty("annotators", stanfordAnnotatorsString);
40
+ props.setProperty("ssplit.eolonly", "true");
41
+
42
  StanfordCoreNLP pipeline = new StanfordCoreNLP(props);
43
 
44
  edu.stanford.nlp.pipeline.Annotation docAnnotation = new edu.stanford.nlp.pipeline.Annotation(((Document)textUnit).getText());