Skip to content

Commit 0e19ef4

Browse files
Hendrik Schmeer authored and Hendrik Schmeer committed
Merge branch 'master' of https://github.com/schlusslicht/Cheiron
Conflicts: .settings/org.eclipse.jdt.core.prefs
2 parents 64da4c0 + 073dac6 commit 0e19ef4

File tree

7 files changed: +33 -4 lines changed

.settings/org.eclipse.jdt.core.prefs

+12
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,12 @@
1+
eclipse.preferences.version=1
2+
org.eclipse.jdt.core.compiler.codegen.inlineJsrBytecode=enabled
3+
org.eclipse.jdt.core.compiler.codegen.targetPlatform=1.8
4+
org.eclipse.jdt.core.compiler.codegen.unusedLocal=preserve
5+
org.eclipse.jdt.core.compiler.compliance=1.8
6+
org.eclipse.jdt.core.compiler.debug.lineNumber=generate
7+
org.eclipse.jdt.core.compiler.debug.localVariable=generate
8+
org.eclipse.jdt.core.compiler.debug.sourceFile=generate
9+
org.eclipse.jdt.core.compiler.problem.assertIdentifier=error
10+
org.eclipse.jdt.core.compiler.problem.enumIdentifier=error
11+
org.eclipse.jdt.core.compiler.problem.forbiddenReference=warning
12+
org.eclipse.jdt.core.compiler.source=1.8

src/Cheiron/Processor/Matetools/Lemmatizer.java

+4-2
Original file line numberDiff line numberDiff line change
@@ -22,6 +22,9 @@ public class Lemmatizer extends JCasAnnotator_ImplBase {
2222
private static Map<String, is2.lemmatizer2.Lemmatizer> detectors = new HashMap<String, is2.lemmatizer2.Lemmatizer>();
2323

2424
private void processView(JCas view) {
25+
if (!detectors.containsKey(view.getDocumentLanguage()))
26+
return;
27+
2528
Token token = null;
2629
String[] tokens = null;
2730
ArrayList<Token> tokenList = null;
@@ -72,8 +75,7 @@ private void processView(JCas view) {
7275
lemma.addToIndexes();
7376
token.setLemma(lemma);
7477

75-
System.out
76-
.println("Matetools.Lemmatizer: " + token.getCoveredText() + "/" + lemma.getValue());
78+
System.out.println("Matetools.Lemmatizer: " + token.getCoveredText() + "/" + lemma.getValue());
7779
}
7880

7981
token_it.moveToFirst();

src/Cheiron/Processor/Matetools/Postagger.java

+4-2
Original file line numberDiff line numberDiff line change
@@ -26,6 +26,9 @@ public class Postagger extends JCasAnnotator_ImplBase {
2626
private static Map<String, Parser> pdetectors = new HashMap<String, Parser>();
2727

2828
private void processView(JCas view) {
29+
if (ldetectors.containsKey(view.getDocumentLanguage()) || !pdetectors.containsKey(view.getDocumentLanguage()))
30+
return;
31+
2932
Token token = null;
3033
String[] tokens = null;
3134
ArrayList<Token> tokenList = null;
@@ -87,8 +90,7 @@ private void processView(JCas view) {
8790
}
8891
token.setPosTag(tokenArray);
8992

90-
System.out
91-
.println("Matetools.Postagger: " + token.getCoveredText() + "/" + postag.getValue());
93+
System.out.println("Matetools.Postagger: " + token.getCoveredText() + "/" + postag.getValue());
9294
}
9395

9496
token_it.moveToFirst();

src/Cheiron/Processor/OpenNLP/Postagger.java

+3
Original file line numberDiff line numberDiff line change
@@ -23,6 +23,9 @@ public class Postagger extends Processor_ImplBase {
2323

2424
@Override
2525
public void processView(JCas view) {
26+
if (!detectors.containsKey(view.getDocumentLanguage()))
27+
return;
28+
2629
Token token = null;
2730
String[] tokens = null;
2831
List<Token> tokenList = null;

src/Cheiron/Processor/OpenNLP/Sentencer.java

+3
Original file line numberDiff line numberDiff line change
@@ -18,6 +18,9 @@ public class Sentencer extends Processor_ImplBase {
1818

1919
@Override
2020
public void processView(JCas view) {
21+
if (!detectors.containsKey(view.getDocumentLanguage()))
22+
return;
23+
2124
Sentence sentence = null;
2225

2326
for (Span span : detectors.get(view.getDocumentLanguage()).sentPosDetect(view.getDocumentText())) {

src/Cheiron/Processor/OpenNLP/Tokenizer.java

+3
Original file line numberDiff line numberDiff line change
@@ -20,6 +20,9 @@ public class Tokenizer extends Processor_ImplBase {
2020

2121
@Override
2222
public void processView(JCas view) {
23+
if (!detectors.containsKey(view.getDocumentLanguage()))
24+
return;
25+
2326
Token token = null;
2427

2528
for (Sentence sentence : JCasUtil.select(view, Sentence.class)) {

src/Cheiron/Processor/Stanford/Postagger.java

+4
Original file line numberDiff line numberDiff line change
@@ -24,6 +24,9 @@ public class Postagger extends Processor_ImplBase {
2424

2525
@Override
2626
public void processView(JCas view) {
27+
if (!detectors.containsKey(view.getDocumentLanguage()))
28+
return;
29+
2730
Token token = null;
2831
List<Word> tokens = null;
2932
List<Token> tokenList = null;
@@ -42,6 +45,7 @@ public void processView(JCas view) {
4245
for (Token t : tokenList)
4346
tokens.add(new Word(t.getCoveredText()));
4447

48+
4549
postags = detectors.get(view.getDocumentLanguage()).tagSentence(tokens);
4650

4751
for (int i = 0; i < postags.size(); i++) {

0 commit comments

Comments
 (0)