This is an automated email from the ASF dual-hosted git repository.
aradzinski pushed a commit to branch master_test
in repository https://gitbox.apache.org/repos/asf/incubator-nlpcraft.git
The following commit(s) were added to refs/heads/master_test by this push:
new 88233a0 WIP
88233a0 is described below
commit 88233a054b1004e45ef78a903b525f5a046de0f9
Author: Aaron Radzinski <[email protected]>
AuthorDate: Fri Dec 17 11:14:58 2021 -0800
WIP
---
.../nlp/token/parser/opennlp/impl/NCOpenNlpImpl.scala | 7 ++++---
.../scala/org/apache/nlpcraft/internal/util/NCUtils.scala | 13 +++++++++++++
2 files changed, 17 insertions(+), 3 deletions(-)
diff --git a/nlpcraft/src/main/scala/org/apache/nlpcraft/internal/nlp/token/parser/opennlp/impl/NCOpenNlpImpl.scala b/nlpcraft/src/main/scala/org/apache/nlpcraft/internal/nlp/token/parser/opennlp/impl/NCOpenNlpImpl.scala
index 920efde..7bf1df0 100644
--- a/nlpcraft/src/main/scala/org/apache/nlpcraft/internal/nlp/token/parser/opennlp/impl/NCOpenNlpImpl.scala
+++ b/nlpcraft/src/main/scala/org/apache/nlpcraft/internal/nlp/token/parser/opennlp/impl/NCOpenNlpImpl.scala
@@ -18,13 +18,14 @@
package org.apache.nlpcraft.internal.nlp.token.parser.opennlp.impl
import org.apache.nlpcraft.*
+
import java.io.*
import java.util.List as JList
-
import opennlp.tools.lemmatizer.*
import opennlp.tools.postag.*
import opennlp.tools.stemmer.*
import opennlp.tools.tokenize.*
+import org.apache.nlpcraft.internal.util.NCUtils
import scala.jdk.CollectionConverters.*
@@ -36,8 +37,8 @@ object NCOpenNlpImpl:
* @param lemmaDicSrc Local filesystem path, resources file path or URL
for OpenNLP lemmatizer dictionary.
* @return
*/
- def apply(tokMdlSrc: String, posMdlSrc: String, lemmaDicSrc: String):
NCOpenNlpImpl = ???
-
+ def apply(tokMdlSrc: String, posMdlSrc: String, lemmaDicSrc: String):
NCOpenNlpImpl =
+ new NCOpenNlpImpl(NCUtils.getStream(tokMdlSrc),
NCUtils.getStream(posMdlSrc), NCUtils.getStream(lemmaDicSrc))
/**
*
diff --git a/nlpcraft/src/main/scala/org/apache/nlpcraft/internal/util/NCUtils.scala b/nlpcraft/src/main/scala/org/apache/nlpcraft/internal/util/NCUtils.scala
index ec9b7cd..6855786 100644
--- a/nlpcraft/src/main/scala/org/apache/nlpcraft/internal/util/NCUtils.scala
+++ b/nlpcraft/src/main/scala/org/apache/nlpcraft/internal/util/NCUtils.scala
@@ -562,6 +562,19 @@ object NCUtils extends LazyLogging:
f.exists() && f.isFile
/**
+ *
+ * @param src Local filesystem path, resources file or URL.
+ */
+ def getStream(src: String): InputStream =
+ if isFile(src) then new FileInputStream(new File(src))
+ else if isResource(src) then
+ getClass.getClassLoader.getResourceAsStream(src) match
+ case in if in != null => in
+ case _ => throw new NCException(s"Resource not found: $src")
+ else if isUrl(src) then new URL(src).openStream()
+ else throw new NCException(s"Source not found or unsupported: $src")
+
+ /**
* Makes thread.
*
* @param name Name.