Raks-coder
diff --git a/‎Digital-Assignment/.idea/workspace.xml
Lines changed: 89 additions & 69 deletions b/‎Digital-Assignment/.idea/workspace.xml
Lines changed: 89 additions & 69 deletions
diff --git a/‎Digital-Assignment/Readme.md
Lines changed: 1 addition & 6 deletions b/‎Digital-Assignment/Readme.md
Lines changed: 1 addition & 6 deletions
diff --git a/‎Digital-Assignment/out/production/Digital-Assignment/OpenNLP/Tokenization/SentenceTokenization.class
1.35 KB b/‎Digital-Assignment/out/production/Digital-Assignment/OpenNLP/Tokenization/SentenceTokenization.class
1.35 KB
diff --git a/‎Digital-Assignment/out/production/Digital-Assignment/TokenizerMEProbs.class
2.21 KB b/‎Digital-Assignment/out/production/Digital-Assignment/TokenizerMEProbs.class
2.21 KB
diff --git a/‎Digital-Assignment/resources/en-token.bin
430 KB b/‎Digital-Assignment/resources/en-token.bin
430 KB
diff --git a/‎Digital-Assignment/src/OpenNLP/Tokenization/SentenceTokenization.java
Lines changed: 32 additions & 0 deletions b/‎Digital-Assignment/src/OpenNLP/Tokenization/SentenceTokenization.java
Lines changed: 32 additions & 0 deletions
diff --git a/‎Digital-Assignment/src/OpenNLP/Tokenization/TokenizerMEProbs.java
Lines changed: 32 additions & 0 deletions b/‎Digital-Assignment/src/OpenNLP/Tokenization/TokenizerMEProbs.java
Lines changed: 32 additions & 0 deletions
@@ -12,13 +12,8 @@ Develop Java Programs implementing 10 new concepts/features/Topics (not in our s
   3. **Resolving Authentication failure**: Open [this link](https://www.google.com/settings/security/lesssecureapps) and turn on the radio button to allow mail to be sent from unknown locations.
 
 ## Language Detection using OpenNLP
-* Code - [LanguageDetectorMain.java](https://github.com/jacobjohn2016/Java-Programming/blob/master/Digital-Assignment/src/languagedetector/LanguageDetectorMain.java), [LanguageMapper.java](https://github.com/jacobjohn2016/Java-Programming/blob/master/Digital-Assignment/src/languagedetector/LanguageMapper.java)
+* Code - [LanguageDetectorMain.java](https://github.com/jacobjohn2016/Java-Programming/blob/master/Digital-Assignment/src/OpenNLP/languagedetector/LanguageDetectorMain.java), [LanguageMapper.java](https://github.com/jacobjohn2016/Java-Programming/blob/master/Digital-Assignment/src/OpenNLP/languagedetector/LanguageMapper.java)
 * [Source](https://github.com/Ruthwik/Language-Detection)
 * [`.jar` files](https://github.com/jacobjohn2016/Java-Programming/tree/master/Digital-Assignment/apache-opennlp-1.9.1/lib)
 * The Apache OpenNLP library is a machine learning based toolkit for the processing of natural language text. It supports the most common NLP tasks, such as language detection, tokenization, sentence segmentation, part-of-speech tagging, named entity extraction, chunking, parsing and coreference resolution.
 * This model is trained for, and works well with, longer texts that contain at least two sentences in the same language.
-
-## Face Detection using OpenCV
-* [Code](https://github.com/jacobjohn2016/Java-Programming/blob/master/Digital-Assignment/src/FaceDetector.java)
-* [Source](https://www.geeksforgeeks.org/image-processing-java-set-9-face-detection/)
-* [`.jar` files](https://github.com/jacobjohn2016/Java-Programming/blob/master/Digital-Assignment/opencv-3.2.0-1.jar)
@@ -0,0 +1,32 @@
+package OpenNLP.Tokenization;
+
+import opennlp.tools.tokenize.SimpleTokenizer;
+import opennlp.tools.tokenize.WhitespaceTokenizer;
+
+/**
+ * Small demo that splits one hard-coded text into tokens twice: first with
+ * OpenNLP's {@link SimpleTokenizer}, then with its {@link WhitespaceTokenizer},
+ * printing every token on its own line.
+ */
+public class SentenceTokenization {
+
+    /**
+     * Tokenizes the sample text with both tokenizers and writes the tokens to
+     * standard output, the simple tokenizer's output first.
+     *
+     * @param args command-line arguments (unused)
+     */
+    public static void main(String[] args) {
+        String text = "Hi. How are you? Welcome to Tutorialspoint. "
+                + "We provide free tutorials on various technologies";
+
+        // First pass: the shared SimpleTokenizer instance
+        printEach(SimpleTokenizer.INSTANCE.tokenize(text));
+
+        // Second pass: the shared WhitespaceTokenizer instance
+        printEach(WhitespaceTokenizer.INSTANCE.tokenize(text));
+    }
+
+    /** Prints each element of {@code items} on its own line, in array order. */
+    private static void printEach(String[] items) {
+        for (int idx = 0; idx < items.length; idx++) {
+            System.out.println(items[idx]);
+        }
+    }
+}
@@ -0,0 +1,32 @@
+import java.io.FileInputStream;
+import java.io.InputStream;
+import opennlp.tools.tokenize.TokenizerME;
+import opennlp.tools.tokenize.TokenizerModel;
+import opennlp.tools.util.Span;
+
+/**
+ * Small demo of OpenNLP's {@link TokenizerME}: tokenizes one hard-coded
+ * sentence, prints each token span with the text it covers, and then prints
+ * the probabilities reported by the tokenizer for that tokenization.
+ */
+public class TokenizerMEProbs {
+
+    /**
+     * Loads the tokenizer model from {@code resources/en-token.bin} (resolved
+     * against the working directory), tokenizes the sample sentence and writes
+     * the spans and probabilities to standard output.
+     *
+     * @param args command-line arguments (unused)
+     * @throws Exception if the model file cannot be opened or read
+     */
+    public static void main(String args[]) throws Exception{
+        String sent = "Hello John how are you welcome to Tutorialspoint";
+
+        // Load the tokenizer model. try-with-resources guarantees the file
+        // stream is closed even when model loading fails; previously the
+        // stream was never closed.
+        TokenizerModel tokenModel;
+        try (InputStream inputStream = new FileInputStream("resources/en-token.bin")) {
+            tokenModel = new TokenizerModel(inputStream);
+        }
+
+        // Instantiate the TokenizerME class with the loaded model
+        TokenizerME tokenizer = new TokenizerME(tokenModel);
+
+        // Retrieve the positions (spans) of the tokens
+        Span tokens[] = tokenizer.tokenizePos(sent);
+
+        // Probabilities for the tokenizePos() call just made; must be read
+        // before the tokenizer is used again
+        double[] probs = tokenizer.getTokenProbabilities();
+
+        // Print each span followed by the text it covers
+        for (Span token : tokens) {
+            System.out.println(token +" "+sent.substring(token.getStart(), token.getEnd()));
+        }
+
+        // Separator line between the spans and the probabilities
+        System.out.println("  ");
+
+        // Print the probabilities, one per line
+        for (double prob : probs) {
+            System.out.println(prob);
+        }
+    }
+}