Advertisement
Guest User

Untitled

a guest
Nov 15th, 2019
111
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.99 KB | None | 0 0
  1. import java.util.Collection;
  2.  
  3. import org.deeplearning4j.models.embeddings.loader.WordVectorSerializer;
  4. import org.deeplearning4j.models.word2vec.Word2Vec;
  5. import org.deeplearning4j.text.sentenceiterator.BasicLineIterator;
  6. import org.deeplearning4j.text.sentenceiterator.SentenceIterator;
  7. import org.deeplearning4j.text.tokenization.tokenizer.preprocessor.CommonPreprocessor;
  8. import org.deeplearning4j.text.tokenization.tokenizerfactory.DefaultTokenizerFactory;
  9. import org.deeplearning4j.text.tokenization.tokenizerfactory.TokenizerFactory;
  10.  
  11. public class main {
  12.  
  13. public static void main(String[] args) throws Exception {
  14. //Path du document pour apprentissage
  15. String filePath = "C:/Users/lucas/Desktop/M2/Web Semantique/Projet/web-semantique/src/main/resources/raw_sentences.txt";
  16.  
  17. //Ouverture et tokenization du document
  18. System.out.println("Load & Vectorize Sentences....");
  19. SentenceIterator iter = new BasicLineIterator(filePath);
  20. TokenizerFactory t = new DefaultTokenizerFactory();
  21. t.setTokenPreProcessor(new CommonPreprocessor());
  22.  
  23. //Build du model
  24. System.out.println("Building model....");
  25. Word2Vec vec = new Word2Vec.Builder()
  26. .minWordFrequency(5)
  27. .layerSize(100)
  28. .seed(42)
  29. .windowSize(5)
  30. .iterate(iter)
  31. .tokenizerFactory(t)
  32. .build();
  33.  
  34. //Entrainement du model
  35. System.out.println("Fitting Word2Vec model....");
  36. vec.fit();
  37.  
  38. //Affichage des mots les plus proches de "le"
  39. System.out.println("Closest Words:");
  40. Collection<String> lst = vec.wordsNearest("le", 3);
  41. System.out.println(lst);
  42.  
  43. //Sauvegarde du model buildé pour pouvoir le recharger ultérieurement
  44. WordVectorSerializer.writeWord2VecModel(vec, "C:/Users/lucas/Desktop/M2/Web Semantique/Projet/web-semantique/src/main/resources/model.txt");
  45. }
  46. }
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement