|
Java example source code file (Word2VecIteratorTest.java)
The Word2VecIteratorTest.java Java example source code/* * * * Copyright 2015 Skymind,Inc. * * * * Licensed under the Apache License, Version 2.0 (the "License"); * * you may not use this file except in compliance with the License. * * You may obtain a copy of the License at * * * * http://www.apache.org/licenses/LICENSE-2.0 * * * * Unless required by applicable law or agreed to in writing, software * * distributed under the License is distributed on an "AS IS" BASIS, * * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * * See the License for the specific language governing permissions and * * limitations under the License. * */ package org.deeplearning4j.models.word2vec.iterator; import org.canova.api.util.ClassPathResource; import org.deeplearning4j.models.embeddings.WeightLookupTable; import org.deeplearning4j.models.embeddings.inmemory.InMemoryLookupTable; import org.deeplearning4j.models.embeddings.wordvectors.WordVectors; import org.deeplearning4j.models.word2vec.Word2Vec; import org.deeplearning4j.models.word2vec.wordstore.inmemory.InMemoryLookupCache; import org.deeplearning4j.text.sentenceiterator.SentenceIterator; import org.deeplearning4j.text.sentenceiterator.UimaSentenceIterator; import org.deeplearning4j.text.sentenceiterator.labelaware.LabelAwareFileSentenceIterator; import org.deeplearning4j.text.tokenization.tokenizerfactory.TokenizerFactory; import org.deeplearning4j.text.tokenization.tokenizerfactory.UimaTokenizerFactory; import org.junit.Before; import org.junit.Test; import org.nd4j.linalg.api.ndarray.INDArray; import org.nd4j.linalg.dataset.DataSet; import java.io.File; import java.util.ArrayList; import java.util.Arrays; import static org.junit.Assert.assertNotEquals; /** * Created by agibsonccc on 3/5/15. */ public class Word2VecIteratorTest { private Word2Vec vec; @Before public void before() throws Exception { if(vec == null) { ClassPathResource resource = new ClassPathResource("/labeled/"); File file = resource.getFile(); SentenceIterator iter = UimaSentenceIterator.createWithPath(file.getAbsolutePath()); new File("cache.ser").delete(); TokenizerFactory t = new UimaTokenizerFactory(); vec = new Word2Vec.Builder() .minWordFrequency(1).iterations(5) .layerSize(100) .stopWords(new ArrayList<String>()) .useUnknown(true) .windowSize(5).iterate(iter).tokenizerFactory(t).build(); vec.fit(); } } @Test public void testLabeledExample() throws Exception { INDArray unk = vec.getWordVectorMatrix(Word2Vec.DEFAULT_UNK); assertNotEquals(null, unk); unk = vec.getWordVectorMatrix("2131241sdasdas"); assertNotEquals(null, unk); Word2VecDataSetIterator iter = new Word2VecDataSetIterator(vec,new LabelAwareFileSentenceIterator(null, new ClassPathResource("labeled/").getFile()), Arrays.asList("negative","positive","neutral")); DataSet next = iter.next(); } } Other Java examples (source code examples)Here is a short list of links related to this Java Word2VecIteratorTest.java source code file: |
... this post is sponsored by my books ... | |
#1 New Release! |
FP Best Seller |
Copyright 1998-2021 Alvin Alexander, alvinalexander.com
All Rights Reserved.
A percentage of advertising revenue from
pages under the /java/jwarehouse
URI on this website is
paid back to open source projects.