|
Java example source code file (DefaultDocumentIteratorTest.java)
The DefaultDocumentIteratorTest.java Java example source code/* * * * Copyright 2015 Skymind,Inc. * * * * Licensed under the Apache License, Version 2.0 (the "License"); * * you may not use this file except in compliance with the License. * * You may obtain a copy of the License at * * * * http://www.apache.org/licenses/LICENSE-2.0 * * * * Unless required by applicable law or agreed to in writing, software * * distributed under the License is distributed on an "AS IS" BASIS, * * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * * See the License for the specific language governing permissions and * * limitations under the License. * */ package org.deeplearning4j.text.documentiterator; import static org.junit.Assert.*; import org.canova.api.util.ClassPathResource; import org.deeplearning4j.text.tokenization.tokenizer.Tokenizer; import org.deeplearning4j.text.tokenization.tokenizerfactory.DefaultTokenizerFactory; import org.deeplearning4j.text.tokenization.tokenizerfactory.TokenizerFactory; import org.junit.Test; import org.slf4j.Logger; import org.slf4j.LoggerFactory; import java.io.File; import java.io.InputStream; /** * Created by agibsonccc on 9/29/14. 
*/
public class DefaultDocumentIteratorTest {

    private static final Logger log = LoggerFactory.getLogger(DefaultDocumentIteratorTest.class);

    /**
     * Pulls the first document from a {@code FileDocumentIterator} built over the file behind
     * the {@code ClassPathResource} named {@code /reuters/5250}, tokenizes it with a
     * {@code DefaultTokenizerFactory}, and checks that the leading tokens are
     * {@code PEARSON CONCENTRATES ON FOUR SECTORS}, in that order.
     *
     * @throws Exception if the resource file cannot be resolved, or the document stream
     *                   cannot be read or closed
     */
    @Test
    public void testDocumentIterator() throws Exception {
        ClassPathResource reuters5250 = new ClassPathResource("/reuters/5250");
        File f = reuters5250.getFile();

        DocumentIterator iter = new FileDocumentIterator(f.getAbsolutePath());

        InputStream doc = iter.nextDocument();
        // Fail with a clear message instead of an NPE further down if no document came back.
        assertNotNull("iterator returned no document", doc);

        try {
            TokenizerFactory t = new DefaultTokenizerFactory();
            Tokenizer next = t.create(doc);

            // Expected leading tokens of the document.
            String[] list = "PEARSON CONCENTRATES ON FOUR SECTORS".split(" ");

            int count = 0;
            while (next.hasMoreTokens() && count < list.length) {
                String token = next.nextToken();
                assertEquals(list[count++], token);
            }

            // The loop also ends when the tokenizer runs dry; without this check an empty or
            // truncated document would pass without comparing every expected token.
            assertEquals("document ended before all expected tokens were seen", list.length, count);
        } finally {
            // Release the stream even when an assertion above fails.
            doc.close();
        }
    }
}
Other Java examples (source code examples)Here is a short list of links related to this Java DefaultDocumentIteratorTest.java source code file: |
... this post is sponsored by my books ... | |
#1 New Release! |
FP Best Seller |
Copyright 1998-2021 Alvin Alexander, alvinalexander.com
All Rights Reserved.
A percentage of advertising revenue from
pages under the /java/jwarehouse
URI on this website is
paid back to open source projects.