|
Java example source code file (Windows.java)
The Windows.java Java example source code/* * * * Copyright 2015 Skymind,Inc. * * * * Licensed under the Apache License, Version 2.0 (the "License"); * * you may not use this file except in compliance with the License. * * You may obtain a copy of the License at * * * * http://www.apache.org/licenses/LICENSE-2.0 * * * * Unless required by applicable law or agreed to in writing, software * * distributed under the License is distributed on an "AS IS" BASIS, * * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * * See the License for the specific language governing permissions and * * limitations under the License. * */ package org.deeplearning4j.text.movingwindow; import java.io.InputStream; import java.util.ArrayList; import java.util.List; import java.util.StringTokenizer; import lombok.NonNull; import org.deeplearning4j.berkeley.StringUtils; import org.deeplearning4j.text.tokenization.tokenizer.DefaultStreamTokenizer; import org.deeplearning4j.text.tokenization.tokenizer.Tokenizer; import org.deeplearning4j.text.tokenization.tokenizerfactory.TokenizerFactory; /** * Static utility class that tokenizes text input and builds lists of {@link Window} from the resulting tokens. * @author Adam Gibson */ public class Windows { /** * Builds a list of windows of size windowSize from a stream of text. * Every token produced by a {@link DefaultStreamTokenizer} over the stream is collected into a list, * which is then passed to the list-based windows overload together with windowSize. * Unlike the overload that takes a TokenizerFactory, this method performs no empty-token check before delegating. * Note (from the original author) that padding for each window is created as well. * @param words the input stream to tokenize and construct windows from * @param windowSize the window size to generate * @return the list of windows built from the tokens read from the stream */ public static List<Window> windows(InputStream words,int windowSize) { Tokenizer tokenizer = new DefaultStreamTokenizer(words); List<String> list = new ArrayList<>(); while(tokenizer.hasMoreTokens()) list.add(tokenizer.nextToken()); return windows(list,windowSize); } /** * Builds a list of windows of size windowSize from a stream of text, using a caller-supplied tokenizer. * The tokens are collected into a list and passed to the list-based windows overload together with windowSize. * Note (from the original author) that padding for each window is created as well. 
* @param words the input stream to tokenize and construct windows from * @param tokenizerFactory factory used to create the tokenizer over words * @param windowSize the window size to generate * @return the list of windows built from the tokens read from the stream * @throws IllegalStateException if the tokenizer produces no tokens */ public static List<Window> windows(InputStream words,TokenizerFactory tokenizerFactory,int windowSize) { Tokenizer tokenizer = tokenizerFactory.create(words); List<String> list = new ArrayList<>(); while(tokenizer.hasMoreTokens()) list.add(tokenizer.nextToken()); if(list.isEmpty()) throw new IllegalStateException("No tokens found for windows"); return windows(list,windowSize); } /** * Builds a list of windows of size windowSize from a string. * The string is split with a {@link StringTokenizer} using its default delimiters. * Note (from the original author) that padding for each window is created as well. * @param words the string to tokenize and construct windows from * @param windowSize the window size to generate * @return the list of windows for the tokenized string */ public static List<Window> windows(String words,int windowSize) { StringTokenizer tokenizer = new StringTokenizer(words); List<String> list = new ArrayList Other Java examples (source code examples)Here is a short list of links related to this Java Windows.java source code file: |
... this post is sponsored by my books ... | |
#1 New Release! |
FP Best Seller |
Copyright 1998-2021 Alvin Alexander, alvinalexander.com
All Rights Reserved.
A percentage of advertising revenue from
pages under the /java/jwarehouse
URI on this website is
paid back to open source projects.