<meta name="decorator" content="popup"/>
<meta name="useModuleDefaults" content="true"/>
<meta name="module" content="sources"/>
<meta name="pageTitle" content="TextParser.java [src/csip/utils], Revision: default"/>

<FONT CLASS="titlenormal">TextParser.java [src/csip/utils] Revision: default&nbsp;&nbsp;Date: </FONT>
<HR NOSHADE>
<PRE><PRE CLASS="editor">/*
 * $Id$
 *
 * This file is part of the Cloud Services Integration Platform (CSIP),
 * a Model-as-a-Service framework, API and application suite.
 *
 * 2012-2022, Olaf David and others, OMSLab, Colorado State University.
 *
 * OMSLab licenses this file to you under the MIT license.
 * See the LICENSE file in the project root for more information.
 */
package csip.utils;

import java.io.BufferedReader;
import java.io.File;
import java.io.FileNotFoundException;
import java.io.FileReader;
import java.io.IOException;
import java.io.StringReader;
import java.util.Arrays;
import java.util.regex.Pattern;
import java.util.stream.DoubleStream;
import java.util.stream.IntStream;

/**
 * Extract tokens from an ASCII file (usually some kind of model output).
 *
 * A parser keeps one "current line". The navigation methods (nextLine...,
 * toLine..., skipLines...) advance it, the rightOf.../leftOf... methods cut it
 * down to a substring, and the terminating operations (tokens, asString,
 * asDouble, ...) return a value derived from it. Most non-terminating methods
 * return this instance so that calls can be chained.
 *
 * When the end of the input is reached the underlying reader is closed and the
 * current line becomes {@code null}. Terminating operations also close the
 * reader unless {@link #autoClose(boolean) autoClose(false)} was called; any
 * read attempted after the reader was closed fails with an IOException.
 *
 * @author od
 */
public class TextParser implements AutoCloseable {

  /** Regular expression separating tokens by one or more white spaces. */
  public static final String WS_SEP = "\\s+";
  /** Regular expression separating tokens by a comma with optional white space around it. */
  public static final String COMMA_SEP = "\\s*,\\s*";

  BufferedReader r;
  // The current line; "" before the first read, null once the input is exhausted.
  String line = "";
  // Name of the input, only used in error messages.
  String name;
  // Number of read attempts so far (the attempt that hits the end is counted too).
  int lineno;
  boolean autoclose = true;
  boolean isClosed = false;


  /**
   * Create a parser reading from a file.
   *
   * @param file the file to read
   * @throws FileNotFoundException if the file cannot be opened for reading
   */
  public TextParser(File file) throws FileNotFoundException {
    r = new BufferedReader(new FileReader(file));
    name = file.toString();
  }


  /**
   * Create a parser reading from a file with an explicit read buffer size.
   *
   * @param file the file to read
   * @param buffsz the buffer size handed to the BufferedReader
   * @throws FileNotFoundException if the file cannot be opened for reading
   */
  public TextParser(File file, int buffsz) throws FileNotFoundException {
    r = new BufferedReader(new FileReader(file), buffsz);
    name = file.toString();
  }


  /**
   * Create a parser reading from a string.
   *
   * @param content the text to parse
   * @param name a name for the content, used in error messages
   */
  public TextParser(String content, String name) {
    r = new BufferedReader(new StringReader(content));
    this.name = name;
  }


  /**
   * Advance to the next line.
   *
   * @return this instance
   * @throws IOException if reading fails or the parser is already closed
   */
  public TextParser nextLine() throws IOException {
    return nextLine(1);
  }


  /**
   * Advance to the next line that is not blank. If there is none, the current
   * line is {@code null} afterwards.
   *
   * @return this instance
   * @throws IOException if reading fails or the parser is already closed
   */
  public TextParser nextLineSkipEmpty() throws IOException {
    do {
      nextLine(1);
    } while (line != null && line.trim().isEmpty());
    return this;
  }


  /**
   * Advance by a number of lines.
   *
   * @param lines the number of lines to advance, must be at least 1
   * @return this instance
   * @throws IllegalArgumentException if {@code lines} is less than 1
   * @throws IOException if reading fails or a read is attempted after the
   *         end of the input closed the parser
   */
  public TextParser nextLine(int lines) throws IOException {
    if (lines < 1) {
      throw new IllegalArgumentException("error: lines < 1");
    }
    String err = "Cannot skip " + lines + " in " + name;
    for (int i = 0; i < lines; i++) {
      line = readLine(err);
    }
    return this;
  }


  /**
   * Advance to the next line containing the text. If there is no such line
   * the input is consumed and the current line is {@code null}.
   *
   * @param text the text to look for
   * @return this instance
   * @throws IOException if reading fails or the parser is already closed
   */
  public TextParser toLineContaining(String text) throws IOException {
    String err = "Not found in " + name + ": " + text;
    do {
      line = readLine(err);
    } while (line != null && !line.contains(text));
    return this;
  }


  /**
   * Advance to the next line starting with the text. If there is no such line
   * the input is consumed and the current line is {@code null}.
   *
   * @param text the prefix to look for
   * @return this instance
   * @throws IOException if reading fails or the parser is already closed
   */
  public TextParser toLineStartingWith(String text) throws IOException {
    String err = "Not found in " + name + ": " + text;
    do {
      line = readLine(err);
    } while (line != null && !line.startsWith(text));
    return this;
  }


  /**
   * Misspelled predecessor of {@link #toLineStartingWith(String)}, kept so
   * that existing callers continue to work.
   *
   * @param text the prefix to look for
   * @return this instance
   * @throws IOException if reading fails or the parser is already closed
   */
  public TextParser toLineStaringWith(String text) throws IOException {
    return toLineStartingWith(text);
  }


  /**
   * Advance to the next line that matches the regular expression as a whole.
   * If there is no such line the input is consumed and the current line is
   * {@code null}.
   *
   * @param regex the regular expression the entire line has to match
   * @return this instance
   * @throws IOException if reading fails or the parser is already closed
   */
  public TextParser toLineMatching(String regex) throws IOException {
    String err = "No match found in " + name + ": " + regex;
    Pattern p = Pattern.compile(regex);
    do {
      line = readLine(err);
    } while (line != null && !p.matcher(line).matches());
    return this;
  }


  /**
   * Read at least one line and keep reading while the line contains the text.
   * If the input ends while skipping, the current line is {@code null}.
   *
   * @param text the text marking lines to skip
   * @return this instance
   * @throws IOException if reading fails or the parser is already closed
   */
  public TextParser skipLinesContaining(String text) throws IOException {
    String err = "Skipping lines for" + name + ": " + text;
    do {
      line = readLine(err);
      // the null check stops at the end of the input instead of dereferencing null
    } while (line != null && line.contains(text));
    return this;
  }


  /**
   * Read at least one line and keep reading while the line starts with the
   * text. If the input ends while skipping, the current line is {@code null}.
   *
   * @param text the prefix marking lines to skip
   * @return this instance
   * @throws IOException if reading fails or the parser is already closed
   */
  public TextParser skipLinesStartingWith(String text) throws IOException {
    String err = "Skipping lines starting for" + name + ": " + text;
    do {
      line = readLine(err);
      // the null check stops at the end of the input instead of dereferencing null
    } while (line != null && line.startsWith(text));
    return this;
  }


  /**
   * Set this to false if terminators should not close the stream
   * @param autoclose if the terminating operation closes the stream
   * @return this instance
   */
  public TextParser autoClose(boolean autoclose) {
    this.autoclose = autoclose;
    return this;
  }


  /**
   * Reduce the current line to the part right of the first occurrence of the
   * text argument.
   * @param text the text to look for
   * @return this instance
   * @throws IllegalArgumentException if the text is not part of the line
   */
  public TextParser rightOfFirst(String text) {
    int st = line.indexOf(text);
    if (st == -1) {
      throw new IllegalArgumentException("text not found in " + line + ": " + text);
    }
    line = line.substring(st + text.length());
    return this;
  }


  /**
   * Reduce the current line to the part right of the last occurrence of the
   * text argument.
   * @param text the text to look for
   * @return this instance
   * @throws IllegalArgumentException if the text is not part of the line
   */
  public TextParser rightOfLast(String text) {
    int st = line.lastIndexOf(text);
    if (st == -1) {
      throw new IllegalArgumentException("text not found in " + line + ": " + text);
    }
    line = line.substring(st + text.length());
    return this;
  }


  /**
   * Reduce the current line to the part left of the first occurrence of the
   * text argument.
   * @param text the text to look for
   * @return this instance
   * @throws IllegalArgumentException if the text is not part of the line
   */
  public TextParser leftOfFirst(String text) {
    int st = line.indexOf(text);
    if (st == -1) {
      throw new IllegalArgumentException("text not found in " + line + ": " + text);
    }
    line = line.substring(0, st);
    return this;
  }


  /**
   * Reduce the current line to the part left of the last occurrence of the
   * text argument.
   * @param text the text to look for
   * @return this instance
   * @throws IllegalArgumentException if the text is not part of the line
   */
  public TextParser leftOfLast(String text) {
    int st = line.lastIndexOf(text);
    if (st == -1) {
      throw new IllegalArgumentException("text not found in " + line + ": " + text);
    }
    line = line.substring(0, st);
    return this;
  }


  /**
   * Create a new (!) TextParser with all the content from the current line
   * up to the next line containing the text. Both the current line and the
   * line containing 'text' are included. This parser is positioned on the
   * line containing 'text' afterwards.
   * @param text the text to look for
   * @return a new instance, or {@code null} if the input ended before a line
   *         containing the text was found.
   * @throws IOException if reading fails or the parser is already closed
   */
  public TextParser allUntil(String text) throws IOException {
    String err = "Not found in " + name + ": " + text;
    StringBuilder content = new StringBuilder().append(line).append('\n');
    do {
      line = readLine(err);
      if (line == null) {
        return null;
      }
      content.append(line).append('\n');
    } while (!line.contains(text));
    return new TextParser(content.toString(), "until");
  }


  // Terminating operations. They close the stream unless autoClose(false) was set.
  //
  /**
   * Split the current line at white spaces.
   *
   * @return the tokens of the current line
   */
  public Tokens tokens() {
    return tokens(WS_SEP);
  }


  /**
   * Split the trimmed current line using a regular expression.
   *
   * @param regex the separator expression, e.g. {@link #WS_SEP} or {@link #COMMA_SEP}
   * @return the tokens of the current line; no tokens if the line is {@code null}
   */
  public Tokens tokens(String regex) {
    autoclose();
    return new Tokens(line, regex);
  }


  /**
   * @return the current line, {@code null} after the end of the input
   */
  public String asString() {
    autoclose();
    return line;
  }


  /**
   * @return the current line parsed with Double.parseDouble
   */
  public double asDouble() {
    autoclose();
    return Double.parseDouble(line);
  }


  /**
   * @return the trimmed current line parsed with Integer.parseInt
   */
  public int asInteger() {
    autoclose();
    return Integer.parseInt(line.trim());
  }


  /**
   * Get the number of read attempts made so far. Note that this is a
   * terminating operation too.
   *
   * @return the line counter
   */
  public int getLineNo() {
    autoclose();
    return lineno;
  }


  /**
   * Get a single white space separated token of the current line.
   *
   * @param col the token column, starts with 0
   * @return the token, or {@code null} if the line has no such column
   */
  public String getWsTokenAt(int col) {
    autoclose();
    return extractToken(line, col);
  }


  private void autoclose() {
    if (autoclose) {
      close();
    }
  }


  /**
   * Close the underlying reader. A failure to close is ignored; the parser
   * is marked as closed in any case.
   */
  @Override
  public synchronized void close() {
    if (r != null) {
      try {
        r.close();
      } catch (IOException ignored) {
        // Best effort: nothing useful can be done if closing a reader fails.
      }
    }
    isClosed = true;
  }


  /**
   * @return true as long as the reader has not been closed
   */
  public boolean notEOF() {
    return !isClosed;
  }


  /**
   * @return true once the reader has been closed, be it by reaching the end
   *         of the input, by a terminating operation or by {@link #close()}
   */
  public boolean isEOF() {
    return isClosed;
  }


  // Read one line, closing the reader when the end of the input is reached.
  private String readLine(String err) throws IOException {
    if (isClosed) {
      throw new IOException(name + ": already closed. Use autoClose(false) to allow for successive reads. Do "
          + "not forget to close the stream at the end.\n" + err);
    }
    String l = r.readLine();
    if (l == null) {
      close();
    }
    lineno++;
    return l;
  }


  @Override
  public String toString() {
    return lineno + ":  '" + line + "'";
  }


  /**
   * Fast token extract. tokens are separated by any number of white spaces.
   * Tokens cannot contain any white spaces, as in csv.
   *
   * @param line the line to scan, may be {@code null}
   * @param col the column, starts with 0.
   * @return the token at column 'col', or {@code null} if the line is
   *         {@code null} or has fewer than col + 1 tokens
   * @throws IllegalArgumentException if col is negative
   */
  static String extractToken(String line, int col) {
    if (col < 0) {
      throw new IllegalArgumentException("col argument < 0.");
    }
    if (line == null) {
      return null;
    }
    int n = line.length();
    int pos = 0;
    for (int token = 0;; token++) {
      // skip the separator in front of the token
      while (pos < n && Character.isWhitespace(line.charAt(pos))) {
        pos++;
      }
      if (pos == n) {
        // ran out of input before reaching column 'col'
        return null;
      }
      int start = pos;
      while (pos < n && !Character.isWhitespace(line.charAt(pos))) {
        pos++;
      }
      if (token == col) {
        return line.substring(start, pos);
      }
    }
  }

//////////////
  /**
   * The tokens of one line. fromIndex and toIndex narrow the token list in
   * place; the remaining methods convert or aggregate the tokens.
   */
  public static class Tokens {

    String[] tok;
    static final String[] EMPTY = new String[]{};


    // A null line has no tokens. A blank line yields one empty token, which
    // is what String.split returns for an empty string.
    private Tokens(String line, String regex) {
      tok = (line == null) ? EMPTY : line.trim().split(regex);
    }


    /**
     * @return the number of tokens
     */
    public int count() {
      return tok.length;
    }


    /**
     * Find the index of val. in the token array.
     *
     * @param val the string to match (equals)
     * @return the index of val, or -1 if not existent.
     */
    public int indexOf(String val) {
      for (int i = 0; i < tok.length; i++) {
        if (tok[i].equals(val)) {
          return i;
        }
      }
      return -1;
    }


    /**
     * Drop all tokens in front of an index.
     *
     * @param b the index of the first token to keep; 0 keeps everything
     * @return this instance
     * @throws IllegalArgumentException if b is not a valid token index
     */
    public Tokens fromIndex(int b) {
      if (b == 0) {
        // nothing to drop, also valid if there are no tokens at all
        return this;
      }
      if (b < 0 || b > tok.length - 1) {
        throw new IllegalArgumentException("invalid begin index:" + b);
      }
      tok = Arrays.copyOfRange(tok, b, tok.length);
      return this;
    }


    /**
     * Drop tokens at the end: the last -e tokens are removed, at least one
     * token has to remain.
     *
     * @param e zero (keeps everything) or negative (counts from the end)
     * @return this instance
     * @throws IllegalArgumentException if e is positive or would remove all
     *         tokens
     */
    public Tokens toIndex(int e) {
      if (e == 0) {
        // nothing to drop, also valid if there are no tokens at all
        return this;
      }
      if (e > 0 || -e > tok.length - 1) {
        throw new IllegalArgumentException("invalid end index:" + e);
      }
      tok = Arrays.copyOfRange(tok, 0, tok.length + e);
      return this;
    }


    private DoubleStream dstream() {
      return Arrays.stream(tok).mapToDouble(Double::parseDouble);
    }


    private IntStream istream() {
      return Arrays.stream(tok).mapToInt(Integer::parseInt);
    }


    /**
     * @return the sum of all tokens parsed as double
     */
    public double sum() {
      return dstream().sum();
    }


    /**
     * @return the average of all tokens parsed as double
     * @throws java.util.NoSuchElementException if there are no tokens
     */
    public double average() {
      return dstream().average().getAsDouble();
    }


    /**
     * @return the smallest token parsed as double
     * @throws java.util.NoSuchElementException if there are no tokens
     */
    public double min() {
      return dstream().min().getAsDouble();
    }


    /**
     * @return the largest token parsed as double
     * @throws java.util.NoSuchElementException if there are no tokens
     */
    public double max() {
      return dstream().max().getAsDouble();
    }


    /**
     * @return all tokens parsed as double
     */
    public double[] asDoubleArray() {
      return dstream().toArray();
    }


    /**
     * @return all tokens parsed as int
     */
    public int[] asIntArray() {
      return istream().toArray();
    }


    /**
     * @return the internal token array itself (not a copy)
     */
    public String[] asStringArray() {
      return tok;
    }
  }

}
</PRE>
</PRE>