diff options
| author | bculkin2442 <bjculkin@mix.wvu.edu> | 2017-03-25 20:34:42 -0400 |
|---|---|---|
| committer | bculkin2442 <bjculkin@mix.wvu.edu> | 2017-03-25 20:34:42 -0400 |
| commit | b53c1ef47c438fb1144b961d1939c37a4bfe9120 (patch) | |
| tree | eec3e8737831dfa245fdee31fb4b25bffac03aff /BJC-Utils2/src/main/java/bjc/utils/ioutils | |
| parent | 9716b1ac09eb92c4ed001be4350d54b41b953239 (diff) | |
Separate general I/O from parsing.
Diffstat (limited to 'BJC-Utils2/src/main/java/bjc/utils/ioutils')
3 files changed, 503 insertions, 0 deletions
diff --git a/BJC-Utils2/src/main/java/bjc/utils/ioutils/BlockReader.java b/BJC-Utils2/src/main/java/bjc/utils/ioutils/BlockReader.java new file mode 100644 index 0000000..33bbbd5 --- /dev/null +++ b/BJC-Utils2/src/main/java/bjc/utils/ioutils/BlockReader.java @@ -0,0 +1,208 @@ +package bjc.utils.ioutils; + +import java.io.LineNumberReader; +import java.io.Reader; +import java.util.NoSuchElementException; +import java.util.Scanner; +import java.util.function.Consumer; +import java.util.regex.Pattern; + +/** + * Implements reading numbered blocks from a source. + * + * A block is a series of characters, seperated by some regular expression. + * + * NOTE: The EOF marker is always treated as a delimiter. You are expected to + * handle blocks that may be shorter than you expect. + * + * @author EVE + * + */ +public class BlockReader implements AutoCloseable { + /** + * Represents a block of text read in from a source. + * + * @author EVE + * + */ + public static class Block { + /** + * The contents of this block. + */ + public final String contents; + + /** + * The line of the source this block started on. + */ + public final int startLine; + + /** + * The line of the source this block ended on. + */ + public final int endLine; + + /** + * The number of this block. + */ + public final int blockNo; + + /** + * Create a new block. + * + * @param blockNo + * The number of this block. + * @param contents + * The contents of this block. + * @param startLine + * The line this block started on. + * @param endLine + * The line this block ended. + */ + public Block(int blockNo, String contents, int startLine, int endLine) { + this.contents = contents; + this.startLine = startLine; + this.endLine = endLine; + this.blockNo = blockNo; + } + + @Override + public int hashCode() { + final int prime = 31; + int result = 1; + + result = prime * result + blockNo; + result = prime * result + ((contents == null) ? 0 : contents.hashCode()); + result = prime * result + endLine; + result = prime * result + startLine; + + return result; + } + + @Override + public boolean equals(Object obj) { + if(this == obj) return true; + if(obj == null) return false; + if(!(obj instanceof Block)) return false; + + Block other = (Block) obj; + + if(blockNo != other.blockNo) return false; + + if(contents == null) { + if(other.contents != null) return false; + } else if(!contents.equals(other.contents)) return false; + + if(endLine != other.endLine) return false; + if(startLine != other.startLine) return false; + + return true; + } + + @Override + public String toString() { + return String.format("Block #%d (from lines %d to %d) length: %d characters", blockNo, startLine, + endLine, contents.length()); + } + } + + /* + * I/O source for blocks. + */ + private LineNumberReader lnReader; + private Scanner blockReader; + + /* + * The current block. + */ + private Block currBlock; + private int blockNo; + + /** + * Create a new block reader. + * + * @param blockDelim + * The pattern that separates blocks. Note that the end + * of file is always considered to end a block. + * + * @param source + * The source to read blocks from. + */ + public BlockReader(String blockDelim, Reader source) { + lnReader = new LineNumberReader(source); + + blockReader = new Scanner(lnReader); + + String pattern = String.format("(?:%s)|\\Z", blockDelim); + Pattern pt = Pattern.compile(pattern, Pattern.MULTILINE); + + blockReader.useDelimiter(pt); + } + + /** + * Check if this reader has an available block. + * + * @return Whether or not another block is available. + */ + public boolean hasNextBlock() { + return blockReader.hasNext(); + } + + /** + * Get the current block. + * + * @return The current block, or null if there is no current block. + */ + public Block getBlock() { + return currBlock; + } + + /** + * Move to the next block. + * + * @return Whether or not the next block was succesfully read. + */ + public boolean nextBlock() { + try { + int blockStartLine = lnReader.getLineNumber(); + String blockContents = blockReader.next(); + int blockEndLine = lnReader.getLineNumber(); + blockNo += 1; + + currBlock = new Block(blockNo, blockContents, blockStartLine, blockEndLine); + + return true; + } catch(NoSuchElementException nseex) { + return false; + } + } + + /** + * Execute an action for each remaining block. + * + * @param action + * The action to execute for each block + */ + public void forEachBlock(Consumer<Block> action) { + while(hasNextBlock()) { + nextBlock(); + + action.accept(currBlock); + } + } + + /** + * Retrieve the number of blocks that have been read so far. + * + * @return The number of blocks read so far. + */ + public int getBlockCount() { + return blockNo; + } + + @Override + public void close() throws Exception { + blockReader.close(); + + lnReader.close(); + } +} diff --git a/BJC-Utils2/src/main/java/bjc/utils/ioutils/RuleBasedConfigReader.java b/BJC-Utils2/src/main/java/bjc/utils/ioutils/RuleBasedConfigReader.java new file mode 100644 index 0000000..b4d56a1 --- /dev/null +++ b/BJC-Utils2/src/main/java/bjc/utils/ioutils/RuleBasedConfigReader.java @@ -0,0 +1,215 @@ +package bjc.utils.ioutils; + +import bjc.utils.data.IHolder; +import bjc.utils.data.IPair; +import bjc.utils.data.Identity; +import bjc.utils.data.Pair; +import bjc.utils.exceptions.UnknownPragmaException; +import bjc.utils.funcdata.FunctionalMap; +import bjc.utils.funcdata.FunctionalStringTokenizer; +import bjc.utils.funcdata.IMap; + +import java.io.InputStream; +import java.util.InputMismatchException; +import java.util.Scanner; +import java.util.function.BiConsumer; +import java.util.function.Consumer; + +/** + * This class parses a rules based config file, and uses it to drive a provided + * set of actions + * + * @author ben + * + * @param <E> + * The type of the state object to use + * + */ +public class RuleBasedConfigReader<E> { + // Function to execute when starting a rule + // Takes the tokenizer, and a pair of the read token and application + // state + private BiConsumer<FunctionalStringTokenizer, IPair<String, E>> start; + + // Function to use when continuing a rule + // Takes a tokenizer and application state + private BiConsumer<FunctionalStringTokenizer, E> continueRule; + + // Function to use when ending a rule + // Takes an application state + private Consumer<E> end; + + // Map of pragma names to pragma actions + // Pragma actions are functions taking a tokenizer and application state + private IMap<String, BiConsumer<FunctionalStringTokenizer, E>> pragmas; + + /** + * Create a new rule-based config reader + * + * @param start + * The action to fire when starting a rule + * @param continueRule + * The action to fire when continuing a rule + * @param end + * The action to fire when ending a rule + */ + public RuleBasedConfigReader(BiConsumer<FunctionalStringTokenizer, IPair<String, E>> start, + BiConsumer<FunctionalStringTokenizer, E> continueRule, Consumer<E> end) { + this.start = start; + this.continueRule = continueRule; + this.end = end; + + this.pragmas = new FunctionalMap<>(); + } + + /** + * Add a pragma to this reader + * + * @param name + * The name of the pragma to add + * @param action + * The function to execute when this pragma is read + */ + public void addPragma(String name, BiConsumer<FunctionalStringTokenizer, E> action) { + if(name == null) + throw new NullPointerException("Pragma name must not be null"); + else if(action == null) throw new NullPointerException("Pragma action must not be null"); + + pragmas.put(name, action); + } + + private void continueRule(E state, boolean isRuleOpen, String line) { + // Make sure our input is correct + if(isRuleOpen == false) + throw new InputMismatchException("Cannot continue rule with no rule open"); + else if(continueRule == null) + throw new InputMismatchException("Rule continuation not supported for current grammar"); + + // Accept the rule + continueRule.accept(new FunctionalStringTokenizer(line.substring(1), " "), state); + } + + private boolean endRule(E state, boolean isRuleOpen) { + // Ignore blank line without an open rule + if(isRuleOpen == false) + // Do nothing + return false; + else { + // Nothing happens on rule end + if(end != null) { + // Process the rule ending + end.accept(state); + } + + // Return a closed rule + return false; + } + } + + /** + * Run a stream through this reader + * + * @param input + * The stream to get input + * @param initialState + * The initial state of the reader + * @return The final state of the reader + */ + public E fromStream(InputStream input, E initialState) { + if(input == null) throw new NullPointerException("Input stream must not be null"); + + // Application state: We're giving this back later + E state = initialState; + + // Prepare our input source + try(Scanner source = new Scanner(input)) { + source.useDelimiter("\n"); + // This is true when a rule's open + IHolder<Boolean> isRuleOpen = new Identity<>(false); + + // Do something for every line of the file + source.forEachRemaining((line) -> { + // Skip comment lines + if(line.startsWith("#") || line.startsWith("//")) + // It's a comment + return; + else if(line.equals("")) { + // End the rule + isRuleOpen.replace(endRule(state, isRuleOpen.getValue())); + } else if(line.startsWith("\t")) { + // Continue the rule + continueRule(state, isRuleOpen.getValue(), line); + } else { + // Open a rule + isRuleOpen.replace(startRule(state, isRuleOpen.getValue(), line)); + } + }); + } + + // Return the state that the user has created + return state; + + } + + /** + * Set the action to execute when continuing a rule + * + * @param continueRule + * The action to execute on continuation of a rule + */ + public void setContinueRule(BiConsumer<FunctionalStringTokenizer, E> continueRule) { + this.continueRule = continueRule; + } + + /** + * Set the action to execute when ending a rule + * + * @param end + * The action to execute on ending of a rule + */ + public void setEndRule(Consumer<E> end) { + this.end = end; + } + + /** + * Set the action to execute when starting a rule + * + * @param start + * The action to execute on starting of a rule + */ + public void setStartRule(BiConsumer<FunctionalStringTokenizer, IPair<String, E>> start) { + if(start == null) throw new NullPointerException("Action on rule start must be non-null"); + + this.start = start; + } + + private boolean startRule(E state, boolean isRuleOpen, String line) { + // Create the line tokenizer + FunctionalStringTokenizer tokenizer = new FunctionalStringTokenizer(line, " "); + + // Get the initial token + String nextToken = tokenizer.nextToken(); + + // Handle pragmas + if(nextToken.equals("pragma")) { + // Get the pragma name + String token = tokenizer.nextToken(); + + // Handle pragmas + pragmas.getOrDefault(token, (tokenzer, stat) -> { + throw new UnknownPragmaException("Unknown pragma " + token); + }).accept(tokenizer, state); + } else { + // Make sure input is correct + if(isRuleOpen == true) + throw new InputMismatchException("Nested rules are currently not supported"); + + // Start a rule + start.accept(tokenizer, new Pair<>(nextToken, state)); + + isRuleOpen = true; + } + + return isRuleOpen; + } +} diff --git a/BJC-Utils2/src/main/java/bjc/utils/ioutils/RuleBasedReaderPragmas.java b/BJC-Utils2/src/main/java/bjc/utils/ioutils/RuleBasedReaderPragmas.java new file mode 100644 index 0000000..f19eb2c --- /dev/null +++ b/BJC-Utils2/src/main/java/bjc/utils/ioutils/RuleBasedReaderPragmas.java @@ -0,0 +1,80 @@ +package bjc.utils.ioutils; + +import bjc.utils.exceptions.PragmaFormatException; +import bjc.utils.funcdata.FunctionalStringTokenizer; +import bjc.utils.funcutils.ListUtils; + +import java.util.function.BiConsumer; + +/** + * Contains factory methods for common pragma types + * + * @author ben + * + */ +public class RuleBasedReaderPragmas { + + /** + * Creates a pragma that takes a single integer argument + * + * @param <StateType> + * The type of state that goes along with this pragma + * @param name + * The name of this pragma, for error message purpose + * @param consumer + * The function to invoke with the parsed integer + * @return A pragma that functions as described above. + */ + public static <StateType> BiConsumer<FunctionalStringTokenizer, StateType> buildInteger(String name, + BiConsumer<Integer, StateType> consumer) { + return (tokenizer, state) -> { + // Check our input is correct + if(!tokenizer.hasMoreTokens()) + throw new PragmaFormatException("Pragma " + name + " requires one integer argument"); + + // Read the argument + String token = tokenizer.nextToken(); + + try { + // Run the pragma + consumer.accept(Integer.parseInt(token), state); + } catch(NumberFormatException nfex) { + // Tell the user their argument isn't correct + PragmaFormatException pfex = new PragmaFormatException( + "Argument " + token + " to " + name + " pragma isn't a valid integer. " + + "This pragma requires a integer argument"); + + pfex.initCause(nfex); + + throw pfex; + } + }; + } + + /** + * Creates a pragma that takes any number of arguments and collapses + * them all into a single string + * + * @param <StateType> + * The type of state that goes along with this pragma + * @param name + * The name of this pragma, for error message purpose + * @param consumer + * The function to invoke with the parsed string + * @return A pragma that functions as described above. + */ + public static <StateType> BiConsumer<FunctionalStringTokenizer, StateType> buildStringCollapser(String name, + BiConsumer<String, StateType> consumer) { + return (tokenizer, state) -> { + // Check our input + if(!tokenizer.hasMoreTokens()) throw new PragmaFormatException( + "Pragma " + name + " requires one or more string arguments"); + + // Build our argument + String collapsed = ListUtils.collapseTokens(tokenizer.toList()); + + // Run the pragma + consumer.accept(collapsed, state); + }; + } +} |
