diff options
| author | student <student@192.168.1.186> | 2017-04-05 11:51:19 -0400 |
|---|---|---|
| committer | student <student@192.168.1.186> | 2017-04-05 11:51:19 -0400 |
| commit | 19e411314a757f029fd157cf9b2968b839c4f1d0 (patch) | |
| tree | a9c6a4eb6cce72f88ff58a70261ad0739d357130 /src/main/java/bjc | |
| parent | fe521df984a4bf1f6627401716e6b4558235bfb2 (diff) | |
Work on markup interface
Diffstat (limited to 'src/main/java/bjc')
| -rw-r--r-- | src/main/java/bjc/inflexion/EnglishUtils.java | 67 | ||||
| -rw-r--r-- | src/main/java/bjc/inflexion/InflectionML.java | 128 |
2 files changed, 195 insertions, 0 deletions
diff --git a/src/main/java/bjc/inflexion/EnglishUtils.java b/src/main/java/bjc/inflexion/EnglishUtils.java new file mode 100644 index 0000000..875d75e --- /dev/null +++ b/src/main/java/bjc/inflexion/EnglishUtils.java @@ -0,0 +1,67 @@ +/** + * (C) Copyright 2017 Benjamin Culkin. + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ +package bjc.inflexion; + +/** + * @author student + * + */ +public class EnglishUtils { + private static String[] smallNums = new String[] { "zero", "one", "two", "three", "four", "five", "six", "seven", + "eight", "nine", "ten" }; + + private static String[] summaryNums = new String[] { "no", "one", "a couple of", "a few", "several" }; + private static String[] endSummaryNums = new String[] { "no", "one", "a couple of", "a few", "several" }; + + private static int[] summaryMap = new int[] { + /* + * no + */ + 0, + /* + * one + */ + 1, + /* + * a couple of + */ + 2, + /* + * a few + */ + 3, 3, 3, + /* + * several + */ + 4, 4, 4, 4 }; + + public static String smallIntToWord(int num) { + if (num >= 0 && num <= 10) { + return smallNums[num]; + } + + return Integer.toString(num); + } + + public static String intSummarize(int num, boolean atEnd) { + String[] nums = atEnd ? endSummaryNums : summaryNums; + + if (num >= 0 && num < 10) { + return nums[summaryMap[num]]; + } else + return "many"; + } +} diff --git a/src/main/java/bjc/inflexion/InflectionML.java b/src/main/java/bjc/inflexion/InflectionML.java new file mode 100644 index 0000000..6ec78ba --- /dev/null +++ b/src/main/java/bjc/inflexion/InflectionML.java @@ -0,0 +1,128 @@ +/** + * (C) Copyright 2017 Benjamin Culkin. + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ +package bjc.inflexion; + +import java.util.Arrays; +import java.util.HashSet; +import java.util.Set; +import java.util.regex.Matcher; +import java.util.regex.Pattern; + +import bjc.inflexion.nouns.InflectionException; +import bjc.inflexion.nouns.Noun; +import bjc.inflexion.nouns.Nouns; + +/** + * @author student + * + */ +public class InflectionML { + private static Pattern FORM_MARKER = Pattern.compile("<(?<command>[#A])(?<options>[^:]*):(?<text>[^>]*)>"); + + /** + * Apply inflection to marked forms in the string. + * + * @param form + * The string to inflect. + * + * @param nounDB + * The source to load nouns from. + * + * @return The inflected string. + */ + public static String inflect(String form, Nouns nounDB) { + Matcher formMatcher = FORM_MARKER.matcher(form); + + StringBuffer formBuffer = new StringBuffer(); + + int curCount = 1; + boolean inflectSingular = true; + + while (formMatcher.find()) { + String command = formMatcher.group("command"); + String options = formMatcher.group("options"); + String text = formMatcher.group("text"); + + Set<String> optionSet = new HashSet<>(); + for (int i = 1; i <= options.length(); i++) { + optionSet.add(options.substring(i - 1, i)); + } + + switch (command) { + case "#": + try { + curCount = Integer.parseInt(text); + + if (curCount != 1) + inflectSingular = false; + else + inflectSingular = true; + + String rep = text; + + if (optionSet.contains("n")) { + if (curCount == 0) + rep = "no"; + } + + if (optionSet.contains("s")) { + if (curCount == 0) { + rep = "no"; + inflectSingular = true; + } + } + + if (optionSet.contains("a")) { + /* + * TODO implement a/an for nouns + */ + } + + boolean shouldOverride = !(rep.equals("no") || rep.equals("a") || rep.equals("an")); + if (optionSet.contains("w") && shouldOverride) { + rep = EnglishUtils.smallIntToWord(curCount); + } else if (optionSet.contains("f")) { + rep = EnglishUtils.intSummarize(curCount, false); + } + + formMatcher.appendReplacement(formBuffer, rep); + } catch (NumberFormatException nfex) { + throw new InflectionException("Count setter must take a number as a parameter", nfex); + } + + case "N": + Noun noun = nounDB.getNoun(text); + if (inflectSingular || optionSet.contains("s")) { + formMatcher.appendReplacement(formBuffer, noun.singular()); + } else if (optionSet.contains("p")) { + if (optionSet.contains("c")) { + formMatcher.appendReplacement(formBuffer, noun.classicalPlural()); + } else { + formMatcher.appendReplacement(formBuffer, noun.modernPlural()); + } + } + default: + String msg = String.format("Unknown command '%s'", command); + + throw new InflectionException(msg); + } + } + + formMatcher.appendTail(formBuffer); + + return formBuffer.toString(); + } +} |
