hacker-quotes/english.go

637 lines
14 KiB
Go

package hacker
import (
"encoding/json"
"fmt"
"io/ioutil"
"math/rand"
"strings"
"github.com/zorchenhimer/hacker-quotes/database"
"github.com/zorchenhimer/hacker-quotes/models"
)
type InitialData struct {
Adjectives [][]string
Nouns [][]string
Verbs [][]string
Pronouns [][]string
Sentences []string
}
type english struct {
db database.DB
currentPronoun string
}
func NewEnglish(db database.DB) (HackerQuotes, error) {
return &english{db: db}, nil
}
/*
Sentence format
{word_type:options}
{{word_type:new word:properties}}
{pronoun} can't {verb:i,present} {noun_phrase}, it {verb:it,future} {noun_phrase}!
{verb:you,present} {noun_phrase:indefinite}, then you can {verb:you,present} {noun_phrase:definite}!
{noun_phrase} {verb}. With {noun_phrase:indifinite,noadj,compound}!
{pronoun} {{verb:need:from_pronoun,present}} to {verb:i,present} {noun_phrase:definite}!
*/
func (g *english) Hack() (string, error) {
//var fmtString string = `{verb:you,present} {noun_phrase:definite} then you can {verb:you,present} {noun_phrase:definite}!`
//var str string = `{pronoun} {{verb:need:from_pronoun,present}} to {verb:i,present} {noun_phrase:definite}!`
str, err := g.randomSentence()
if err != nil {
return "", err
}
return g.HackThis(str)
}
func (g *english) HackThis(fmtString string) (string, error) {
var idx int
var err error
var nidx int
output := &strings.Builder{}
g.currentPronoun = ""
for idx < len(fmtString) {
if fmtString[idx] == '{' {
if fmtString[idx+1] == '{' {
nidx, err = g.consumeNewWord(fmtString, idx, output)
if err != nil {
return "", err
}
idx = nidx
continue
}
nidx, err = g.consumeWord(fmtString, idx, output)
if err != nil {
return "", err
}
idx = nidx
continue
}
nidx, err = g.consumeRaw(fmtString, idx, output)
if err != nil {
return "", err
}
idx = nidx
}
return toCap(output.String()), nil
}
func (g *english) consumeRaw(fmtString string, idx int, output *strings.Builder) (int, error) {
end := strings.Index(fmtString[idx:], "{")
if end == -1 {
output.WriteString(fmtString[idx:len(fmtString)])
return len(fmtString), nil
}
output.WriteString(fmtString[idx:end+idx])
return idx+end, nil
}
func (g *english) parseVerbOptions(optlist []string) (models.ConjugationType, models.ConjugationTime, bool) {
var ct models.ConjugationType = models.ConjugationType(rand.Intn(5) + 1)
if sliceContains(optlist, "i") {
ct = models.CT_I
} else if sliceContains(optlist, "you") {
ct = models.CT_You
} else if sliceContains(optlist, "it") {
ct = models.CT_It
} else if sliceContains(optlist, "we") {
ct = models.CT_We
} else if sliceContains(optlist, "they") {
ct = models.CT_They
}
var cm models.ConjugationTime = models.ConjugationTime(rand.Intn(3) + 1)
if sliceContains(optlist, "present") {
cm = models.CM_Present
} else if sliceContains(optlist, "past") {
cm = models.CM_Past
} else if sliceContains(optlist, "future") {
cm = models.CM_Future
}
var invert bool = rand.Int() % 2 == 0
if sliceContains(optlist, "invert") {
invert = true
}
//var regular bool = true
//if sliceContains(optlist, "irregular") {
// regular = false
//}
if sliceContains(optlist, "from_pronoun") {
switch g.currentPronoun {
case "he", "she", "it":
ct = models.CT_It
case "i":
ct = models.CT_I
case "you":
ct = models.CT_You
case "we":
ct = models.CT_We
case "they":
ct = models.CT_They
}
}
return ct, cm, invert
}
func (g *english) parseNounOptions(optlist []string) (bool, bool) {
var plural bool = rand.Int() % 2 == 0
if sliceContains(optlist, "plural") {
plural = true
} else if sliceContains(optlist, "singular") {
plural = false
}
var compound bool = rand.Int() % 2 == 0
if sliceContains(optlist, "compound") {
compound = true
} else if sliceContains(optlist, "simple") {
compound = false
}
return plural, compound
}
func (g *english) consumeNewWord(fmtString string, idx int, output *strings.Builder) (int, error) {
idx += 2
var wordtype string
var word string
var options string
end := strings.Index(fmtString[idx:], "}")
if end == -1 {
return 0, fmt.Errorf("[consumeNewWord] Unclosed definition starting at %d", idx)
}
end += idx
// Find the start of the new word
def := strings.Index(fmtString[idx:], ":")
if def == -1 {
return 0, fmt.Errorf("[consumeNewWord] Word definition missing word")
}
def += idx
wordtype = fmtString[idx:def]
// Find the start of the options
opts := strings.Index(fmtString[def+1:], ":")
if opts > -1 {
opts += def+2
options = fmtString[opts:end]
word = fmtString[def+1:opts-1]
} else {
word = fmtString[def+1:end]
}
//fmt.Printf("idx:%d def:%d opts:%d end:%d type:%q word:%q opts:%q\n",
// idx, def, opts, end,
// wordtype,
// word,
// options)
optlist := strings.Split(options, ",")
var formatted string
switch wordtype {
case "verb":
ct, cm, invert := g.parseVerbOptions(optlist)
v := models.Verb{
Regular: true,
Word: word,
}
formatted = v.Conjugate(ct, cm, invert)
case "noun":
plural, _ := g.parseNounOptions(optlist)
if plural {
n := models.Noun{
Regular: true,
Word: word,
}
formatted = n.Plural()
} else {
formatted = word
}
default:
// Pronouns and adjectives aren't implemented because they have no modifications to apply.
return 0, fmt.Errorf("Word type %q not implemented creating in-sentence", wordtype)
}
output.WriteString(formatted)
return end+2, nil
}
func (g *english) consumeWord(fmtString string, idx int, output *strings.Builder) (int, error) {
idx++
var wordtype string
var options string
end := strings.Index(fmtString[idx:], "}")
if end == -1 {
return 0, fmt.Errorf("[consumeWord] Unclosed definition starting at %d", idx)
}
end += idx
optsStart := strings.Index(fmtString[idx:end], ":")
if optsStart != -1 {
options = fmtString[optsStart+idx+1:end]
wordtype = fmtString[idx:optsStart+idx]
} else {
wordtype = fmtString[idx:end]
}
if wordtype == "" {
return 0, fmt.Errorf("[consumeWord] Missing word type at idx: %d", idx)
}
opts := strings.Split(options, ",")
var word string
var err error
switch wordtype {
case "pronoun":
var plural bool
if sliceContains(opts, "plural") {
plural = true
}
word, err = g.randomPronoun(plural)
if err != nil {
return 0, err
}
g.currentPronoun = word
case "verb":
ct, cm, invert := g.parseVerbOptions(opts)
word, err = g.randomVerb(ct, cm, invert)
if err != nil {
return 0, err
}
case "noun":
plural, compound := g.parseNounOptions(opts)
word, err = g.randomNoun(plural, compound)
if err != nil {
return 0, err
}
case "noun_phrase":
var definite bool = true
var hasAdj bool = true
var plural bool = false
var compound bool = false
if sliceContains(opts, "indefinite") {
definite = false
}
if sliceContains(opts, "noadj") {
hasAdj = false
}
if sliceContains(opts, "plural") {
plural = true
}
if sliceContains(opts, "compound") {
compound = true
}
word, err = g.nounPhrase(definite, hasAdj, plural, compound)
if err != nil {
return 0, err
}
case "adjective":
word, err = g.randomAdjective()
if err != nil {
return 0, err
}
default:
return 0, fmt.Errorf("[consumeWord] Invalid word type %s at %d", wordtype, idx)
}
output.WriteString(word)
return end+1, nil
}
func (g *english) nounPhrase(definite, hasAdj, plural, compound bool) (string, error){
adj := ""
var err error
if hasAdj {
adj, err = g.randomAdjective()
if err != nil {
return "", err
}
}
noun, err := g.randomNoun(plural, compound)
if err != nil {
return "", err
}
phrase := adj
if phrase != "" {
phrase += " " + noun
} else {
phrase = noun
}
if definite && !plural {
//fmt.Println("[nounPhrase] definite && !plural")
return "the " + phrase, nil
}
if !plural {
//fmt.Println("[nounPhrase] !plural")
return g.ana(phrase), nil
}
return phrase, nil
}
func (g *english) randomAdjective() (string, error) {
ids, err := g.db.GetAdjectiveIds()
if err != nil {
return "", fmt.Errorf("[adj] get IDs error: %v", err)
}
if len(ids) <= 0 {
return "", fmt.Errorf("No adjective IDs returned from database")
}
rid := int(rand.Int63n(int64(len(ids))))
//fmt.Printf("[adj] len(ids): %d; rid: %d; %d\n", len(ids), rid, ids[rid])
adj, err := g.db.GetAdjective(ids[rid])
if err != nil {
return "", fmt.Errorf("[adj] ID: %d; %v", ids[rid], err)
}
return adj.Word, nil
}
func (g *english) randomNoun(plural, compound bool) (string, error) {
var ids []int
var err error
if compound {
ids, err = g.db.GetNounIds(true, true, true)
if err != nil {
return "", fmt.Errorf("[noun] get IDs error: %v", err)
}
} else {
ids, err = g.db.GetNounIds(true, false, false)
if err != nil {
return "", fmt.Errorf("[noun] get IDs error: %v", err)
}
}
if len(ids) <= 0 {
return "", fmt.Errorf("No noun IDs returned from database")
}
rid := int(rand.Int63n(int64(len(ids))))
//fmt.Printf("[noun] len(ids): %d; rid: %d; ID: %d\n", len(ids), rid, ids[rid])
noun, err := g.db.GetNoun(ids[rid])
if err != nil {
return "", fmt.Errorf("[noun] ID: %d; %v", ids[rid], err)
}
if plural {
return noun.Plural(), nil
}
return noun.Word, nil
}
func (g *english) randomVerb(ctype models.ConjugationType, ctime models.ConjugationTime, invert bool) (string, error) {
ids, err := g.db.GetVerbIds()
if err != nil {
return "", fmt.Errorf("[verb] get IDs error: %v", err)
}
if len(ids) <= 0 {
return "", fmt.Errorf("No verb IDs returned from database")
}
rid := int(rand.Int63n(int64(len(ids))))
verb, err := g.db.GetVerb(ids[rid])
if err != nil {
return "", fmt.Errorf("[verb] ID: %d; %v", ids[rid], err)
}
return verb.Conjugate(ctype, ctime, invert), nil
}
func (g *english) randomPronoun(plural bool) (string, error) {
ids, err := g.db.GetPronounIds(plural)
if err != nil {
return "", fmt.Errorf("[pronoun] get IDs error: %v", err)
}
if len(ids) <= 0 {
return "", fmt.Errorf("No pronoun IDs returned from database")
}
rid := int(rand.Int63n(int64(len(ids))))
pronoun, err := g.db.GetPronoun(ids[rid])
if err != nil {
return "", fmt.Errorf("[pronoun] ID: %d; %v", ids[rid], err)
}
return pronoun.Word, nil
}
func (g *english) randomSentence() (string, error) {
ids, err := g.db.GetSentenceIds()
if err != nil {
return "", fmt.Errorf("[sentence] get IDs error: %v", err)
}
if len(ids) <= 0 {
return "", fmt.Errorf("[sentence] No sentence IDs returned from database")
}
rid := int(rand.Int63n(int64(len(ids))))
sentence, err := g.db.GetSentence(ids[rid])
if err != nil {
return "", fmt.Errorf("[sentence] ID: %d, %v", ids[rid], err)
}
return sentence, nil
}
func (g *english) InitData(filename string) error {
fmt.Printf("Initializing database with data in %q\n", filename)
if g.db == nil {
return fmt.Errorf("databse is nil!")
}
raw, err := ioutil.ReadFile(filename)
if err != nil {
return err
}
//data := map[string][]interface{}{}
data := InitialData{}
if err = json.Unmarshal(raw, &data); err != nil {
return err
}
if data.Adjectives == nil || len(data.Adjectives) == 0 {
return fmt.Errorf("Missing Adjectives in input data")
}
adjectives := []models.Adjective{}
for _, adj := range data.Adjectives {
t, word := adj[0], adj[1]
a := models.Adjective{Word: word}
if strings.Contains(t, "a") {
a.Absolute = true
}
if strings.Contains(t, "e") {
a.AppendEst = true
}
if strings.Contains(t, "m") {
a.AppendMore = true
}
adjectives = append(adjectives, a)
}
if data.Nouns == nil || len(data.Nouns) == 0 {
return fmt.Errorf("Missing nouns key in data")
}
nouns := []models.Noun{}
for _, noun := range data.Nouns {
t, word := noun[0], noun[1]
n := models.Noun{Word: word}
if strings.Contains(t, "m") {
n.Multiple = true
}
if strings.Contains(t, "b") {
n.Begin = true
}
if strings.Contains(t, "e") {
n.End = true
}
if strings.Contains(t, "a") {
n.Alone = true
}
if strings.Contains(t, "r") {
n.Regular = true
}
nouns = append(nouns, n)
}
if data.Verbs == nil || len(data.Verbs) == 0 {
return fmt.Errorf("Missing verbs key in data")
}
verbs := []models.Verb{}
for _, verb := range data.Verbs {
v := models.Verb{Word: verb[1]}
if strings.Contains(verb[0], "r") {
v.Regular = true
}
verbs = append(verbs, v)
}
if data.Pronouns == nil || len(data.Pronouns) == 0 {
return fmt.Errorf("Missing pronouns key in data")
}
pronouns := []models.Pronoun{}
for _, pro := range data.Pronouns {
p := models.Pronoun{Word: pro[1]}
if strings.Contains(pro[0], "p") {
p.Plural = true
}
pronouns = append(pronouns, p)
}
if data.Sentences == nil || len(data.Sentences) == 0 {
return fmt.Errorf("Missing sentences key in data")
}
return g.db.InitData(adjectives, nouns, verbs, pronouns, data.Sentences)
}
// Prepend "a", "an" or nothing to a phrase
func (g *english) ana(phrase string) string {
//fmt.Printf("[ana] phrase[0]: %s; %q\n", string(phrase[0]), phrase)
if strings.ContainsAny(string(phrase[0]), "aeiou") {
return "an " + phrase
}
return "a " + phrase
}
// toCap capitalizes the first word of each sentence in the input string.
func toCap(words string) string {
ret := strings.ToUpper(string(words[0])) + words[1:]
next := strings.Index(words, ". ")
if next == -1 {
return ret
}
for next+3 < len(words) {
newnext := strings.Index(words[next+1:], ". ")
ret = ret[0:next+2] + strings.ToUpper(string(ret[next+2])) + ret[next+3:]
if newnext == -1 {
break
}
next = newnext + next+1
}
return ret
}
func sliceContains(haystack []string, needle string) bool {
if len(haystack) == 0 {
return false
}
for _, item := range haystack {
if item == needle {
return true
}
}
return false
}