/*
* Quackle -- Crossword game artificial intelligence and analysis tool
* Copyright (C) 2005-2014 Jason Katz-Brown and John O'Laughlin.
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see .
*/
#include
#include
#include "gaddagfactory.h"
#include "util.h"
GaddagFactory::GaddagFactory(const QString& alphabetFile)
{
QuackleIO::FlexibleAlphabetParameters *flexure = new QuackleIO::FlexibleAlphabetParameters;
flexure->load(alphabetFile);
alphas = flexure;
// So the separator is sorted to last.
root.t = false;
root.c = QUACKLE_NULL_MARK; // "_"
root.pointer = 0;
root.lastchild = true;
}
void GaddagFactory::pushWord(const QString& word)
{
UVString originalString = QuackleIO::Util::qstringToString(word);
UVString leftover;
Quackle::LetterString encodedWord = alphas->encode(originalString, &leftover);
if (leftover.empty())
{
++m_encodableWords;
for (unsigned i = 1; i <= encodedWord.length(); i++)
{
Quackle::LetterString newword;
for (int j = i - 1; j >= 0; j--)
newword.push_back(encodedWord[j]);
if (i < encodedWord.length())
{
newword.push_back(internalSeparatorRepresentation); // "^"
for (unsigned j = i; j < encodedWord.length(); j++)
newword.push_back(encodedWord[j]);
}
gaddagizedWords.push_back(newword);
}
}
else
{
UVcout << "not encodable without leftover: " << originalString << endl;
++m_unencodableWords;
}
}
void GaddagFactory::generate()
{
Quackle::WordList::const_iterator wordsEnd = gaddagizedWords.end();
for (Quackle::WordList::const_iterator wordsIt = gaddagizedWords.begin(); wordsIt != wordsEnd; ++wordsIt)
root.pushWord(*wordsIt);
// for (const auto& words : gaddaggizedWords)
// root.pushWord(words);
}
void GaddagFactory::writeIndex(const QString& fname)
{
nodelist.push_back(&root);
root.print(nodelist, "");
ofstream out(QuackleIO::Util::qstringToStdString(fname).c_str(), ios::out | ios::binary);
for (size_t i = 0; i < nodelist.size(); i++)
{
unsigned int p = (unsigned int)(nodelist[i]->pointer);
if (p != 0)
p -= i; // offset indexing
char bytes[4];
unsigned char n1 = (p & 0x00FF0000) >> 16;
unsigned char n2 = (p & 0x0000FF00) >> 8;
unsigned char n3 = (p & 0x000000FF) >> 0;
unsigned char n4;
n4 = nodelist[i]->c;
if (n4 == internalSeparatorRepresentation)
n4 = QUACKLE_NULL_MARK;
if (nodelist[i]->t)
n4 |= 64;
if (nodelist[i]->lastchild)
n4 |= 128;
bytes[0] = n1; bytes[1] = n2; bytes[2] = n3; bytes[3] = n4;
out.write(bytes, 4);
}
}
void GaddagFactory::Node::print(vector< Node* > nodelist, Quackle::LetterString prefix)
{
if (children.size() > 0)
{
pointer = nodelist.size();
children[children.size() - 1].lastchild = true;
}
for (size_t i = 0; i < children.size(); i++)
nodelist.push_back(&children[i]);
for (size_t i = 0; i < children.size(); i++)
children[i].print(nodelist, prefix + children[i].c);
}
void GaddagFactory::Node::pushWord(Quackle::LetterString word)
{
if (word.length() == 0)
{
t = true;
return;
}
Quackle::Letter first = Quackle::String::front(word);
Quackle::LetterString rest = Quackle::String::allButFront(word);
int index = -1;
for (size_t i = 0; i < children.size(); i++)
{
if (children[i].c == first)
{
index = i;
i = children.size();
}
}
if (index == -1)
{
Node n;
n.c = first;
n.t = false;
n.pointer = 0;
n.lastchild = false;
children.push_back(n);
index = children.size() - 1;
}
children[index].pushWord(rest);
}