From 9306cb60c32082c5403931de0823a9fd5daa196c Mon Sep 17 00:00:00 2001 From: Jason Katz-Brown Date: Sun, 25 Aug 2013 02:17:13 -0700 Subject: Initial git commit. --- encodeleaves/encodeleaves.cpp | 113 ++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 113 insertions(+) create mode 100644 encodeleaves/encodeleaves.cpp (limited to 'encodeleaves/encodeleaves.cpp') diff --git a/encodeleaves/encodeleaves.cpp b/encodeleaves/encodeleaves.cpp new file mode 100644 index 0000000..882684e --- /dev/null +++ b/encodeleaves/encodeleaves.cpp @@ -0,0 +1,113 @@ +/* + * Quackle -- Crossword game artificial intelligence and analysis tool + * Copyright (C) 2005-2006 Jason Katz-Brown and John O'Laughlin. + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation; either version 2 of the License, or + * (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program; if not, write to the Free Software + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA + * 02110-1301 USA + */ + +#include +#include +#include +#include +#include + +#include + +#include +#include +#include + +using namespace std; + +int main(int argc, char **argv) { + QCoreApplication a(argc, argv); + + GetOpt opts; + QString alphabet; + opts.addOption('a', "alphabet", &alphabet); + if (!opts.parse()) + return 1; + + if (alphabet.isNull()) + alphabet = "english"; + + Quackle::AlphabetParameters *alphas = 0; + QString alphabetFile = QString("../data/alphabets/%1.quackle_alphabet").arg(alphabet); + UVcout << "Using alphabet file: " << QuackleIO::Util::qstringToString(alphabetFile) << endl; + QuackleIO::FlexibleAlphabetParameters *flexure = new QuackleIO::FlexibleAlphabetParameters; + flexure->load(alphabetFile); + alphas = flexure; + + QString leavesFilename = "superleaves.raw"; + QFile file(leavesFilename); + if (!file.exists()) + { + UVcout << "leaves file does not exist: " << QuackleIO::Util::qstringToString(leavesFilename) << endl; + return false; + } + + if (!file.open(QIODevice::ReadOnly | QIODevice::Text)) + { + UVcout << "Could not open " << QuackleIO::Util::qstringToString(leavesFilename) << endl; + return false; + } + + QTextStream stream(&file); + stream.setCodec(QTextCodec::codecForName("UTF-8")); + + ofstream out("encoded"); + + int encodableLeaves = 0; + int unencodableLeaves = 0; + + while (!stream.atEnd()) { + QString leaveQString; + stream >> leaveQString; + double value; + stream >> value; + //UVcout << "value: " << value << endl; + + UVString leaveString = QuackleIO::Util::qstringToString(leaveQString); + + if (stream.atEnd()) + break; + + //UVcout << "read original string: " << originalString << endl; + UVString leftover; + Quackle::LetterString encodedLeave = alphas->encode(leaveString, &leftover); + if (leftover.empty()) + { + unsigned char leavelength = encodedLeave.length(); + out.write((char*)(&leavelength), 1); + out.write(encodedLeave.begin(), encodedLeave.length()); + unsigned short int intvalue = (value + 128) * 256; + //UVcout << "intvalue: " << intvalue << endl; + out.write((char*)(&intvalue), 2); + ++encodableLeaves; + } + else + { + //UVcout << "not encodable without leftover: " << originalString << endl; + ++unencodableLeaves; + } + } + + file.close(); + delete alphas; + + UVcout << "encodable leaves: " << encodableLeaves << ", unencodable leaves: " << unencodableLeaves << endl; + +} -- cgit v1.2.3