/*
* Copyright (c) 2008, 2009, 2010, 2011
* Jonathan Schleifer <js@webkeks.org>
*
* All rights reserved.
*
* This file is part of ObjFW. It may be distributed under the terms of the
* Q Public License 1.0, which can be found in the file LICENSE.QPL included in
* the packaging of this file.
*
* Alternatively, it may be distributed under the terms of the GNU General
* Public License, either version 2 or 3, which can be found in the file
* LICENSE.GPLv2 or LICENSE.GPLv3 respectively included in the packaging of this
* file.
*/
#include "config.h"
#include <string.h>
#import "OFString.h"
#import "OFArray.h"
#import "OFFile.h"
#import "OFAutoreleasePool.h"
#import "OFApplication.h"
#import "OFExceptions.h"
#import "TableGenerator.h"
#import "copyright.h"
OF_APPLICATION_DELEGATE(TableGenerator)
@implementation TableGenerator
/*
 * Initializes a new generator.
 *
 * All three table sizes start out as SIZE_MAX. -writeTablesToFileAtPath:
 * overwrites each of them with the index of the last used page and then
 * increments them; starting at SIZE_MAX presumably lets that increment wrap
 * around to 0 for a table in which no page is used (assumes the ivars are
 * unsigned and as wide as size_t -- confirm against TableGenerator.h).
 */
- init
{
	self = [super init];

	upperTableSize = lowerTableSize = casefoldingTableSize = SIZE_MAX;

	return self;
}
/*
 * Application entry point: creates a fresh TableGenerator, feeds it
 * UnicodeData.txt and CaseFolding.txt from the current directory and lets it
 * write ../src/unicode.m and ../src/unicode.h.
 *
 * The header has to be written after the tables, because the table sizes it
 * emits are only finalized by -writeTablesToFileAtPath:.
 */
- (void)applicationDidFinishLaunching
{
	TableGenerator *generator = [[TableGenerator alloc] init];

	[generator autorelease];

	/* Input */
	[generator readUnicodeDataFileAtPath: @"UnicodeData.txt"];
	[generator readCaseFoldingFileAtPath: @"CaseFolding.txt"];

	/* Output */
	[generator writeTablesToFileAtPath: @"../src/unicode.m"];
	[generator writeHeaderToFileAtPath: @"../src/unicode.h"];
}
/*
 * Reads the upper- and lowercase mappings from the file at the specified path.
 *
 * Every line has to consist of exactly 15 fields separated by ';'. Field 0 is
 * the code point, field 12 is stored as its uppercase mapping and field 13 as
 * its lowercase mapping; all three are parsed as hexadecimal.
 *
 * A line with a different number of fields, or with a code point outside the
 * range covered by the tables (0 - 0x10FFFF), is reported on of_stderr and the
 * application is terminated with status 1.
 */
- (void)readUnicodeDataFileAtPath: (OFString*)path
{
	OFAutoreleasePool *pool = [[OFAutoreleasePool alloc] init], *pool2;
	OFFile *file = [OFFile fileWithPath: path
				       mode: @"rb"];
	OFString *line;

	/*
	 * Inner pool which is drained after every line, so that temporaries
	 * do not pile up while the whole file is processed. It is never
	 * released explicitly; presumably releasing the outer pool takes care
	 * of it -- confirm against OFAutoreleasePool.
	 */
	pool2 = [[OFAutoreleasePool alloc] init];

	while ((line = [file readLine])) {
		OFArray *splitted;
		OFString **splitted_carray;
		of_unichar_t codep;

		splitted = [line componentsSeparatedByString: @";"];
		if ([splitted count] != 15) {
			[of_stderr writeFormat: @"Invalid line: %s\n",
						[line cString]];
			[OFApplication terminateWithStatus: 1];
		}
		splitted_carray = [splitted cArray];

		codep = [splitted_carray[0] hexadecimalValue];

		/*
		 * The code point is used as an index below. The writer
		 * iterates over 0x110000 entries per table, so anything
		 * beyond that would be an out-of-bounds write.
		 */
		if (codep >= 0x110000) {
			[of_stderr writeFormat: @"Code point out of range: "
						@"%s\n", [line cString]];
			[OFApplication terminateWithStatus: 1];
		}

		upperTable[codep] = [splitted_carray[12] hexadecimalValue];
		lowerTable[codep] = [splitted_carray[13] hexadecimalValue];

		[pool2 releaseObjects];
	}

	[pool release];
}
/*
 * Reads the case folding mappings from the file at the specified path.
 *
 * Empty lines and lines starting with '#' are skipped. Every other line has
 * to consist of exactly 4 fields separated by "; ": field 0 is the code
 * point, field 1 the status and field 2 the mapping. Only entries with status
 * "S" or "C" are stored; entries with any other status are ignored.
 *
 * A line with a different number of fields, or with a code point outside the
 * range covered by the table (0 - 0x10FFFF), is reported on of_stderr and the
 * application is terminated with status 1.
 */
- (void)readCaseFoldingFileAtPath: (OFString*)path
{
	OFAutoreleasePool *pool = [[OFAutoreleasePool alloc] init], *pool2;
	OFFile *file = [OFFile fileWithPath: path
				       mode: @"rb"];
	OFString *line;

	/*
	 * Inner pool which is drained after every line, so that temporaries
	 * do not pile up while the whole file is processed. It is never
	 * released explicitly; presumably releasing the outer pool takes care
	 * of it -- confirm against OFAutoreleasePool.
	 */
	pool2 = [[OFAutoreleasePool alloc] init];

	while ((line = [file readLine])) {
		OFArray *splitted;
		OFString **splitted_carray;
		of_unichar_t codep;

		/*
		 * An empty line has no character at index 0, so it needs to
		 * be checked for before looking at the first character.
		 */
		if ([line isEqual: @""] ||
		    [line characterAtIndex: 0] == '#') {
			[pool2 releaseObjects];
			continue;
		}

		splitted = [line componentsSeparatedByString: @"; "];
		if ([splitted count] != 4) {
			[of_stderr writeFormat: @"Invalid line: %s\n",
						[line cString]];
			[OFApplication terminateWithStatus: 1];
		}
		splitted_carray = [splitted cArray];

		/* Only entries with status S or C are of interest */
		if (![splitted_carray[1] isEqual: @"S"] &&
		    ![splitted_carray[1] isEqual: @"C"]) {
			[pool2 releaseObjects];
			continue;
		}

		codep = [splitted_carray[0] hexadecimalValue];

		/*
		 * The code point is used as an index below. The writer
		 * iterates over 0x110000 entries per table, so anything
		 * beyond that would be an out-of-bounds write.
		 */
		if (codep >= 0x110000) {
			[of_stderr writeFormat: @"Code point out of range: "
						@"%s\n", [line cString]];
			[OFApplication terminateWithStatus: 1];
		}

		casefoldingTable[codep] = [splitted_carray[2] hexadecimalValue];

		[pool2 releaseObjects];
	}

	[pool release];
}
/*
 * Returns whether at least one of the 0x100 entries of the specified page is
 * not 0.
 */
static BOOL
page_has_entries(const of_unichar_t *entries)
{
	size_t k;

	for (k = 0; k < 0x100; k++)
		if (entries[k] != 0)
			return YES;

	return NO;
}

/*
 * Writes the 0x100 entries of a page to f as a static array called
 * <prefix>_page_<page>, 8 values per line.
 */
static void
write_page(OFFile *f, const char *prefix, of_unichar_t page,
    const of_unichar_t *entries)
{
	size_t k;

	[f writeString: [OFString stringWithFormat:
	    @"static const of_unichar_t %s_page_%u[0x100] = {\n",
	    prefix, page]];

	for (k = 0; k < 0x100; k += 8)
		[f writeString: [OFString stringWithFormat:
		    @"\t%u, %u, %u, %u, %u, %u, %u, %u,\n",
		    entries[k], entries[k + 1],
		    entries[k + 2], entries[k + 3],
		    entries[k + 4], entries[k + 5],
		    entries[k + 6], entries[k + 7]]];

	[f writeString: @"};\n\n"];
}

/*
 * Writes the separator which follows entry number index of a page pointer
 * table with count entries: nothing after the last entry, a line break after
 * every fourth entry and ", " otherwise.
 */
static void
write_separator(OFFile *f, size_t index, size_t count)
{
	if (index + 1 >= count)
		return;

	if ((index + 1) % 4 == 0)
		[f writeString: @",\n\t"];
	else
		[f writeString: @", "];
}

/*
 * Writes the generated source file containing the case tables to the
 * specified path.
 *
 * The code point range 0 - 0x10FFFF is split into pages of 0x100 entries.
 * For each table, only pages containing at least one non-zero entry are
 * written as an array of their own; all other pages share nop_page. After the
 * pages, one pointer table per mapping is written, which only reaches up to
 * the last page that is in use.
 *
 * A case folding page which is identical to the lowercase page of the same
 * number is not written again; the case folding pointer table refers to the
 * lowercase page instead. casefoldingTableUsed therefore holds 1 for a page
 * that has its own cf_page_ array and 2 for a page that reuses lower_page_.
 *
 * Side effect: upperTableSize, lowerTableSize and casefoldingTableSize are
 * set to the number of entries of the respective pointer table.
 * -writeHeaderToFileAtPath: emits these values, so this method has to be
 * called first.
 */
- (void)writeTablesToFileAtPath: (OFString*)file
{
	OFAutoreleasePool *pool = [[OFAutoreleasePool alloc] init], *pool2;
	of_unichar_t i;
	OFFile *f = [OFFile fileWithPath: file
				    mode: @"wb"];

	[f writeString: COPYRIGHT
	    @"#include \"config.h\"\n"
	    @"\n"
	    @"#import \"OFString.h\"\n\n"
	    @"static const of_unichar_t nop_page[0x100] = {};\n\n"];

	/* Inner pool which is drained regularly to get rid of temporaries */
	pool2 = [[OFAutoreleasePool alloc] init];

	/* Write upper_page_%u */
	for (i = 0; i < 0x110000; i += 0x100) {
		if (!page_has_entries(upperTable + i))
			continue;

		upperTableSize = i >> 8;
		upperTableUsed[upperTableSize] = YES;

		write_page(f, "upper", i >> 8, upperTable + i);
		[pool2 releaseObjects];
	}

	/* Write lower_page_%u */
	for (i = 0; i < 0x110000; i += 0x100) {
		if (!page_has_entries(lowerTable + i))
			continue;

		lowerTableSize = i >> 8;
		lowerTableUsed[lowerTableSize] = YES;

		write_page(f, "lower", i >> 8, lowerTable + i);
		[pool2 releaseObjects];
	}

	/* Write cf_page_%u if it does NOT match lower_page_%u */
	for (i = 0; i < 0x110000; i += 0x100) {
		BOOL sameAsLower;

		if (!page_has_entries(casefoldingTable + i))
			continue;

		sameAsLower = (memcmp(lowerTable + i, casefoldingTable + i,
		    0x100 * sizeof(of_unichar_t)) == 0);

		casefoldingTableSize = i >> 8;
		casefoldingTableUsed[casefoldingTableSize] =
		    (sameAsLower ? 2 : 1);

		/* The lowercase page is reused, so there is nothing to write */
		if (sameAsLower)
			continue;

		write_page(f, "cf", i >> 8, casefoldingTable + i);
		[pool2 releaseObjects];
	}

	/*
	 * Those are currently set to the last index.
	 * But from now on, we need the size.
	 */
	upperTableSize++;
	lowerTableSize++;
	casefoldingTableSize++;

	/*
	 * The sizes are initialized from SIZE_MAX in -init, so they are
	 * presumably wider than the unsigned int that %X expects. They are
	 * therefore cast explicitly when passed as a variadic argument.
	 */

	/* Write of_unicode_upper_table */
	[f writeString: [OFString stringWithFormat:
	    @"const of_unichar_t* const of_unicode_upper_table[0x%X] = {\n\t",
	    (unsigned int)upperTableSize]];

	for (i = 0; i < upperTableSize; i++) {
		if (upperTableUsed[i]) {
			[f writeString: [OFString stringWithFormat:
			    @"upper_page_%u", i]];
			[pool2 releaseObjects];
		} else
			[f writeString: @"nop_page"];

		write_separator(f, i, upperTableSize);
	}

	[f writeString: @"\n};\n\n"];

	/* Write of_unicode_lower_table */
	[f writeString: [OFString stringWithFormat:
	    @"const of_unichar_t* const of_unicode_lower_table[0x%X] = {\n\t",
	    (unsigned int)lowerTableSize]];

	for (i = 0; i < lowerTableSize; i++) {
		if (lowerTableUsed[i]) {
			[f writeString: [OFString stringWithFormat:
			    @"lower_page_%u", i]];
			[pool2 releaseObjects];
		} else
			[f writeString: @"nop_page"];

		write_separator(f, i, lowerTableSize);
	}

	[f writeString: @"\n};\n\n"];

	/* Write of_unicode_casefolding_table */
	[f writeString: [OFString stringWithFormat:
	    @"const of_unichar_t* const of_unicode_casefolding_table[0x%X] = {"
	    @"\n\t", (unsigned int)casefoldingTableSize]];

	for (i = 0; i < casefoldingTableSize; i++) {
		if (casefoldingTableUsed[i] == 1) {
			[f writeString: [OFString stringWithFormat:
			    @"cf_page_%u", i]];
			[pool2 releaseObjects];
		} else if (casefoldingTableUsed[i] == 2) {
			/* Identical to the lowercase page, so reuse that */
			[f writeString: [OFString stringWithFormat:
			    @"lower_page_%u", i]];
			[pool2 releaseObjects];
		} else
			[f writeString: @"nop_page"];

		write_separator(f, i, casefoldingTableSize);
	}

	[f writeString: @"\n};\n"];

	[pool release];
}
/*
 * Writes the header belonging to the generated tables to the specified path.
 *
 * The header defines the size of each of the three page pointer tables and
 * declares the tables themselves as extern.
 *
 * The sizes are taken from upperTableSize, lowerTableSize and
 * casefoldingTableSize as they are at the time of the call. They only hold
 * the final sizes after -writeTablesToFileAtPath: has run, so that method has
 * to be called before this one.
 */
- (void)writeHeaderToFileAtPath: (OFString*)file
{
	OFAutoreleasePool *pool = [[OFAutoreleasePool alloc] init];
	OFFile *f = [OFFile fileWithPath: file
				    mode: @"wb"];

	[f writeString: COPYRIGHT
	    @"#import \"OFString.h\"\n\n"];

	/*
	 * The sizes are initialized from SIZE_MAX in -init, so they are
	 * presumably wider than the unsigned int that %X expects. Passing
	 * them uncast would be a type mismatch for all three variadic
	 * arguments, hence the explicit casts.
	 */
	[f writeString: [OFString stringWithFormat:
	    @"#define OF_UNICODE_UPPER_TABLE_SIZE 0x%X\n"
	    @"#define OF_UNICODE_LOWER_TABLE_SIZE 0x%X\n"
	    @"#define OF_UNICODE_CASEFOLDING_TABLE_SIZE 0x%X\n\n",
	    (unsigned int)upperTableSize,
	    (unsigned int)lowerTableSize,
	    (unsigned int)casefoldingTableSize]];

	[f writeString:
	    @"extern const of_unichar_t* const\n"
	    @"    of_unicode_upper_table[OF_UNICODE_UPPER_TABLE_SIZE];\n"
	    @"extern const of_unichar_t* const\n"
	    @"    of_unicode_lower_table[OF_UNICODE_LOWER_TABLE_SIZE];\n"
	    @"extern const of_unichar_t* const\n"
	    @"    of_unicode_casefolding_table["
	    @"OF_UNICODE_CASEFOLDING_TABLE_SIZE];\n"];

	[pool release];
}
@end