2019-11-27 16:16:14 +00:00
|
|
|
<?php
|
|
|
|
/* Generate lookup table from unicode.org mapping file (SHIFTJIS.TXT by default). */
|
|
|
|
/*
|
|
|
|
libzint - the open source barcode library
|
2022-06-02 20:32:25 +01:00
|
|
|
Copyright (C) 2019-2022 Robin Stuart <rstuart114@gmail.com>
|
2019-11-27 16:16:14 +00:00
|
|
|
*/
|
2022-06-02 20:32:25 +01:00
|
|
|
/* To create backend/tests/test_sjis_tab.h (from the project root directory):
|
2019-12-08 16:15:34 +00:00
|
|
|
*
|
2022-06-02 20:32:25 +01:00
|
|
|
* php backend/tests/tools/gen_test_tab.php
|
2019-12-08 16:15:34 +00:00
|
|
|
*
|
|
|
|
* To create backend/tests/test_gb2312_tab.h;
|
|
|
|
*
|
2022-06-02 20:32:25 +01:00
|
|
|
* php backend/tests/tools/gen_test_tab.php -f GB2312.TXT -s gb2312_tab
|
|
|
|
*
|
|
|
|
* To create backend/tests/test_gbk_tab.h;
|
|
|
|
*
|
|
|
|
* php backend/tests/tools/gen_test_tab.php -f CP936.TXT -s gbk_tab
|
2019-12-08 16:15:34 +00:00
|
|
|
*
|
|
|
|
* To create backend/tests/test_gb18030_tab.h (note that backend/tools/data/GB18030.TXT
|
|
|
|
* will have to be downloaded first from https://haible.de/bruno/charsets/conversion-tables/GB18030.html
|
2022-06-02 20:32:25 +01:00
|
|
|
* using the version jdk-1.4.2/GB18030.TXT):
|
2019-12-08 16:15:34 +00:00
|
|
|
*
|
2022-06-02 20:32:25 +01:00
|
|
|
* php backend/tests/tools/gen_test_tab.php -f GB18030.TXT -s gb18030_tab
|
2021-01-11 18:11:41 +00:00
|
|
|
*
|
|
|
|
* To create backend/tests/test_big5_tab.h;
|
|
|
|
*
|
2022-06-02 20:32:25 +01:00
|
|
|
* php backend/tests/tools/gen_test_tab.php -f BIG5.TXT -s big5_tab
|
2021-01-11 18:11:41 +00:00
|
|
|
*
|
|
|
|
* To create backend/tests/test_ksx1001_tab.h;
|
|
|
|
*
|
2022-06-02 20:32:25 +01:00
|
|
|
* php backend/tests/tools/gen_test_tab.php -f KSX1001.TXT -s ksx1001_tab
|
2021-01-11 18:11:41 +00:00
|
|
|
*
|
2019-12-08 16:15:34 +00:00
|
|
|
*/
|
2019-11-27 16:16:14 +00:00
|
|
|
|
|
|
|
// Script identity, used in messages and to resolve the default directories.
$basename = basename(__FILE__);
$dirname = __DIR__;

// Command line options:
//   -d <dir>     directory to load the mapping file from
//   -f <file>    name of the mapping file
//   -o <dir>     directory to write the generated header to
//   -s <suffix>  suffix of the table name and of the output file name
$opts = getopt('d:f:o:s:');

// Start from the defaults, then let any option given on the command line override them.
$data_dirname = $dirname . '/../../tools/data'; // Where to load file from.
if (isset($opts['d'])) {
    $data_dirname = $opts['d'];
}

$file_name = 'SHIFTJIS.TXT'; // Name of file.
if (isset($opts['f'])) {
    $file_name = $opts['f'];
}

$out_dirname = $dirname . '/..'; // Where to put output.
if (isset($opts['o'])) {
    $out_dirname = $opts['o'];
}

$suffix_name = 'sjis_tab'; // Suffix of table and output file.
if (isset($opts['s'])) {
    $suffix_name = $opts['s'];
}

// Full path of the mapping file to read.
$file = $data_dirname . '/' . $file_name;
|
|
|
|
|
|
|
|
// Read the file.

if (($get = file_get_contents($file)) === false) {
    error_log($error = "$basename: ERROR: Could not read mapping file \"$file\"");
    // exit() with a string argument prints the string but terminates with status 0, which would
    // make a failed run look successful. Print the message ourselves and exit non-zero instead.
    echo $error . PHP_EOL;
    exit(1);
}

// One array element per line of the mapping file (split on "\n" only).
$lines = explode("\n", $get);
|
|
|
|
|
|
|
|
// Parse the file.

/**
 * Extract the (multibyte, Unicode) pairs from the lines of a mapping file.
 *
 * Only lines of the form "0xMMMM<space/tab>0xUUUU..." (upper-case hex) are used. The following
 * are skipped:
 *   - blank lines and lines not starting with "0x" (comments etc.);
 *   - lines marked "*** NO MAPPING ***";
 *   - lines with no Unicode column of at least 4 hex digits - previously such lines were copied
 *     verbatim into the table without a matching sort key, which corrupted the output and left
 *     the two arrays with different sizes;
 *   - lines whose Unicode value has 5 or more hex digits (U+10000..10FFFF), to save space.
 *
 * @param array $lines Lines of the mapping file.
 * @return array Two-element array: the list of Unicode codepoints (ints), and the parallel list of
 *               formatted table lines, both in file order.
 */
function gen_test_tab_parse_lines($lines) {
    $sort = array();
    $tab_lines = array();

    foreach ($lines as $line) {
        $line = trim($line); // Also strips any "\r" left over from CRLF line endings
        if ($line === '' || strncmp($line, '0x', 2) !== 0 || strpos($line, "*** NO MAPPING ***") !== false) {
            continue;
        }
        // Greedily capture all the hex digits of the Unicode column so its length can be checked.
        if (!preg_match('/^0x([0-9A-F]{2,8})[ \t]+0x([0-9A-F]{4,})/', $line, $matches)) {
            continue; // No usable Unicode column
        }
        if (strlen($matches[2]) > 4) { // Exclude U+10000..10FFFF to save space
            continue;
        }
        $mb = hexdec($matches[1]);
        $unicode = hexdec($matches[2]);
        $sort[] = $unicode;
        $tab_lines[] = sprintf(" 0x%04X, 0x%04X,", $mb, $unicode);
    }

    return array($sort, $tab_lines);
}

list($sort, $tab_lines) = gen_test_tab_parse_lines($lines);

// Order the table by Unicode codepoint, keeping `$tab_lines` in step with `$sort`.
array_multisort($sort, $tab_lines);
|
|
|
|
|
|
|
|
// Output.

// Main table: flat array of (multibyte, Unicode) pairs, in the order of `$tab_lines`.
$out = array();
$out[] = '/* Generated by ' . $basename . ' from ' . $file_name . ' */';
$out[] = 'static const unsigned int test_' . $suffix_name . '[] = {';
$out = array_merge($out, $tab_lines);
$out[] = '};';

// Index table: one entry per block of 0x400 codepoints, emitted up to the block of the last
// codepoint in `$sort`. Each entry is the offset into the main table (2 ints per pair, hence
// `$ind * 2`) of the first pair reached whose codepoint is in that block or a later one.
$out[] = '';
$out[] = 'static const unsigned int test_' . $suffix_name . '_ind[] = {';
$first = 0; // Next 0x400 block that still needs an index entry
foreach ($sort as $ind => $unicode) {
    $div = (int)($unicode / 0x400);
    // Blocks with no codepoints of their own get the offset of the next pair that exists.
    while ($div >= $first) {
        $out[] = ' ' . ($ind * 2) . ',';
        $first++;
    }
}
$out[] = '};';

// Write the header, reporting failure instead of silently exiting with success.
$out_file = $out_dirname . '/test_' . $suffix_name . '.h';
if (file_put_contents($out_file, implode("\n", $out) . "\n") === false) {
    error_log($error = "$basename: ERROR: Could not write output file \"$out_file\"");
    echo $error . PHP_EOL;
    exit(1);
}
|
2022-06-02 20:32:25 +01:00
|
|
|
|
|
|
|
/* vim: set ts=4 sw=4 et : */
|