105 lines
4.1 KiB
C
105 lines
4.1 KiB
C
|
/*-*- mode:c;indent-tabs-mode:nil;c-basic-offset:2;tab-width:8;coding:utf-8 -*-│
|
|||
|
│vi: set net ft=c ts=2 sts=2 sw=2 fenc=utf-8 :vi│
|
|||
|
╞══════════════════════════════════════════════════════════════════════════════╡
|
|||
|
│ Copyright 2020 Justine Alexandra Roberts Tunney │
|
|||
|
│ │
|
|||
|
│ This program is free software; you can redistribute it and/or modify │
|
|||
|
│ it under the terms of the GNU General Public License as published by │
|
|||
|
│ the Free Software Foundation; version 2 of the License. │
|
|||
|
│ │
|
|||
|
│ This program is distributed in the hope that it will be useful, but │
|
|||
|
│ WITHOUT ANY WARRANTY; without even the implied warranty of │
|
|||
|
│ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU │
|
|||
|
│ General Public License for more details. │
|
|||
|
│ │
|
|||
|
│ You should have received a copy of the GNU General Public License │
|
|||
|
│ along with this program; if not, write to the Free Software │
|
|||
|
│ Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA │
|
|||
|
│ 02110-1301 USA │
|
|||
|
╚─────────────────────────────────────────────────────────────────────────────*/
|
|||
|
#include "libc/bits/safemacros.h"
|
|||
|
#include "libc/fmt/fmt.h"
|
|||
|
#include "libc/log/check.h"
|
|||
|
#include "libc/mem/mem.h"
|
|||
|
#include "libc/runtime/runtime.h"
|
|||
|
#include "libc/stdio/stdio.h"
|
|||
|
#include "libc/str/str.h"
|
|||
|
#include "libc/sysv/consts/ex.h"
|
|||
|
#include "libc/sysv/consts/exit.h"
|
|||
|
#include "third_party/getopt/getopt.h"
|
|||
|
#include "tool/decode/lib/bitabuilder.h"
|
|||
|
|
|||
|
static FILE *fin, *fout;
|
|||
|
static char width, *line;
|
|||
|
static size_t linecap, i, x, y;
|
|||
|
static struct BitaBuilder *bitset;
|
|||
|
static char *g_inpath, *g_outpath;
|
|||
|
|
|||
|
noreturn void ShowUsage(FILE *f, int rc) {
|
|||
|
fprintf(f, "Usage: %s [-o OUTPUT] [INPUT]\n", "Usage",
|
|||
|
program_invocation_name);
|
|||
|
exit(rc);
|
|||
|
}
|
|||
|
|
|||
|
void GetOpts(int argc, char *argv[]) {
|
|||
|
int opt;
|
|||
|
g_inpath = "/dev/stdin";
|
|||
|
g_outpath = "/dev/stdout";
|
|||
|
while ((opt = getopt(argc, argv, "?ho:")) != -1) {
|
|||
|
switch (opt) {
|
|||
|
case 'o':
|
|||
|
g_outpath = optarg;
|
|||
|
break;
|
|||
|
case 'h':
|
|||
|
case '?':
|
|||
|
ShowUsage(stdout, EXIT_SUCCESS);
|
|||
|
default:
|
|||
|
ShowUsage(stderr, EX_USAGE);
|
|||
|
}
|
|||
|
}
|
|||
|
if (argc - optind) {
|
|||
|
g_inpath = argv[optind];
|
|||
|
}
|
|||
|
}
|
|||
|
|
|||
|
/**
|
|||
|
* Converts official UNICODE ‘monospace widths’ (yup) to a bitset.
|
|||
|
*
|
|||
|
* (╯°□°)╯︵ ̲┻̲━̲┻
|
|||
|
* 要依法治国是赞美那些谁是公义的和惩罚恶人。 - 韩非
|
|||
|
*
|
|||
|
* 172kB TXT → 32kB bits → 525 bytes lz4
|
|||
|
*
|
|||
|
* @note this tool may print binary to stdout
|
|||
|
* @see libc/kompressor/lz4decode.c
|
|||
|
* @see tool/viz/bing.c
|
|||
|
* @see tool/viz/fold.c
|
|||
|
* @see unicode.org/reports/tr11/#Definitions
|
|||
|
*/
|
|||
|
int main(int argc, char *argv[]) {
|
|||
|
GetOpts(argc, argv);
|
|||
|
bitset = bitabuilder_new();
|
|||
|
CHECK_NOTNULL(fin = fopen(g_inpath, "r"));
|
|||
|
while ((getline(&line, &linecap, fin)) != -1) {
|
|||
|
x = 0;
|
|||
|
y = 0;
|
|||
|
if (sscanf(line, "%x..%x;%c", &x, &y, &width) != 3) {
|
|||
|
if (sscanf(line, "%x;%c", &x, &width) == 2) {
|
|||
|
y = x;
|
|||
|
} else {
|
|||
|
continue;
|
|||
|
}
|
|||
|
}
|
|||
|
CHECK_LE(x, y);
|
|||
|
if (width == 'F' /* full-width */ || width == 'W' /* wide */) {
|
|||
|
for (i = x; i <= y; ++i) {
|
|||
|
CHECK(bitabuilder_setbit(bitset, i));
|
|||
|
}
|
|||
|
}
|
|||
|
}
|
|||
|
CHECK_NOTNULL(fout = fopen(g_outpath, "wb"));
|
|||
|
CHECK(bitabuilder_fwrite(bitset, fout));
|
|||
|
bitabuilder_free(&bitset);
|
|||
|
return fclose(fin) | fclose(fout);
|
|||
|
}
|