overdue unicode cleanup.

our new pdcurses can do utf8 output, let's use it.
convert output on a windows tty to codepage 1252.
This commit is contained in:
Enno Rehling 2021-02-21 20:49:03 +01:00
parent b9eea2c8a2
commit abf548cecd
10 changed files with 41 additions and 36 deletions

View file

@ -2,7 +2,8 @@ local path = 'scripts'
if config.install then if config.install then
path = config.install .. '/' .. path path = config.install .. '/' .. path
end end
package.path = package.path .. ';' .. path .. '/?.lua;' .. path .. '/?/init.lua' package.path = path .. '/?.lua;' .. path .. '/?/init.lua;' .. package.path
require 'eressea.path' require 'eressea.path'
require 'eressea' require 'eressea'
require 'eressea.xmlconf' require 'eressea.xmlconf'

View file

@ -10,7 +10,7 @@ path = 'scripts'
if config.install then if config.install then
path = config.install .. '/' .. path path = config.install .. '/' .. path
end end
package.path = package.path .. ';' .. path .. '/?.lua;' .. path .. '/?/init.lua' package.path = path .. '/?.lua;' .. path .. '/?/init.lua;' .. package.path
config.rules = 'e2' config.rules = 'e2'

View file

@ -10,7 +10,7 @@ path = 'scripts'
if config.install then if config.install then
path = config.install .. '/' .. path path = config.install .. '/' .. path
end end
package.path = package.path .. ';' .. path .. '/?.lua;' .. path .. '/?/init.lua' package.path = path .. '/?.lua;' .. path .. '/?/init.lua;' .. package.path
config.rules = 'e3' config.rules = 'e3'

View file

@ -10,7 +10,7 @@ path = 'scripts'
if config.install then if config.install then
path = config.install .. '/' .. path path = config.install .. '/' .. path
end end
package.path = package.path .. ';' .. path .. '/?.lua;' .. path .. '/?/init.lua' package.path = path .. '/?.lua;' .. path .. '/?/init.lua;' .. package.path
require 'eressea' require 'eressea'
require 'eressea.path' require 'eressea.path'

View file

@ -192,7 +192,7 @@ local path = 'scripts'
if config.install then if config.install then
path = config.install .. '/' .. path path = config.install .. '/' .. path
end end
package.path = package.path .. ';' .. path .. '/?.lua;' .. path .. '/?/init.lua' package.path = path .. '/?.lua;' .. path .. '/?/init.lua;' .. package.path
require 'eressea' require 'eressea'
require 'eressea.xmlconf' -- read xml data require 'eressea.xmlconf' -- read xml data

View file

@ -58,29 +58,14 @@ state *current_state = NULL;
#define IFL_BUILDINGS (1<<3) #define IFL_BUILDINGS (1<<3)
static WINDOW *hstatus; static WINDOW *hstatus;
static int gm_utf8 = 0; /* does our curses support utf-8? */
#ifdef STDIO_CP
int gm_codepage = STDIO_CP;
#else
int gm_codepage = -1;
#endif
static void unicode_remove_diacritics(const char *rp, char *wp) { static void unicode_remove_diacritics(const char *rp, char *wp) {
while (*rp) { while (*rp) {
if (gm_codepage >= 0 && *rp & 0x80) { if (*rp & 0x80) {
size_t sz = 0; size_t sz = 0;
unsigned char ch; unsigned char ch;
switch (gm_codepage) {
case 1252:
unicode_utf8_to_cp1252(&ch, rp, &sz);
break;
case 437:
unicode_utf8_to_cp437(&ch, rp, &sz);
break;
default:
unicode_utf8_to_ascii(&ch, rp, &sz); unicode_utf8_to_ascii(&ch, rp, &sz);
break;
}
rp += sz; rp += sz;
*wp++ = (char)ch; *wp++ = (char)ch;
} }
@ -92,8 +77,13 @@ static void unicode_remove_diacritics(const char *rp, char *wp) {
} }
static void simplify(const char* rp, char* wp) { static void simplify(const char* rp, char* wp) {
if (!gm_utf8) {
unicode_remove_diacritics(rp, wp); unicode_remove_diacritics(rp, wp);
} }
else if (rp != wp) {
strcpy(wp, rp);
}
}
int umvwprintw(WINDOW *win, int y, int x, const char *format, ...) { int umvwprintw(WINDOW *win, int y, int x, const char *format, ...) {
char buffer[128]; char buffer[128];
@ -117,6 +107,10 @@ int umvwaddnstr(WINDOW *w, int y, int x, const char * str, int len) {
static void init_curses(void) static void init_curses(void)
{ {
#ifdef PDCURSES
/* PDCurses from vcpkg is compiled with UTF8 (and WIDE) support */
gm_utf8 = 1;
#endif
initscr(); initscr();
if (has_colors() || force_color) { if (has_colors() || force_color) {

View file

@ -23,7 +23,6 @@ extern "C" {
void run_mapper(void); void run_mapper(void);
extern int force_color; extern int force_color;
extern int gm_codepage;
struct state *state_open(void); struct state *state_open(void);
void state_close(struct state *); void state_close(struct state *);

View file

@ -64,7 +64,6 @@ static void load_inifile(void)
#ifdef USE_CURSES #ifdef USE_CURSES
/* only one value in the [editor] section */ /* only one value in the [editor] section */
force_color = config_get_int("editor.color", force_color); force_color = config_get_int("editor.color", force_color);
gm_codepage = config_get_int("editor.codepage", gm_codepage);
#endif #endif
} }

View file

@ -16,6 +16,14 @@
#include <stdarg.h> #include <stdarg.h>
#include <time.h> #include <time.h>
#ifdef WIN32
#include <io.h>
#define FISATTY(F) (_isatty(_fileno(F)))
#else
#include <unistd.h>
#define FISATTY(F) (isatty(fileno(F)))
#endif
void errno_check(const char * file, int line) { void errno_check(const char * file, int line) {
if (errno) { if (errno) {
log_info("errno is %d (%s) at %s:%d", log_info("errno is %d (%s) at %s:%d",
@ -24,8 +32,8 @@ void errno_check(const char * file, int line) {
} }
} }
#ifdef STDIO_CP #if WIN32
static int stdio_codepage = STDIO_CP; static int stdio_codepage = 1252;
#else #else
static int stdio_codepage = 0; static int stdio_codepage = 0;
#endif #endif
@ -63,7 +71,7 @@ void log_destroy(log_t *handle) {
} }
} }
#define MAXLENGTH 4096 /* because I am lazy, CP437 output is limited to this many chars */ #define MAXLENGTH 4096 /* because I am lazy, tty output is limited to this many chars */
#define LOG_MAXBACKUPS 5 #define LOG_MAXBACKUPS 5
static int static int
@ -87,7 +95,7 @@ cp_convert(const char *format, unsigned char *buffer, size_t length, int codepag
return result; return result;
} }
++pos; ++pos;
input += length; input += size;
} }
*pos = 0; *pos = 0;
return 0; return 0;
@ -177,11 +185,14 @@ static void _log_write(FILE * stream, int codepage, const char *format, va_list
static void log_stdio(void* data, int level, const char* module, const char* format, va_list args) { static void log_stdio(void* data, int level, const char* module, const char* format, va_list args) {
FILE* out = (FILE*)data; FILE* out = (FILE*)data;
int codepage = (out == stderr || out == stdout) ? stdio_codepage : 0; int codepage = 0;
const char* prefix = log_prefix(level); const char* prefix = log_prefix(level);
size_t len = strlen(format); size_t len = strlen(format);
(void)module; (void)module;
if (stdio_codepage && (out == stderr || out == stdout)) {
codepage = FISATTY(out) ? stdio_codepage : 0;
}
fprintf(out, "%s: ", prefix); fprintf(out, "%s: ", prefix);
_log_write(out, codepage, format, args); _log_write(out, codepage, format, args);

View file

@ -572,7 +572,8 @@ unicode_utf8_to_cp437(unsigned char *cp_character, const char * utf8_string,
int unicode_utf8_to_ascii(unsigned char *cp_character, const char * utf8_string, int unicode_utf8_to_ascii(unsigned char *cp_character, const char * utf8_string,
size_t *length) size_t *length)
{ {
int result = unicode_utf8_to_cp437(cp_character, utf8_string, length); wint_t ucs4_character;
int result = unicode_utf8_decode(&ucs4_character, utf8_string, length);
if (result == 0) { if (result == 0) {
if (*length > 1) { if (*length > 1) {
*cp_character = '?'; *cp_character = '?';