diff --recursive -ub links-0.97pre12.orig/charsets.c links-0.97pre12/charsets.c
--- links-0.97pre12.orig/charsets.c Mon Mar 4 21:48:15 2002
+++ links-0.97pre12/charsets.c Thu May 9 01:59:38 2002
@@ -89,7 +89,7 @@
0x007e, 0x2122, 0x0161, 0x003e, 0x0153, 0x0000, 0x0000, 0x0000,
};
-static inline unsigned char *u2cp(int u, int to)
+unsigned char *u2cp(int u, int to)
{
int j, s;
if (u < 128) return strings[u];
@@ -138,6 +138,32 @@
utf_buffer[4] = 0x80 | ((u >> 6) & 0x3f),
utf_buffer[5] = 0x80 | (u & 0x3f);
return utf_buffer;
+}
+
+/*
+ * Convert byte `c` of codepage `from` to a UTF-8 string for the terminal
+ * utf_8_io output path.  The codepage table is scanned linearly on every
+ * call, so this is slow.
+ */
+unsigned char *cp2utf_8(int from, int c)
+{
+	int i = 0;
+
+	/* The UTF-8 codepage has no table to scan: hand back strings[c]. */
+	if (codepages[from].table == table_utf_8)
+		return strings[c];
+
+	/* The table ends at the entry whose .c field is zero. */
+	while (codepages[from].table[i].c) {
+		if (codepages[from].table[i].c == c)
+			return encode_utf_8(codepages[from].table[i].u);
+		i++;
+	}
+
+	/* Not in the table: bytes below 128 map to strings[c], the rest to UCS_NO_CHAR. */
+	if (c >= 128)
+		return encode_utf_8(UCS_NO_CHAR);
+	return strings[c];
}
void add_utf_8(struct conv_table *ct, int u, unsigned char *str)
diff --recursive -ub links-0.97pre12.orig/default.c links-0.97pre12/default.c
--- links-0.97pre12.orig/default.c Thu Apr 4 10:49:48 2002
+++ links-0.97pre12/default.c Thu May 9 01:59:38 2002
@@ -556,6 +556,7 @@
}
}
+/* terminal NAME(str) MODE(0-3) M11_HACK(0-1) BLOCK_CURSOR.RESTRICT_852.COL(0-7) CHARSET(str) [ UTF_8_IO("utf-8") ]*/
unsigned char *term_rd(struct option *o, unsigned char *c)
{
struct term_spec *ts;
@@ -566,6 +567,7 @@
mem_free(w);
goto end;
}
+ ts->utf_8_io = 0;
mem_free(w);
if (!(w = get_token(&c))) goto err;
if (strlen(w) != 1 || w[0] < '0' || w[0] > '3') goto err_f;
@@ -585,6 +587,9 @@
if ((i = get_cp_index(w)) == -1) goto err_f;
ts->charset = i;
mem_free(w);
+ if (!(w = get_token(&c))) goto end;
+ if (!(strcasecmp(w, "utf-8"))) ts->utf_8_io = 1;
+ mem_free(w);
end:
return NULL;
err_f:
@@ -593,6 +598,7 @@
return "Error reading terminal specification";
}
+/* terminal2 NAME(str) MODE(0-3) M11_HACK(0-1) RESTRICT_852(0-1) COL(0-1) CHARSET(str) [ UTF_8_IO("utf-8") ]*/
unsigned char *term2_rd(struct option *o, unsigned char *c)
{
struct term_spec *ts;
@@ -603,6 +609,7 @@
mem_free(w);
goto end;
}
+ ts->utf_8_io = 0;
mem_free(w);
if (!(w = get_token(&c))) goto err;
if (strlen(w) != 1 || w[0] < '0' || w[0] > '3') goto err_f;
@@ -624,6 +631,9 @@
if ((i = get_cp_index(w)) == -1) goto err_f;
ts->charset = i;
mem_free(w);
+ if (!(w = get_token(&c))) goto end;
+ if (!(strcasecmp(w, "utf-8"))) ts->utf_8_io = 1;
+ mem_free(w);
end:
return NULL;
err_f:
@@ -646,6 +656,10 @@
add_num_to_str(s, l, !!ts->col + !!ts->restrict_852 * 2 + !!ts->block_cursor * 4);
add_to_str(s, l, " ");
add_to_str(s, l, get_cp_mime_name(ts->charset));
+ if (ts->utf_8_io)
+ {
+ add_to_str(s, l, " utf-8");
+ }
}
}
diff --recursive -ub links-0.97pre12.orig/intl/english.lng links-0.97pre12/intl/english.lng
--- links-0.97pre12.orig/intl/english.lng Tue Mar 26 17:35:45 2002
+++ links-0.97pre12/intl/english.lng Thu May 9 01:59:46 2002
@@ -48,6 +48,7 @@
T_LINUX_OR_OS2_FRAMES, "Linux or OS/2 frames",
T_KOI8R_FRAMES, "KOI8-R frames",
T_USE_11M, "Use ^[[11m",
+T_UTF_8_IO, "UTF-8 I/O",
T_RESTRICT_FRAMES_IN_CP850_852, "Restrict frames in cp850/852",
T_BLOCK_CURSOR, "Block cursor",
T_COLOR, "Color",
diff --recursive -ub links-0.97pre12.orig/links.h links-0.97pre12/links.h
--- links-0.97pre12.orig/links.h Wed Apr 3 14:41:02 2002
+++ links-0.97pre12/links.h Thu May 9 01:59:46 2002
@@ -992,6 +992,11 @@
int qlen;
struct list_head windows;
unsigned char *title;
+ struct {
+ int ucs;
+ int len;
+ int min;
+ } utf_8;
};
struct term_spec {
@@ -1000,6 +1005,7 @@
unsigned char term[MAX_TERM_LEN];
int mode;
int m11_hack;
+ int utf_8_io;
int restrict_852;
int block_cursor;
int col;
@@ -1701,6 +1707,9 @@
void do_auth_dialog(struct session *);
/* charsets.c */
+/* UCS/Unicode replacement character */
+#define UCS_NO_CHAR 0xFFFD
+
#include "codepage.h"
struct conv_table {
@@ -1719,6 +1728,8 @@
unsigned char *get_cp_mime_name(int);
int is_cp_special(int);
void free_conv_table();
+unsigned char *cp2utf_8(int, int);
+unsigned char *u2cp(int, int);
/* view.c */
diff --recursive -ub links-0.97pre12.orig/menu.c links-0.97pre12/menu.c
--- links-0.97pre12.orig/menu.c Sat Mar 9 09:52:32 2002
+++ links-0.97pre12/menu.c Thu May 9 01:59:46 2002
@@ -380,15 +380,15 @@
cls_redraw_all_terminals();
}
-unsigned char *td_labels[] = { TEXT(T_NO_FRAMES), TEXT(T_VT_100_FRAMES), TEXT(T_LINUX_OR_OS2_FRAMES), TEXT(T_KOI8R_FRAMES), TEXT(T_USE_11M), TEXT(T_RESTRICT_FRAMES_IN_CP850_852), TEXT(T_BLOCK_CURSOR), TEXT(T_COLOR), NULL };
+unsigned char *td_labels[] = { TEXT(T_NO_FRAMES), TEXT(T_VT_100_FRAMES), TEXT(T_LINUX_OR_OS2_FRAMES), TEXT(T_KOI8R_FRAMES), TEXT(T_USE_11M), TEXT(T_RESTRICT_FRAMES_IN_CP850_852), TEXT(T_BLOCK_CURSOR), TEXT(T_COLOR), TEXT(T_UTF_8_IO), NULL };
void terminal_options(struct terminal *term, void *xxx, struct session *ses)
{
struct dialog *d;
struct term_spec *ts = new_term_spec(term->term);
if (!ts) return;
- if (!(d = mem_alloc(sizeof(struct dialog) + 11 * sizeof(struct dialog_item)))) return;
- memset(d, 0, sizeof(struct dialog) + 11 * sizeof(struct dialog_item));
+ if (!(d = mem_alloc(sizeof(struct dialog) + 12 * sizeof(struct dialog_item)))) return;
+ memset(d, 0, sizeof(struct dialog) + 12 * sizeof(struct dialog_item));
d->title = TEXT(T_TERMINAL_OPTIONS);
d->fn = checkbox_list_fn;
d->udata = td_labels;
@@ -429,15 +429,19 @@
d->items[7].gid = 0;
d->items[7].dlen = sizeof(int);
d->items[7].data = (void *)&ts->col;
- d->items[8].type = D_BUTTON;
- d->items[8].gid = B_ENTER;
- d->items[8].fn = ok_dialog;
- d->items[8].text = TEXT(T_OK);
+ d->items[8].type = D_CHECKBOX;
+ d->items[8].gid = 0;
+ d->items[8].dlen = sizeof(int);
+ d->items[8].data = (void *)&ts->utf_8_io;
d->items[9].type = D_BUTTON;
- d->items[9].gid = B_ESC;
- d->items[9].fn = cancel_dialog;
- d->items[9].text = TEXT(T_CANCEL);
- d->items[10].type = D_END;
+ d->items[9].gid = B_ENTER;
+ d->items[9].fn = ok_dialog;
+ d->items[9].text = TEXT(T_OK);
+ d->items[10].type = D_BUTTON;
+ d->items[10].gid = B_ESC;
+ d->items[10].fn = cancel_dialog;
+ d->items[10].text = TEXT(T_CANCEL);
+ d->items[11].type = D_END;
do_dialog(term, d, getml(d, NULL));
}
diff --recursive -ub links-0.97pre12.orig/terminal.c links-0.97pre12/terminal.c
--- links-0.97pre12.orig/terminal.c Wed Jan 30 07:53:48 2002
+++ links-0.97pre12/terminal.c Thu May 9 02:03:46 2002
@@ -345,6 +345,35 @@
return term;
}
+/* Pass an event to the handler of the window at term->windows.next. */
+static inline void term_send_event(struct terminal *term, struct event *ev)
+{
+	((struct window *)&term->windows)->next->handler(term->windows.next, ev, 0);
+}
+
+/*
+ * Send the UCS code point `u` as keyboard input, recoded to the terminal's
+ * charset: one event is sent per byte of the recoded string.  `ev` is used
+ * as the event template; its x field is rewritten for every byte and put
+ * back before returning, so the caller still holds the key it passed in.
+ */
+static inline void term_send_ucs(struct terminal *term, struct event *ev, int u)
+{
+	unsigned char *recoded;
+	long saved_x = ev->x;
+
+	if (u == 0xA0) u = ' ';		/* U+00A0 is sent as a plain space */
+	recoded = u2cp(u, term->spec->charset);
+	if (! recoded) recoded = "*";	/* u2cp() gave no string for this code point */
+	while (*recoded) {
+		ev->x = *recoded;
+		term_send_event(term, ev);
+		recoded ++;
+	}
+	/* in_term() goes on testing ev->x after reporting a broken UTF-8 sequence. */
+	ev->x = saved_x;
+}
+
void in_term(struct terminal *term)
{
struct event *ev;
@@ -405,7 +424,49 @@
goto send_redraw;
}
else if (ev->ev == EV_KBD && ev->x == KBD_CTRL_C) ((struct window *)&term->windows)->prev->handler(term->windows.prev, ev, 0);
- else ((struct window *)&term->windows)->next->handler(term->windows.next, ev, 0);
+		else if (ev->ev == EV_KBD) {
+			/*
+			 * With utf_8_io set, keyboard bytes are reassembled into UCS code
+			 * points: term->utf_8.len counts the continuation bytes still
+			 * expected, .ucs accumulates the value, and .min is the smallest
+			 * value a sequence of that length is allowed to encode.
+			 */
+			if (term->utf_8.len) {
+				/* Continuation bytes are 0x80..0xBF; key codes above 0xFF are not bytes. */
+				if (ev->x >= 0x80 && ev->x <= 0xBF && term->spec->utf_8_io) {
+					term->utf_8.ucs <<= 6;
+					term->utf_8.ucs |= ev->x & 0x3F;
+					if (! --term->utf_8.len) {
+						int u = term->utf_8.ucs;
+
+						/* Overlong encoding: substitute instead of accepting it. */
+						if (u < term->utf_8.min) u = UCS_NO_CHAR;
+						term_send_ucs(term, ev, u);
+					}
+					goto mm;
+				} else {
+					/* Sequence cut short: report it, then fall through to examine this key. */
+					term->utf_8.len = 0;
+					term_send_ucs(term, ev, UCS_NO_CHAR);
+				}
+			}
+			if (ev->x < 0x80 || ev->x > 0xFF || ! term->spec->utf_8_io) {
+				term_send_event(term, ev);
+				goto mm;
+			} else if ((ev->x & 0xC0) == 0xC0 && (ev->x & 0xFE) != 0xFE) {
+				int mask, len = 0;
+
+				/* The number of leading 1 bits in the lead byte is the sequence length. */
+				for (mask = 0x80; ev->x & mask; mask >>= 1) len++;
+				/* Minimum per length: 0x80, 0x800, 0x10000, 0x200000, 0x4000000. */
+				term->utf_8.min = (len == 2) ? 0x80 : (1 << (5 * len - 4));
+				term->utf_8.len = len - 1;
+				term->utf_8.ucs = ev->x & (mask - 1);
+				goto mm;
+			}
+			/* A continuation byte with no sequence open, or 0xFE/0xFF. */
+			term_send_ucs(term, ev, UCS_NO_CHAR);
+		} else term_send_event(term, ev);
}
if (ev->ev == EV_ABORT) destroy_terminal(term);
/*redraw_screen(term);*/
@@ -422,6 +474,19 @@
unsigned char frame_dumb[48] = " ||||++||++++++--|-+||++--|-+----++++++++ ";
unsigned char frame_vt100[48] = "aaaxuuukkuxkjjjkmvwtqnttmlvwtqnvvwwmmllnnjla ";
+/*
+ * Replacement for frame characters 176..223 (index = character - 176),
+ * used for TERM_VT100 when the frame_vt100 branch is not taken because
+ * utf_8_io is set.
+ */
+unsigned char frame_vt100_u[48] = {
+	177, 177, 177, 179, 180, 180, 180, 191,	/* 176..183 */
+	191, 180, 179, 191, 217, 217, 217, 191,	/* 184..191 */
+	192, 193, 194, 195, 196, 197, 195, 195,	/* 192..199 */
+	192, 218, 193, 194, 195, 196, 197, 193,	/* 200..207 */
+	193, 194, 194, 192, 192, 218, 218, 197,	/* 208..215 */
+	197, 217, 218, 177,  32,  32,  32,  32	/* 216..223 */
+};
unsigned char frame_koi[48] = {
144,145,146,129,135,178,180,167,
166,181,161,168,174,173,172,131,
@@ -445,7 +505,7 @@
unsigned char c = ch & 0xff; \
unsigned char A = ch >> 8 & 0x7f; \
if (s->mode == TERM_LINUX) { \
- if (s->m11_hack) { \
+ if (s->m11_hack && !s->utf_8_io) { \
if (ch >> 15 != mode) { \
if (!(mode = ch >> 15)) add_to_str(&a, &l, "\033[10m"); \
else add_to_str(&a, &l, "\033[11m"); \
@@ -454,12 +514,14 @@
if (s->restrict_852 && (ch >> 15) && c >= 176 && c < 224) { \
if (frame_restrict[c - 176]) c = frame_restrict[c - 176]; \
} \
- } else if (s->mode == TERM_VT100) { \
+ } else if (s->mode == TERM_VT100 && !s->utf_8_io) { \
if (ch >> 15 != mode) { \
if (!(mode = ch >> 15)) add_to_str(&a, &l, "\x0f"); \
else add_to_str(&a, &l, "\x0e"); \
} \
if (mode && c >= 176 && c < 224) c = frame_vt100[c - 176]; \
+ } else if (s->mode == TERM_VT100 && (ch >> 15) && c >= 176 && c < 224) { \
+ c = frame_vt100_u[c - 176]; \
} else if (s->mode == TERM_KOI8 && (ch >> 15) && c >= 176 && c < 224) { c = frame_koi[c - 176];\
} else if (s->mode == TERM_DUMB && (ch >> 15) && c >= 176 && c < 224) c = frame_dumb[c - 176];\
if (!(A & 0100) && (A >> 3) == (A & 7)) A = (A & 070) | 7 * !(A & 020); \
@@ -479,7 +541,20 @@
if (attrib & 0100) add_to_str(&a, &l, ";1"); \
add_to_str(&a, &l, "m"); \
} \
- if (c >= ' ' && c != 127/* && c != 155*/) add_chr_to_str(&a, &l, c); \
+ if (c >= ' ' && c != 127/* && c != 155*/) { \
+ int charset = s->charset; \
+ \
+ if (ch >> 15) { \
+ int frames_charset = (s->mode == TERM_LINUX || s->mode == TERM_VT100) \
+ ? get_cp_index("cp437") \
+ : s->mode == TERM_KOI8 \
+ ? get_cp_index("koi8-r") \
+ : -1; \
+ if (frames_charset != -1) charset = frames_charset; \
+ } \
+ if (s->utf_8_io) add_to_str(&a, &l, cp2utf_8(charset, c)); \
+ else add_chr_to_str(&a, &l, c); \
+ } \
else if (!c || c == 1) add_chr_to_str(&a, &l, ' '); \
else add_chr_to_str(&a, &l, '.'); \
cx++; \