console UTF-8 fixes (fix)

author Egmont Koblinger <egmont@uhulinux.hu>

Sun, 24 Jun 2007 00:16:27 +0000 (17:16 -0700)

committer Linus Torvalds <torvalds@woody.linux-foundation.org>

Sun, 24 Jun 2007 15:59:10 +0000 (08:59 -0700)
author Egmont Koblinger <egmont@uhulinux.hu>
Sun, 24 Jun 2007 00:16:27 +0000 (17:16 -0700)
committer Linus Torvalds <torvalds@woody.linux-foundation.org>
Sun, 24 Jun 2007 15:59:10 +0000 (08:59 -0700)
diff --git a/drivers/char/vt.c b/drivers/char/vt.c

index bbd9fc4..6650ae1 100644 (file)
--- a/drivers/char/vt.c
+++ b/drivers/char/vt.c
@@ -1956,7 +1956,7 @@ char con_buf[CON_BUF_SIZE];
  DEFINE_MUTEX(con_buf_mtx);
  
  /* is_double_width() is based on the wcwidth() implementation by
- * Markus Kuhn -- 2003-05-20 (Unicode 4.0)
+ * Markus Kuhn -- 2007-05-26 (Unicode 5.0)
   * Latest version: http://www.cl.cam.ac.uk/~mgk25/ucs/wcwidth.c
   */
  struct interval {
@@ -1988,8 +1988,8 @@ static int is_double_width(uint32_t ucs)
         static const struct interval double_width[] = {
                 { 0x1100, 0x115F }, { 0x2329, 0x232A }, { 0x2E80, 0x303E },
                 { 0x3040, 0xA4CF }, { 0xAC00, 0xD7A3 }, { 0xF900, 0xFAFF },
-               { 0xFE30, 0xFE6F }, { 0xFF00, 0xFF60 }, { 0xFFE0, 0xFFE6 },
-               { 0x20000, 0x2FFFD }, { 0x30000, 0x3FFFD }
+               { 0xFE10, 0xFE19 }, { 0xFE30, 0xFE6F }, { 0xFF00, 0xFF60 },
+               { 0xFFE0, 0xFFE6 }, { 0x20000, 0x2FFFD }, { 0x30000, 0x3FFFD }
         };
         return bisearch(ucs, double_width,
                 sizeof(double_width) / sizeof(*double_width) - 1);
@@ -2187,9 +2187,12 @@ rescan_last_byte:
                                     continue; /* nothing to display */
                                 }
                                 /* Glyph not found */
-                               if (!(vc->vc_utf && !vc->vc_disp_ctrl) && !(c & ~charmask)) {
+                               if ((!(vc->vc_utf && !vc->vc_disp_ctrl) || c < 128) && !(c & ~charmask)) {
                                     /* In legacy mode use the glyph we get by a 1:1 mapping.
-                                      This would make absolutely no sense with Unicode in mind. */
+                                      This would make absolutely no sense with Unicode in mind,
+                                      but do this for ASCII characters since a font may lack
+                                      Unicode mapping info and we don't want to end up with
+                                      having question marks only. */
                                     tc = c;
                                 } else {
                                     /* Display U+FFFD. If it's not found, display an inverse question mark. */
@@ -2213,6 +2216,7 @@ rescan_last_byte:
                                 } else {
                                         vc_attr = ((vc->vc_attr) & 0x88) | (((vc->vc_attr) & 0x70) >> 4) | (((vc->vc_attr) & 0x07) << 4);
                                 }
+                               FLUSH
                         }
  
                         while (1) {
@@ -2246,6 +2250,10 @@ rescan_last_byte:
                                 if (tc < 0) tc = ' ';
                         }
  
+                       if (inverse) {
+                               FLUSH
+                       }
+
                         if (rescan) {
                                 rescan = 0;
                                 inverse = 0;
author	Egmont Koblinger <egmont@uhulinux.hu>
	Sun, 24 Jun 2007 00:16:27 +0000 (17:16 -0700)
committer	Linus Torvalds <torvalds@woody.linux-foundation.org>
	Sun, 24 Jun 2007 15:59:10 +0000 (08:59 -0700)