erts: Fix bug in atom-to-filename conversions

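The old code assumed that atom names were Latin-1 encoded (one byte per character), which produced wrong sizes and wrong output for atoms whose names contain multi-byte UTF-8 sequences.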
author: Sverker Eriksson <[email protected]> 2013-09-20 20:13:40 +0200
committer: Sverker Eriksson <[email protected]> 2013-09-24 16:23:55 +0200
commit: b6b0b73ecec7facefb3b9c5a7ef663599cfee4aa (patch)
tree: 9cd909f99ac4684d0abc9bc7a8f408fc9a80d01d /erts/emulator/beam/erl_unicode.c
parent: 3a0402e1157a89fac210f2276d9461aab30a9968 (diff)
download: otp-b6b0b73ecec7facefb3b9c5a7ef663599cfee4aa.tar.gz
otp-b6b0b73ecec7facefb3b9c5a7ef663599cfee4aa.tar.bz2
otp-b6b0b73ecec7facefb3b9c5a7ef663599cfee4aa.zip
1 files changed, 42 insertions, 17 deletions
diff --git a/erts/emulator/beam/erl_unicode.c b/erts/emulator/beam/erl_unicode.c
index a448b600ca..ec8ea5f044 100644
--- a/erts/emulator/beam/erl_unicode.c
+++ b/erts/emulator/beam/erl_unicode.c
@@ -2174,16 +2174,31 @@ Sint erts_native_filename_need(Eterm ioterm, int encoding)
 	ap = atom_tab(atom_val(ioterm));
 	switch (encoding) {
 	case ERL_FILENAME_LATIN1:
-	    need = ap->len;
+	    need = ap->latin1_chars;  /* May be -1 */
 	    break;
 	case ERL_FILENAME_UTF8_MAC:
 	case ERL_FILENAME_UTF8:
-	    for (i = 0; i < ap->len; i++) {
-		need += (ap->name[i] >= 0x80) ? 2 : 1;
-	    }
+	    need = ap->len;
 	    break;
 	case ERL_FILENAME_WIN_WCHAR:
-	    need = 2*(ap->len);
+            if (ap->latin1_chars >= 0) {
+		need = 2* ap->latin1_chars;
+            }
+	    else {
+		for (i = 0; i < ap->len; ) {
+                    if (ap->name[i] < 0x80) {
+			i++;
+                    } else if (ap->name[i] < 0xE0) {
+			i += 2;
+                    } else if (ap->name[i] < 0xF0) {
+			i += 3;
+                    } else {
+			need = -1;
+			break;
+		    }
+		    need += 2;
+		}
+	    }
 	    break;
 	default:
 	    need = -1;
@@ -2313,26 +2328,36 @@ void erts_native_filename_put(Eterm ioterm, int encoding, byte *p)
 	switch (encoding) {
 	case ERL_FILENAME_LATIN1:
 	    for (i = 0; i < ap->len; i++) {
-		*p++ = ap->name[i];
-	    }
-	    break;
-	case ERL_FILENAME_UTF8_MAC:
-	case ERL_FILENAME_UTF8:
-	    for (i = 0; i < ap->len; i++) {
-		if(ap->name[i] < 0x80) {
+		if (ap->name[i] < 0x80) {
 		    *p++ = ap->name[i];
 		} else {
-		    *p++ = (((ap->name[i]) >> 6) | ((byte) 0xC0));
-		    *p++ = (((ap->name[i]) & 0x3F) | ((byte) 0x80));
+		    ASSERT(ap->name[i] < 0xC4);
+		    *p++ = ((ap->name[i] & 3) << 6) | (ap->name[i+1] & 0x3F);
+		    i++;
 		}
 	    }
 	    break;
+	case ERL_FILENAME_UTF8_MAC:
+	case ERL_FILENAME_UTF8:
+	    sys_memcpy(p, ap->name, ap->len);
+	    break;
 	case ERL_FILENAME_WIN_WCHAR:
 	    for (i = 0; i < ap->len; i++) {
 		/* Little endian */
-		*p++ = ap->name[i];
-		*p++ = 0;
-	    }
+                if (ap->name[i] < 0x80) {
+		    *p++ = ap->name[i];
+		    *p++ = 0;
+                } else if (ap->name[i] < 0xE0) {
+		    *p++ = ((ap->name[i] & 3) << 6) | (ap->name[i+1] & 0x3F);
+		    *p++ = ((ap->name[i] & 0x1C) >> 2);
+		    i++;
+                } else {
+		    ASSERT(ap->name[i] < 0xF0);
+		    *p++ = ((ap->name[i+1] & 3) << 6) | (ap->name[i+2] & 0x3C);
+		    *p++ = ((ap->name[i] & 0xF) << 4) | ((ap->name[i+1] & 0x3C) >> 2);
+		    i += 2;
+		}
+            }
 	    break;
 	default:
 	    ASSERT(0);
author	Sverker Eriksson <[email protected]>	2013-09-20 20:13:40 +0200
committer	Sverker Eriksson <[email protected]>	2013-09-24 16:23:55 +0200
commit	b6b0b73ecec7facefb3b9c5a7ef663599cfee4aa (patch)
tree	9cd909f99ac4684d0abc9bc7a8f408fc9a80d01d /erts/emulator/beam/erl_unicode.c
parent	3a0402e1157a89fac210f2276d9461aab30a9968 (diff)
download	otp-b6b0b73ecec7facefb3b9c5a7ef663599cfee4aa.tar.gz otp-b6b0b73ecec7facefb3b9c5a7ef663599cfee4aa.tar.bz2 otp-b6b0b73ecec7facefb3b9c5a7ef663599cfee4aa.zip