ziglang · data-man · Dec 22, 2019 · Dec 29, 2019 · Dec 29, 2019 · daurnimator
diff --git a/lib/std/fmt.zig b/lib/std/fmt.zig
@@ -76,6 +76,7 @@ fn peekIsAlign(comptime fmt: []const u8) bool {
 /// - `d`: output numeric value in decimal notation
 /// - `b`: output integer value in binary notation
 /// - `c`: output integer as an ASCII character. Integer type must have 8 bits at max.
+/// - `u`: output integer as an UTF-8 sequence. Integer type must have 21 bits at max.
 /// - `*`: output the address of the value instead of the value itself.
 ///
 /// If a formatted user type contains a function of the type
@@ -520,6 +521,12 @@ pub fn formatIntValue(
         } else {
             @compileError("Cannot print integer that is larger than 8 bits as a ascii");
         }
+    } else if (comptime std.mem.eql(u8, fmt, "u")) {
+        if (@TypeOf(int_value).bit_count <= 21) {
+            return formatUtf8Codepoint(@as(u21, int_value), options, context, Errors, output);
+        } else {
+            @compileError("Cannot print integer that is larger than 21 bits as an UTF-8 sequence");
+        }
     } else if (comptime std.mem.eql(u8, fmt, "b")) {
         radix = 2;
         uppercase = false;
@@ -587,6 +594,18 @@ pub fn formatAsciiChar(
     return format(context, Errors, output, "\\x{x:0<2}", .{c});
 }
 
+pub fn formatUtf8Codepoint(
+    c: u21,
+    options: FormatOptions,
+    context: var,
+    comptime Errors: type,
+    output: fn (@TypeOf(context), []const u8) Errors!void,
+) Errors!void {
+    var buf: [4]u8 = undefined;
+    const len = std.unicode.utf8Encode(c, buf[0..]) catch unreachable;
+    return output(context, @as(*const [4]u8, &buf)[0..len]);
+}
+
 pub fn formatBuf(
     buf: []const u8,
     options: FormatOptions,
@@ -1207,6 +1226,14 @@ test "int.specifier" {
         const value: u8 = 'a';
         try testFmt("u8: a\n", "u8: {c}\n", .{value});
     }
+    {
+        const value: u8 = 'a';
+        try testFmt("UTF-8: a\n", "UTF-8: {u}\n", .{value});
+    }
+    {
+        const value: u21 = 0x1F310;
+        try testFmt("UTF-8: 🌐\n", "UTF-8: {u}\n", .{value});
+    }
     {
         const value: u8 = 0b1100;
         try testFmt("u8: 0b1100\n", "u8: 0b{b}\n", .{value});