UTF-8 encode and decode: Difference between revisions

Content added Content deleted
(Scala solution added)
Line 853: Line 853:
codePoint, Character.getName(codePoint), leftAlignedHex, s, utf8Decode(bytes))
codePoint, Character.getName(codePoint), leftAlignedHex, s, utf8Decode(bytes))
}</lang>
}</lang>
=== Functional solution===
<lang scala>object UTF8EncodeAndDecode extends App {

val codePoints = Seq(0x0041, 0x00F6, 0x0416, 0x20AC, 0x1D11E)

def utf8Encode(codepoint: Int): Array[Byte] =
new String(Array[Int](codepoint), 0, 1).getBytes(StandardCharsets.UTF_8)

def utf8Decode(bytes: Array[Byte]): Int =
new String(bytes, StandardCharsets.UTF_8).codePointAt(0)

println("Char Name Unicode UTF-8 Decoded")
for (codePoint <- codePoints) {
val w = if (Character.isBmpCodePoint(codePoint)) 4 else 5 // Compute spacing
val bytes = utf8Encode(codePoint)

def leftAlignedHex: String = f"U+${codePoint}%04X"

def utf: String = bytes.foldLeft("")(_ + "%02X ".format(_))

printf(s"%-${w}c %-36s %-7s %-${16 - w}s%c%n",
codePoint, Character.getName(codePoint), leftAlignedHex, utf, utf8Decode(bytes))
}

println(s"\nSuccessfully completed without errors. [total ${scala.compat.Platform.currentTime - executionStart} ms]")
}<lang>


=={{header|Sidef}}==
=={{header|Sidef}}==