Hex dump
You are encouraged to solve this task according to the task description, using any language you may know.
A hex dump is a textual representation of bytes in a file, and hexdump is a command-line tool that can dump bytes from a file in a variety of formats, including hexadecimal, octal and ASCII.
hexdump's canonical format displays, on each line:
- a byte offset in hexadecimal,
- up to 16 bytes in hexadecimal, separated by spaces, with an extra space between the 8th and 9th byte,
- the same 16 bytes interpreted as ASCII characters, with non-printing and non-ascii characters replaced with a dot (
.
), surrounded by pipes (|
).
The last line of output shows a final byte count, also in hexadecimal.
For example, the string "Rosetta Code is a programming chrestomathy site 😀." encoded in UTF-16 (little-endian - the first two bytes are the byte order mark), displayed in the canonical format is:
00000000 ff fe 52 00 6f 00 73 00 65 00 74 00 74 00 61 00 |..R.o.s.e.t.t.a.|
00000010 20 00 43 00 6f 00 64 00 65 00 20 00 69 00 73 00 | .C.o.d.e. .i.s.|
00000020 20 00 61 00 20 00 70 00 72 00 6f 00 67 00 72 00 | .a. .p.r.o.g.r.|
00000030 61 00 6d 00 6d 00 69 00 6e 00 67 00 20 00 63 00 |a.m.m.i.n.g. .c.|
00000040 68 00 72 00 65 00 73 00 74 00 6f 00 6d 00 61 00 |h.r.e.s.t.o.m.a.|
00000050 74 00 68 00 79 00 20 00 73 00 69 00 74 00 65 00 |t.h.y. .s.i.t.e.|
00000060 20 00 3d d8 00 de 2e 00 | .=.....|
00000068
- Task
Implement a hexdump-like program that:
- outputs in the canonical format,
- takes an optional offset in bytes from which to start,
- takes an optional length in bytes after which it will stop.
Demonstrate your implementation by showing the canonical hex dump of the example above, plus any other examples you find useful.
- Stretch
xxd is another command-line tool similar to hexdump. It offers a binary mode where bytes are displayed in bits instead of hexadecimal.
Implement a binary mode. For this task, in binary mode, the example above should be displayed like this:
00000000 11111111 11111110 01010010 00000000 01101111 00000000 |..R.o.|
00000006 01110011 00000000 01100101 00000000 01110100 00000000 |s.e.t.|
0000000c 01110100 00000000 01100001 00000000 00100000 00000000 |t.a. .|
00000012 01000011 00000000 01101111 00000000 01100100 00000000 |C.o.d.|
00000018 01100101 00000000 00100000 00000000 01101001 00000000 |e. .i.|
0000001e 01110011 00000000 00100000 00000000 01100001 00000000 |s. .a.|
00000024 00100000 00000000 01110000 00000000 01110010 00000000 | .p.r.|
0000002a 01101111 00000000 01100111 00000000 01110010 00000000 |o.g.r.|
00000030 01100001 00000000 01101101 00000000 01101101 00000000 |a.m.m.|
00000036 01101001 00000000 01101110 00000000 01100111 00000000 |i.n.g.|
0000003c 00100000 00000000 01100011 00000000 01101000 00000000 | .c.h.|
00000042 01110010 00000000 01100101 00000000 01110011 00000000 |r.e.s.|
00000048 01110100 00000000 01101111 00000000 01101101 00000000 |t.o.m.|
0000004e 01100001 00000000 01110100 00000000 01101000 00000000 |a.t.h.|
00000054 01111001 00000000 00100000 00000000 01110011 00000000 |y. .s.|
0000005a 01101001 00000000 01110100 00000000 01100101 00000000 |i.t.e.|
00000060 00100000 00000000 00111101 11011000 00000000 11011110 | .=...|
00000066 00101110 00000000 |..|
00000068
Other hexdump/xxd features and a command line interface to your program are optional.
AArch64 Assembly
/* ARM assembly AARCH64 Raspberry PI 3B */
/* program hexadump64.s */
/*******************************************/
/* Constantes */
/*******************************************/
/* for this file see task include a file in language AArch64 assembly*/
.include "../includeConstantesARM64.inc"
.equ NBCARLIBEL, 45
/*******************************************/
/* Macros */
/*******************************************/
//.include "../../ficmacros64.inc" @ for developer debugging
/*******************************************/
/* Initialized data */
/*******************************************/
.data
szMessDebutPgm: .asciz "Program 64 bits start. \n"
szCarriageReturn: .asciz "\n"
szMessFinOK: .asciz "Program normal end. \n"
szTitre1: .asciz "Dump memory 1"
szTitre2: .asciz "Dump memory main"
// title info line display
szTitleDump: .ascii "Memory dump"
sadx1: .ascii " : "
sBlockAddress: .fill 17, 1, ' '
sTitleDisp: .fill NBCARLIBEL,1,' '
.asciz "\n"
// block datas line display
sAreaBlockAddress: .fill 13, 1, ' '
.ascii " "
sAreaHexaChar: .fill 47, 1, ' '
.ascii " "
sAreaCharAscii: .fill 16, 1, ' '
s3mem: .asciz "\n"
/*******************************************/
/* UnInitialized data */
/*******************************************/
.bss
.align 4
szZoneConv: .skip 24
/*******************************************/
/* code section */
/*******************************************/
.text
.global main
main:
ldr x0,qAdrszMessDebutPgm
bl affichageMess
ldr x0,qAdrszMessDebutPgm
mov x1,#4 // display 4 blocks
ldr x2,qAdrszTitre1
bl hexaDump
adr x0,main
add x0,x0,#5 // for no block address
mov x1,#2 // display 2 blocks
ldr x2,qAdrszTitre2
bl hexaDump
ldr x0,qAdrszMessFinOK
bl affichageMess
100: // standard end of the program
mov x0, #0 // return code
mov x8,EXIT
svc 0 // perform system call
qAdrszMessDebutPgm: .quad szMessDebutPgm
qAdrszMessFinOK: .quad szMessFinOK
qAdrszCarriageReturn: .quad szCarriageReturn
qAdrszTitre1: .quad szTitre1
qAdrszTitre2: .quad szTitre2
/*******************************************/
/* display memory area */
/*******************************************/
/* r0 address memoire r1 nombre de bloc r2 titre */
hexaDump: //
stp x1,lr,[sp,-16]! // save registers
stp x2,x3,[sp,-16]!
stp x4,x5,[sp,-16]!
stp x6,x7,[sp,-16]!
stp x8,x9,[sp,-16]!
mov x4,x0
mov x6,x1 // number of blocks
ldr x1,qAdrsBlockAddress // result address
bl conversion16
mov x7,#0
ldr x5,qAdrsTitleDisp //
1: // title copy loop
ldrb w3,[x2,x7]
cmp x3,#0
beq 2f
strb w3,[x5,x7]
add x7,x7,#1
b 1b
2:
mov x3,#' '
3:
cmp x7,#NBCARLIBEL
bge 4f
strb w3,[x5,x7]
add x7,x7,#1
b 3b
4:
mov x2,x4 // memory address begin
ldr x0,qAdrszTitleDump // display dump title
bl affichageMess
mov x1, x2, ASR #4 // compute block 16 bytes begin
mov x1, x1, LSL #4 // divide by 16 and mult by 16
mov x8,#3 // 3 charaters by byte displayed
sub x0,x2,x1 // memory offset in block
mul x5,x0,x8 // character display offset
ldr x0,qAdrsAreaHexaChar // store address
add x7,x0,x5 // compute position
sub x7,x7,#1 // in front of the character display
mov x0,#'*' // store star of memory address begin
strb w0,[x7]
5: // loop display block
mov x4,x1 // display block address
mov x0,x1
// ldr x1,qAdrsAreaBlockAddress // area block address
ldr x1,qAdrszZoneConv
bl prepRegistre16 // conversion hexa
// recopie de 12 caractères de l'adresse
mov x8,#3 // pour supprimer les 4 premiers zeros
mov x0,#0
ldr x1,qAdrszZoneConv
ldr x2,qAdrsAreaBlockAddress // et mettre le résultat dans la zone d'affichage
6:
ldrb w5,[x1,x8]
strb w5,[x2,x0]
add x0,x0,#1
add x8,x8,#1
cmp x8,#15 // arrêt au 15ième caractère
ble 6b
mov x1,x4 // restaur block address
mov x8,#3
mov x2,#0
7: // begin loop display 16 byte in hexa
ldrb w4,[x1,x2] // load byte
ldr x0,qAdrsAreaHexaChar //
mul x5,x2,x8 // compute store offset
add x0,x0,x5
mov x3, x4, ASR #4 // conversion byte in two hexa characters
cmp x3,#9 // < 10
add x9,x3,#48 // number
//addle x5,x3,#48 // number
add x5,x3,#55 // letter A-F
csel x5,x9,x5,le
strb w5,[x0] // store result
add x0,x0,#1 // second character
mov x5,x3,LSL #4 //
sub x3,x4,x5 // compute remander divsion by 10
cmp x3,#9 // < 10
add x9,x3,#48 // number
//addle x5,x3,#48 // number
add x5,x3,#55 // letter A-F
csel x5,x9,x5,le
strb w5,[x0] // store second character
add x2,x2,#1 // increment byte indice
cmp x2,#16 // block 16 bytes end ?
blt 7b // no -> loop
// display in characters ascii
mov x2,#0 // byte indice
8: // begin loop ascii display
ldrb w4,[x1,x2] // load byte
cmp x4,#31 // character ascii ?
ble 9f // no
cmp x4,#125 // character ascii ?
bgt 9f // no
b 10f
9:
mov x4,#46 // character ascii
10:
ldr x0,qAdrsAreaCharAscii //
add x0,x0,x2
strb w4,[x0]
add x2,x2,#1
cmp x2,#16 // block end ?
blt 8b // no ->loop
ldr x0,qAdrsAreaBlockAddress // begin block address
bl affichageMess
mov x0,#' '
strb w0,[x7] // raz star address for other line
add x1,x1,#16 // next block
subs x6,x6,#1 // decrement block number
bgt 5b // and loop if not zero
100:
ldp x8,x9,[sp],16
ldp x6,x7,[sp],16
ldp x4,x5,[sp],16
ldp x2,x3,[sp],16
ldp x1,lr,[sp],16
ret
qAdrszTitleDump: .quad szTitleDump
qAdrsBlockAddress: .quad sBlockAddress
qAdrsTitleDisp: .quad sTitleDisp
qAdrsAreaHexaChar: .quad sAreaHexaChar
qAdrsAreaBlockAddress: .quad sAreaBlockAddress
qAdrsAreaCharAscii: .quad sAreaCharAscii
qAdrszZoneConv: .quad szZoneConv
/******************************************************************/
/* conversion d'un registre en hexadecimal */
/******************************************************************/
/* x0 contient N° registre and x1 adresse zone receptrice */
prepRegistre16:
stp x0,lr,[sp,-48]! // save registres
stp x1,x2,[sp,32] // save registres
stp x3,x4,[sp,16] // save registres
mov x2,#60 // start bit position
mov x4,#0xF000000000000000 // masque
mov x3,x0 // save entry value
1: // start loop
and x0,x3,x4 // valeur du registre and du masque
lsr x0,x0,x2 // deplacement droite
cmp x0,#10 // >= 10 ?
bge 2f // oui
add x0,x0,#48 // non c'est un chiffre
b 3f
2:
add x0,x0,#55 // sinon c'est une lettre A-F
3:
strb w0,[x1],#1 // stocke le chiffre et + 1 dans la pointeur
lsr x4,x4,#4 // deplace le masque de 4 positions
subs x2,x2,#4 // decrement compteur de 4 bits <= zero ?
bge 1b // non -> boucle
100: // fin standard de la fonction
ldp x3,x4,[sp,16] // restaur des 2 registres
ldp x1,x2,[sp,32] // restaur des 2 registres
ldp x0,lr,[sp],48 // restaur des 2 registres
ret
/***************************************************/
/* ROUTINES INCLUDE */
/***************************************************/
/* for this file see task include a file in language AArch64 assembly*/
.include "../includeARM64.inc"
- Output:
Program 64 bits start. Memory dump : 0000000000420000 Dump memory 1 0000000420000*50 72 6F 67 72 61 6D 20 36 34 20 62 69 74 73 20 Program 64 bits 0000000420010 73 74 61 72 74 2E 20 0A 00 0A 00 50 72 6F 67 72 start. ....Progr 0000000420020 61 6D 20 6E 6F 72 6D 61 6C 20 65 6E 64 2E 20 0A am normal end. . 0000000420030 00 44 75 6D 70 20 6D 65 6D 6F 72 79 20 31 00 44 .Dump memory 1.D Memory dump : 00000000004000B5 Dump memory main 00000004000B0 00 02 00 58 A1*00 00 94 C0 01 00 58 81 00 80 D2 ...X.......X.... 00000004000C0 42 02 00 58 15 00 00 94 40 FF FF 10 00 14 00 91 B..X....@....... Program normal end.
ARM Assembly
/* ARM assembly Raspberry PI */
/* program hexadump.s */
/* REMARK 1 : this program use routines in a include file
see task Include a file language arm assembly
for the routine affichageMess conversion10
see at end of this program the instruction include */
/*******************************************/
/* Constantes */
/*******************************************/
.include "../constantes.inc"
.equ NBCARLIBEL, 45
/*******************************************/
/* Macros */
/*******************************************/
//.include "../../ficmacros32.inc" @ for developer debugging
/*******************************************/
/* Initialized data */
/*******************************************/
.data
szMessDebutPgm: .asciz "Program 32 bits start. \n"
szCarriageReturn: .asciz "\n"
szMessFinOK: .asciz "Program normal end. \n"
szTitre1: .asciz "Dump memory 1"
szTitre2: .asciz "Dump memory main"
@ title info line display
szTitleDump: .ascii "Memory dump : "
sadr1: .ascii " address : "
sBlockAddress: .ascii " "
sTitleDisp: .fill NBCARLIBEL,1,' '
.asciz "\n"
@ block datas line display
sAreaBlockAddress: .fill 9, 1, ' '
.ascii " "
sAreaHexaChar: .fill 48, 1, ' '
.ascii " "
sAreaCharAscii: .fill 16, 1, ' '
s3mem: .asciz "\n"
/*******************************************/
/* UnInitialized data */
/*******************************************/
.bss
//buffer_conversion: .skip 40
.align 4
/*******************************************/
/* code section */
/*******************************************/
.text
.global main
main:
ldr r0,iAdrszMessDebutPgm
bl affichageMess
ldr r0,iAdrszMessDebutPgm
mov r1,#4 @ display 4 blocks
ldr r2,iAdrszTitre1
bl hexaDump
adr r0,main
add r0,#5 @ for no block address
mov r1,#2 @ display 2 blocks
ldr r2,iAdrszTitre2
bl hexaDump
ldr r0,iAdrszMessFinOK
bl affichageMess
100: @ standard end of the program
mov r0, #0 @ return code
mov r7, #EXIT @ request to exit program
svc 0 @ perform system call
iAdrszMessDebutPgm: .int szMessDebutPgm
iAdrszMessFinOK: .int szMessFinOK
iAdrszCarriageReturn: .int szCarriageReturn
iAdrszTitre1: .int szTitre1
iAdrszTitre2: .int szTitre2
/*******************************************/
/* display memory area */
/*******************************************/
/* r0 address memoire r1 nombre de bloc r2 titre */
hexaDump: @
push {r0-r8,fp,lr}
mov r4,r0
mov r6,r1 @ number of blocks
ldr r1,iAdrsBlockAddress @ result address
bl conversion16
mov r7,#0
ldr r5,iAdrsTitleDisp @
1: @ title copy loop
ldrb r3,[r2,r7]
cmp r3,#0
strneb r3,[r5,r7]
addne r7,#1
bne 1b
mov r3,#' '
2:
cmp r7,#NBCARLIBEL
strltb r3,[r5,r7]
addlt r7,#1
blt 2b
mov r2,r4 @ memory address begin
ldr r0,iAdrszTitleDump @ display dump title
bl affichageMess
mov r1, r2, ASR #4 @ compute block 16 bytes begin
mov r1, r1, LSL #4 @ divide by 16 and mult by 16
mov r8,#3 @ 3 charaters by byte displayed
sub r0,r2,r1 @ memory offset in block
mul r5,r0,r8 @ character display offset
ldr r0,iAdrsAreaHexaChar @ store address
add r7,r0,r5 @ compute position
sub r7,r7,#1 @ in front of the character display
mov r0,#'*' @ store star of memory address begin
strb r0,[r7]
3: @ loop display block
mov r4,r1 @ display block address
mov r0,r1
ldr r1,iAdrsAreaBlockAddress @ area block address
bl conversion16 @ conversion hexa
mov r1,r4 @ restaur block address
mov r8,#3
mov r2,#0
4: @ begin loop display 16 byte in hexa
ldrb r4,[r1,r2] @ load byte
ldr r0,iAdrsAreaHexaChar @
mul r5,r2,r8 @ compute store offset
add r0,r5
mov r3, r4, ASR #4 @ conversion byte in two hexa characters
cmp r3,#9 @ < 10
addle r5,r3,#48 @ number
addgt r5,r3,#55 @ letter A-F
strb r5,[r0] @ store result
add r0,#1 @ second character
mov r5,r3,LSL #4 @
sub r3,r4,r5 @ compute remander divsion by 10
cmp r3,#9 @ < 10
addle r5,r3,#48 @ number
addgt r5,r3,#55 @ letter A-F
strb r5,[r0] @ store second character
add r2,r2,#1 @ increment byte indice
cmp r2,#16 @ block 16 bytes end ?
blt 4b @ no -> loop
@ display in characters ascii
mov r2,#0 @ byte indice
5: @ begin loop ascii display
ldrb r4,[r1,r2] @ load byte
cmp r4,#31 @ character ascii ?
ble 6f @ no
cmp r4,#125 @ character ascii ?
bgt 6f @ no
b 7f
6:
mov r4,#46 @ character ascii
7:
ldr r0,iAdrsAreaCharAscii @
add r0,r2
strb r4,[r0]
add r2,r2,#1
cmp r2,#16 @ block end ?
blt 5b @ no ->loop
ldr r0,iAdrsAreaBlockAddress @ begin block address
bl affichageMess
mov r0,#' '
strb r0,[r7] @ raz star address for other line
add r1,r1,#16 @ next block
subs r6,#1 @ decrement block number
bgt 3b @ and loop if not zero
100:
pop {r0-r8,fp,pc}
iAdrszTitleDump: .int szTitleDump
iAdrsBlockAddress: .int sBlockAddress
iAdrsTitleDisp: .int sTitleDisp
iAdrsAreaHexaChar: .int sAreaHexaChar
iAdrsAreaBlockAddress: .int sAreaBlockAddress
iAdrsAreaCharAscii: .int sAreaCharAscii
/***************************************************/
/* ROUTINES INCLUDE */
/***************************************************/
.include "../affichage.inc"
- Output:
Program 32 bits start. Memory dump : address : 00012000 Dump memory 1 00012000 *50 72 6F 67 72 61 6D 20 33 32 20 62 69 74 73 20 Program 32 bits 00012010 73 74 61 72 74 2E 20 0A 00 0A 00 50 72 6F 67 72 start. ....Progr 00012020 61 6D 20 6E 6F 72 6D 61 6C 20 65 6E 64 2E 20 0A am normal end. . 00012030 00 44 75 6D 70 20 6D 65 6D 6F 72 79 20 31 00 44 .Dump memory 1.D Memory dump : address : 00010085 Dump memory main 00010080 38 00 9F E5 66*00 00 EB 30 00 9F E5 04 10 A0 E3 8...f...0....... 00010090 34 20 9F E5 0E 00 00 EB 20 00 4F E2 05 00 80 E2 4 ...... .O..... Program normal end.
C
#include <ctype.h>
#include <errno.h>
#include <limits.h>
#include <stdbool.h>
#include <stdio.h>
#include <stdlib.h>
#define BYTES_HEX 16
#define BYTES_BIN 6
static void print_hex(const char* data, long count) {
long i = 0;
for (; i < count; ++i) {
if (i % 8 == 0)
putchar(' ');
printf(" %02x", (unsigned char)data[i]);
}
for (; i < BYTES_HEX; ++i) {
if (i % 8 == 0)
putchar(' ');
printf(" ");
}
}
static void print_binary(const char* data, long count) {
long i = 0;
putchar(' ');
for (; i < count; ++i) {
unsigned char c = data[i];
putchar(' ');
for (unsigned char m = 1 << 7; m != 0; m >>= 1)
putchar((c & m) ? '1' : '0');
}
for (; i < BYTES_BIN; ++i)
printf(" ");
}
static void print_chars(const char* data, long count) {
for (long i = 0; i < count; ++i) {
unsigned char c = data[i];
putchar(isprint(c) ? c : '.');
}
}
static bool string_to_long(const char* str, long* value) {
char* eptr;
long result = strtol(str, &eptr, 0);
if (errno || *eptr || result < 0)
return false;
*value = result;
return true;
}
static void usage(const char* program) {
fprintf(stderr, "usage: %s [-b] [-s skip] [-n length] filename\n", program);
}
int main(int argc, char** argv) {
long offset = 0;
long max_length = LONG_MAX;
bool binary = false;
int i = 1;
for (; i < argc && argv[i][0] == '-'; ++i) {
switch (argv[i][1]) {
case 's':
if (++i == argc) {
usage(argv[0]);
return EXIT_FAILURE;
}
if (!string_to_long(argv[i], &offset)) {
fprintf(stderr, "Invalid skip '%s'.\n", argv[i]);
return EXIT_FAILURE;
}
break;
case 'n':
if (++i == argc) {
usage(argv[0]);
return EXIT_FAILURE;
}
if (!string_to_long(argv[i], &max_length)) {
fprintf(stderr, "Invalid length '%s'.\n", argv[i]);
return EXIT_FAILURE;
}
break;
case 'b':
binary = true;
break;
default:
usage(argv[0]);
return EXIT_FAILURE;
}
}
if (i + 1 != argc) {
usage(argv[0]);
return EXIT_FAILURE;
}
FILE* fp = fopen(argv[i], "rb");
if (!fp) {
perror(argv[i]);
return EXIT_FAILURE;
}
if (fseek(fp, 0, SEEK_END)) {
perror("fseek");
fclose(fp);
return EXIT_FAILURE;
}
long max_offset = ftell(fp);
if (offset > max_offset)
offset = max_offset;
if (fseek(fp, offset, SEEK_SET)) {
perror("fseek");
fclose(fp);
return EXIT_FAILURE;
}
char data[BYTES_HEX];
const long max_count = binary ? BYTES_BIN : BYTES_HEX;
for (long length = 0; length <= max_length;) {
printf("%08lx", offset);
long count = fread(data, 1, max_count, fp);
if (count > max_length - length)
count = max_length - length;
if (count == 0) {
putchar('\n');
break;
}
if (binary)
print_binary(data, count);
else
print_hex(data, count);
printf(" |");
print_chars(data, count);
printf("|\n");
offset += count;
length += count;
}
fclose(fp);
return EXIT_SUCCESS;
}
- Output:
Hexadecimal output:
00000000 ff fe 52 00 6f 00 73 00 65 00 74 00 74 00 61 00 |..R.o.s.e.t.t.a.| 00000010 20 00 43 00 6f 00 64 00 65 00 20 00 69 00 73 00 | .C.o.d.e. .i.s.| 00000020 20 00 61 00 20 00 70 00 72 00 6f 00 67 00 72 00 | .a. .p.r.o.g.r.| 00000030 61 00 6d 00 6d 00 69 00 6e 00 67 00 20 00 63 00 |a.m.m.i.n.g. .c.| 00000040 68 00 72 00 65 00 73 00 74 00 6f 00 6d 00 61 00 |h.r.e.s.t.o.m.a.| 00000050 74 00 68 00 79 00 20 00 73 00 69 00 74 00 65 00 |t.h.y. .s.i.t.e.| 00000060 20 00 3d d8 00 de 2e 00 | .=.....| 00000068
Binary output:
00000000 11111111 11111110 01010010 00000000 01101111 00000000 |..R.o.| 00000006 01110011 00000000 01100101 00000000 01110100 00000000 |s.e.t.| 0000000c 01110100 00000000 01100001 00000000 00100000 00000000 |t.a. .| 00000012 01000011 00000000 01101111 00000000 01100100 00000000 |C.o.d.| 00000018 01100101 00000000 00100000 00000000 01101001 00000000 |e. .i.| 0000001e 01110011 00000000 00100000 00000000 01100001 00000000 |s. .a.| 00000024 00100000 00000000 01110000 00000000 01110010 00000000 | .p.r.| 0000002a 01101111 00000000 01100111 00000000 01110010 00000000 |o.g.r.| 00000030 01100001 00000000 01101101 00000000 01101101 00000000 |a.m.m.| 00000036 01101001 00000000 01101110 00000000 01100111 00000000 |i.n.g.| 0000003c 00100000 00000000 01100011 00000000 01101000 00000000 | .c.h.| 00000042 01110010 00000000 01100101 00000000 01110011 00000000 |r.e.s.| 00000048 01110100 00000000 01101111 00000000 01101101 00000000 |t.o.m.| 0000004e 01100001 00000000 01110100 00000000 01101000 00000000 |a.t.h.| 00000054 01111001 00000000 00100000 00000000 01110011 00000000 |y. .s.| 0000005a 01101001 00000000 01110100 00000000 01100101 00000000 |i.t.e.| 00000060 00100000 00000000 00111101 11011000 00000000 11011110 | .=...| 00000066 00101110 00000000 |..| 00000068
C++
#include <algorithm>
#include <bitset>
#include <cstdint>
#include <filesystem>
#include <format>
#include <fstream>
#include <iostream>
#include <string>
#include <vector>
enum DumpType { HEX, XXD };
struct DumpDetails {
DumpType type;
uint32_t factor;
uint32_t block_length;
uint32_t line_length;
};
class Converter {
public:
Converter(const std::vector<uint8_t>& aBytes, const uint32_t& aStart_Index,
const uint32_t& aLength, const DumpDetails& aDump_Details) {
start_index =
std::min(static_cast<uint32_t>(aBytes.size()), std::max(static_cast<uint32_t>(0), aStart_Index));
length = ( aLength < 1 || aLength > aBytes.size() - start_index ) ? aBytes.size() - start_index : aLength;
dump_details = aDump_Details;
std::copy(aBytes.begin() + start_index, aBytes.begin() + start_index + length, std::back_inserter(bytes));
}
std::string to_converted_string() {
std::string result = "";
for ( uint32_t i = 0; i * dump_details.factor < bytes.size(); ++i ) {
result += to_converted_row(byte_vector(i * dump_details.factor, dump_details.factor));
}
return result + to_hex(counter_finish);
}
private:
std::vector<uint8_t> byte_vector(const uint32_t& current_index, const uint32_t& current_length) {
counter_start = current_index;
counter_finish = std::min(static_cast<size_t>(current_index + current_length), bytes.size());
std::vector<uint8_t> subvector(bytes.begin() + current_index, bytes.begin() + counter_finish);
return subvector;
}
std::string to_converted_row(std::vector<uint8_t> row) const {
std::string line, characters;
for ( const uint8_t& byte : row ) {
line += to_digit(byte);
characters += printable_character(byte);
}
line = padding(insertSpace(line));
return to_hex(counter_start) + line + "|" + characters + "|" + "\n";
}
std::string insertSpace(const std::string& line) const {
std::string result = line;
for ( uint8_t i = dump_details.block_length; i < line.size(); i += dump_details.block_length ) {
result.insert(i++, " ");
}
return result;
}
std::string to_digit(const uint32_t& number) const {
std::string result = "";
switch ( dump_details.type ) {
case DumpType::HEX : result = std::format("{:02x}", number & 0xff) + " "; break;
case DumpType::XXD : result = std::bitset<8>(number).to_string(); break;
};
return result;
}
std::string printable_character(const uint32_t& number) const {
return std::string(1, ( number >= 32 && number < 127 ) ? static_cast<char>(number) : '.');
}
std::string padding(const std::string& line) const {
return line + std::string(dump_details.line_length - line.size(), ' ');
}
std::string to_hex(const uint32_t& number) const {
return std::format("{:08x}", number) + " ";
}
uint32_t counter_start = 0, counter_finish = 0;
uint32_t start_index, length;
std::vector<uint8_t> bytes;
DumpDetails dump_details;
};
std::vector<uint8_t> read_file_data(const std::string& file_name) {
std::filesystem::path input_file_path { file_name };
const uint64_t length = std::filesystem::file_size(input_file_path);
if ( length == 0 ) {
return { };
}
std::vector<uint8_t> buffer(length);
std::ifstream input_file(file_name, std::ios_base::binary);
input_file.read(reinterpret_cast<char*>(buffer.data()), length);
input_file.close();
return buffer;
}
int main() {
std::vector<uint8_t> bytes = read_file_data("ExampleUTF16LE.dat");
DumpDetails hex = { DumpType::HEX, 16, 24, 50 };
DumpDetails xxd = { DumpType::XXD, 6, 8, 55 };
std::cout << "Hex dump of the entire file:" << std::endl;
std::cout << Converter(bytes, 0, bytes.size(), hex).to_converted_string() << std::endl << std::endl;
std::cout << "xxd dump of the entire file:" << std::endl;
std::cout << Converter(bytes, 0, bytes.size(), xxd).to_converted_string() << std::endl << std::endl;
std::cout << "Hex dump of the file from byte 20 to byte 94:" << std::endl;
std::cout << Converter(bytes, 20, 75, hex).to_converted_string() << std::endl << std::endl;
std::cout << "xxd dump of the file from byte 38 to byte 58:" << std::endl;
std::cout << Converter(bytes, 38, 21, xxd).to_converted_string() << std::endl;
}
- Output:
Hex dump of the entire file: 00000000 ff fe 52 00 6f 00 73 00 65 00 74 00 74 00 61 00 |..R.o.s.e.t.t.a.| 00000010 20 00 43 00 6f 00 64 00 65 00 20 00 69 00 73 00 | .C.o.d.e. .i.s.| 00000020 20 00 61 00 20 00 70 00 72 00 6f 00 67 00 72 00 | .a. .p.r.o.g.r.| 00000030 61 00 6d 00 6d 00 69 00 6e 00 67 00 20 00 63 00 |a.m.m.i.n.g. .c.| 00000040 68 00 72 00 65 00 73 00 74 00 6f 00 6d 00 61 00 |h.r.e.s.t.o.m.a.| 00000050 74 00 68 00 79 00 20 00 73 00 69 00 74 00 65 00 |t.h.y. .s.i.t.e.| 00000060 20 00 3d d8 00 de 2e 00 | .=.....| 00000068 xxd dump of the entire file: 00000000 11111111 11111110 01010010 00000000 01101111 00000000 |..R.o.| 00000006 01110011 00000000 01100101 00000000 01110100 00000000 |s.e.t.| 0000000c 01110100 00000000 01100001 00000000 00100000 00000000 |t.a. .| 00000012 01000011 00000000 01101111 00000000 01100100 00000000 |C.o.d.| 00000018 01100101 00000000 00100000 00000000 01101001 00000000 |e. .i.| 0000001e 01110011 00000000 00100000 00000000 01100001 00000000 |s. .a.| 00000024 00100000 00000000 01110000 00000000 01110010 00000000 | .p.r.| 0000002a 01101111 00000000 01100111 00000000 01110010 00000000 |o.g.r.| 00000030 01100001 00000000 01101101 00000000 01101101 00000000 |a.m.m.| 00000036 01101001 00000000 01101110 00000000 01100111 00000000 |i.n.g.| 0000003c 00100000 00000000 01100011 00000000 01101000 00000000 | .c.h.| 00000042 01110010 00000000 01100101 00000000 01110011 00000000 |r.e.s.| 00000048 01110100 00000000 01101111 00000000 01101101 00000000 |t.o.m.| 0000004e 01100001 00000000 01110100 00000000 01101000 00000000 |a.t.h.| 00000054 01111001 00000000 00100000 00000000 01110011 00000000 |y. .s.| 0000005a 01101001 00000000 01110100 00000000 01100101 00000000 |i.t.e.| 00000060 00100000 00000000 00111101 11011000 00000000 11011110 | .=...| 00000066 00101110 00000000 |..| 00000068 Hex dump of the file from byte 20 to byte 94: 00000000 6f 00 64 00 65 00 20 00 69 00 73 00 20 00 61 00 |o.d.e. .i.s. .a.| 00000010 20 00 70 00 72 00 6f 00 67 00 72 00 61 00 6d 00 | .p.r.o.g.r.a.m.| 00000020 6d 00 69 00 6e 00 67 00 20 00 63 00 68 00 72 00 |m.i.n.g. .c.h.r.| 00000030 65 00 73 00 74 00 6f 00 6d 00 61 00 74 00 68 00 |e.s.t.o.m.a.t.h.| 00000040 79 00 20 00 73 00 69 00 74 00 65 |y. .s.i.t.e| 0000004b xxd dump of the file from byte 38 to byte 58: 00000000 01110000 00000000 01110010 00000000 01101111 00000000 |p.r.o.| 00000006 01100111 00000000 01110010 00000000 01100001 00000000 |g.r.a.| 0000000c 01101101 00000000 01101101 00000000 01101001 00000000 |m.m.i.| 00000012 01101110 00000000 01100111 |n.g| 00000015
FreeBASIC
Code adapted from https://github.com/jlaasonen/hexfile
The code is from Jussi Laasonen (https://jlaasonen.me)
'Usage: hexfile [-i <first index>] <file>
Const bytesPerLine = 16
Const tabWidth = 3
Const fileIndexWidth = 8
Const firstIndex = 1
Const asciiLowerBound = 31
Const asciiUpperBound = 127
Const emptyByte = " "
Const emptyAsciiByte = " "
Const nonAsciiByte = "."
Enum Keys Explicit
Up = &H48FF
PageUp = &H49FF
Down = &H50FF
PageDown = &H51FF
Home = &H47FF
End_ = &H4FFF
Esc = 27
End Enum
Sub GetLine(Byval fileIndex As Longint, Byval fileNumber As Integer, bytes() As Ubyte)
Dim bytesread As Uinteger
If Get(#fileNumber,fileIndex,bytes(), ,bytesread) = 0 And bytesread > 0 Then
Redim Preserve bytes(bytesread)
Else
Erase bytes
End If
End Sub
Function ByteToAscii(Byval byte_ As Ubyte) As String
Return Iif(byte_ > asciiLowerBound And byte_ < asciiUpperBound, Chr(byte_), nonAsciiByte)
End Function
Function MakeLine(Byval firstIndexDisplay As Longint, Byval fileIndex As Longint, bytes() As Ubyte) As String
If Ubound(bytes) < Lbound(bytes) Then Return "" End If
Dim hexBytes As String = ""
Dim asciiBytes As String = ""
For byteIndex As Integer = Lbound(bytes) To Lbound(bytes) + bytesPerLine - 1
If byteIndex <= Ubound(bytes) Then
Dim byte_ As Ubyte = bytes(byteIndex)
asciiBytes += ByteToAscii(byte_)
hexBytes += Hex(byte_, 2)
Else
asciiBytes += emptyAsciiByte
hexBytes += emptyByte
End If
hexBytes += Iif(byteIndex = (bytesPerLine\2)-1, " ", " ")
Next
Dim displayIndex As Const Longint = fileIndex - firstIndex + firstIndexDisplay
Return Space(1) + Hex(displayIndex,fileIndexWidth) + Space(tabWidth) +_
hexBytes + Space(tabWidth-1) + asciiBytes
End Function
Sub DumpInteractive(Byval fileNumber As Integer, Byval firstIndexDisplay As Longint)
Dim consoleDimensions As Integer = Width()
Dim linesPerPage As Integer = Hiword(consoleDimensions)
Dim bytesPerPage As Integer = bytesPerline * linesPerPage
Dim numberOfFullLines As Longint = (Lof(fileNumber)-1) \ bytesPerLine
Dim lastLineIndex As Longint = numberOfFullLines * bytesPerLine + firstIndex
Dim lastPageIndex As Longint = lastLineIndex - bytesPerPage + bytesPerLine
If lastPageIndex < firstIndex Then lastPageIndex = firstIndex End If
Cls
Dim input_ As Long
Dim fileIndex As Longint = firstIndex
Do
Locate 1,1,0
For lineNumber As Integer = 1 To linesPerPage
Dim lineIndex As Longint = fileIndex + (lineNumber-1)*bytesPerLine
Redim bytes(bytesPerLine) As Ubyte
GetLine(lineIndex, fileNumber, bytes())
Dim lineText As String = MakeLine(firstIndexDisplay, lineIndex, bytes())
If lineNumber = linesPerPage Then
Print lineText;
Else
Print lineText
End If
Next
input_ = Getkey
Select Case As Const input_
Case Keys.PageUp
fileIndex -= bytesPerPage
Case Keys.Up
fileIndex -= bytesPerLine
Case Keys.PageDown
fileIndex += bytesPerPage
Case Keys.Down
fileIndex += bytesPerLine
Case Keys.Home
fileIndex = firstIndex
Case Keys.End_
fileIndex = lastPageIndex
End Select
If fileIndex < firstIndex Then fileIndex = firstIndex
If fileIndex > lastPageIndex Then fileIndex = lastPageIndex
Loop Until input_ = Keys.Esc
End Sub
Sub PrintUsage()
Const firstColumn = 4
Const secondColumn = 12
Dim controls(0 To ..., 2) As String = {_
{"Down", "Scroll down one line."},_
{"Up", "Scroll up one line."},_
{"PgDown", "Show next page."},_
{"PgUp", "Show previos page."},_
{"End", "Jump to the end of the file."},_
{"Home", "Jump to the beginning of the file."},_
{"Esc", "Quit."}_
}
Print "hexfile - a simple commandline hexdumper"
Print " (c) 2021-2023 Jussi Laasonen. Licensed under the MIT license."
Print " See https://github.com/jlaasonen/hexfile for full license."
Print !"\nUsage: hexfile [-i <first index>] <file>"
Print !"\nDisplays an interactive hex dump the file."
Print !"\nControls:"
For row As Integer = Lbound(controls) To Ubound(controls)
Print Tab(firstColumn);controls(row,0);Tab(secondColumn);controls(row,1)
Next
Print !"\nOptions:"
Print " -i <first index>"
Print " Starts the displayed file index from the given index. Defaults to 0."
Print " The value is expected in decimal format. For binary, octal or hexadecimal"
Print " Use prefix &B, &O or &H respectively."
End Sub
Const fileIndexArgument = "-i"
Dim fileName As String = ""
Dim firstIndexDisplay As Longint = 0
If __fb_argc__ = 2 Then
fileName = Command(1)
Elseif __fb_argc__ = 4 And Command(1) = fileIndexArgument Then
firstIndexDisplay = Vallng(Command(2))
fileName = Command(3)
End If
Dim fileNumber As Long = Freefile
If fileName = "" Then
PrintUsage()
Elseif Open(fileName For Binary Access Read As #fileNumber) = 0 Then
DumpInteractive(fileNumber, firstIndexDisplay)
Close(fileNumber)
Else
Print "Failed to open file '" + fileName + "'."
End If
J
J's hfd
(hex from decimal) is useful here, but it's not what the task asked for. We need to ensure a leading zero (achievable by adding 256 to the byte numbers, then dropping the resulting leading column of 1s), and then we need to massage the result to add spaces which fit the desired pattern.
The ascii section requires similar massaging, and some decorating.
The binary stretch goal could be approached similarly, but it's more concise to convert to 8 bit binary before massaging.
hexdump=: {{
assert. 'literal'-:datatype y
h=. '',~_2;\_8<@(' '(,,)])\' ',. 0 1}.hfd 256+a.i.y
a=. '',~_16(' |','|',~])\(y e.32}.127{.a.)}'.',:y
i=. 0 1}.hfd(2^32)+16*i.#h
i,.h,.a
}}
bindump=: {{
assert. 'literal'-:datatype y
b=. '',~_6(' ',,)\' ',.,/"2":"0(8#2)#:256+a.i.y
a=. '',~_6(' |','|',~])\(y e.32}.127{.a.)}'.',:y
i=. 0 1}.hfd(2^32)+6*i.#b
i,.b,.a
}}
J doesn't support a "little endian utf-16 literal" datatype, so we need to do a bit of work to create the required value.
sample=: a.{~_1 _2,,_1|."1]0 256#:3 u:7 u:'Rosetta Code is a programming chrestomathy site 😀.'
hexdump a.
00000000 00 01 02 03 04 05 06 07 08 09 0a 0b 0c 0d 0e 0f |................|
00000010 10 11 12 13 14 15 16 17 18 19 1a 1b 1c 1d 1e 1f |................|
00000020 20 21 22 23 24 25 26 27 28 29 2a 2b 2c 2d 2e 2f | !"#$%&'()*+,-./|
00000030 30 31 32 33 34 35 36 37 38 39 3a 3b 3c 3d 3e 3f |0123456789:;<=>?|
00000040 40 41 42 43 44 45 46 47 48 49 4a 4b 4c 4d 4e 4f |@ABCDEFGHIJKLMNO|
00000050 50 51 52 53 54 55 56 57 58 59 5a 5b 5c 5d 5e 5f |PQRSTUVWXYZ[\]^_|
00000060 60 61 62 63 64 65 66 67 68 69 6a 6b 6c 6d 6e 6f |`abcdefghijklmno|
00000070 70 71 72 73 74 75 76 77 78 79 7a 7b 7c 7d 7e 7f |pqrstuvwxyz{|}~.|
00000080 80 81 82 83 84 85 86 87 88 89 8a 8b 8c 8d 8e 8f |................|
00000090 90 91 92 93 94 95 96 97 98 99 9a 9b 9c 9d 9e 9f |................|
000000a0 a0 a1 a2 a3 a4 a5 a6 a7 a8 a9 aa ab ac ad ae af |................|
000000b0 b0 b1 b2 b3 b4 b5 b6 b7 b8 b9 ba bb bc bd be bf |................|
000000c0 c0 c1 c2 c3 c4 c5 c6 c7 c8 c9 ca cb cc cd ce cf |................|
000000d0 d0 d1 d2 d3 d4 d5 d6 d7 d8 d9 da db dc dd de df |................|
000000e0 e0 e1 e2 e3 e4 e5 e6 e7 e8 e9 ea eb ec ed ee ef |................|
000000f0 f0 f1 f2 f3 f4 f5 f6 f7 f8 f9 fa fb fc fd fe ff |................|
00000100
hexdump sample
00000000 ff fe 52 00 6f 00 73 00 65 00 74 00 74 00 61 00 |..R.o.s.e.t.t.a.|
00000010 20 00 43 00 6f 00 64 00 65 00 20 00 69 00 73 00 | .C.o.d.e. .i.s.|
00000020 20 00 61 00 20 00 70 00 72 00 6f 00 67 00 72 00 | .a. .p.r.o.g.r.|
00000030 61 00 6d 00 6d 00 69 00 6e 00 67 00 20 00 63 00 |a.m.m.i.n.g. .c.|
00000040 68 00 72 00 65 00 73 00 74 00 6f 00 6d 00 61 00 |h.r.e.s.t.o.m.a.|
00000050 74 00 68 00 79 00 20 00 73 00 69 00 74 00 65 00 |t.h.y. .s.i.t.e.|
00000060 20 00 3d d8 00 de 2e 00 | .=.....|
00000070
bindump sample
00000000 11111111 11111110 01010010 00000000 01101111 00000000 |..R.o.|
00000006 01110011 00000000 01100101 00000000 01110100 00000000 |s.e.t.|
0000000c 01110100 00000000 01100001 00000000 00100000 00000000 |t.a. .|
00000012 01000011 00000000 01101111 00000000 01100100 00000000 |C.o.d.|
00000018 01100101 00000000 00100000 00000000 01101001 00000000 |e. .i.|
0000001e 01110011 00000000 00100000 00000000 01100001 00000000 |s. .a.|
00000024 00100000 00000000 01110000 00000000 01110010 00000000 | .p.r.|
0000002a 01101111 00000000 01100111 00000000 01110010 00000000 |o.g.r.|
00000030 01100001 00000000 01101101 00000000 01101101 00000000 |a.m.m.|
00000036 01101001 00000000 01101110 00000000 01100111 00000000 |i.n.g.|
0000003c 00100000 00000000 01100011 00000000 01101000 00000000 | .c.h.|
00000042 01110010 00000000 01100101 00000000 01110011 00000000 |r.e.s.|
00000048 01110100 00000000 01101111 00000000 01101101 00000000 |t.o.m.|
0000004e 01100001 00000000 01110100 00000000 01101000 00000000 |a.t.h.|
00000054 01111001 00000000 00100000 00000000 01110011 00000000 |y. .s.|
0000005a 01101001 00000000 01110100 00000000 01100101 00000000 |i.t.e.|
00000060 00100000 00000000 00111101 11011000 00000000 11011110 | .=...|
00000066 00101110 00000000 |..|
0000006c
Java
import java.io.IOException;
import java.nio.file.Files;
import java.nio.file.Path;
import java.util.List;
import java.util.regex.MatchResult;
import java.util.regex.Pattern;
import java.util.stream.Collectors;
import java.util.stream.IntStream;
public final class HexDump {
public static void main(String[] args) throws IOException {
byte[] bytes = Files.readAllBytes(Path.of("ExampleUTF16LE.dat"));
System.out.println("Hex dump of the entire file:");
System.out.println( new Converter(bytes, 0, bytes.length, DumpType.HEX).toConvertedString() );
System.out.println();
System.out.println("xxd dump of the entire file:");
System.out.println( new Converter(bytes, 0, bytes.length, DumpType.XXD).toConvertedString() );
System.out.println();
System.out.println("Hex dump of the file from byte 20 to byte 94:");
System.out.println( new Converter(bytes, 20, 75, DumpType.HEX).toConvertedString() );
System.out.println();
System.out.println("xxd dump of the file from byte 38 to byte 58:");
System.out.println( new Converter(bytes, 38, 21, DumpType.XXD).toConvertedString() );
}
private static final class Converter {
public Converter(byte[] aBytes, int aStartIndex, int aLength, DumpType aDumpType) {
startIndex = Math.min(aBytes.length, Math.max(0, aStartIndex));
length = ( aLength < 1 || aLength > aBytes.length - startIndex ) ? aBytes.length - startIndex : aLength;
dumpType = aDumpType;
bytes = IntStream.range(startIndex, startIndex + length).mapToObj( i -> aBytes[i] ).toList();
}
public String toConvertedString() {
return IntStream.iterate(0, i -> i * dumpType.factor < bytes.size(), i -> i + 1)
.mapToObj( i -> byteList(i * dumpType.factor, dumpType.factor) )
.map( list -> toConvertedRow(list) )
.collect(Collectors.joining())
+ toHex(counterFinish);
}
private List<Byte> byteList(int currentIndex, int currentLength) {
counterStart = currentIndex;
counterFinish = Math.min(currentIndex + currentLength, bytes.size());
return bytes.subList(currentIndex, counterFinish);
}
private String toConvertedRow(List<Byte> row) {
String line = row.stream().map( b -> toDigit(b) ).collect(Collectors.joining());
line = padding(insertSpace(line));
return toHex(counterStart) + line + "|" +
row.stream().map( b -> printableCharacter(b) ).collect(Collectors.joining()) + "|" + "\n";
}
private String insertSpace(String line) {
return Pattern.compile(".{1," + dumpType.blockLength + "}")
.matcher(line).results().map(MatchResult::group).collect(Collectors.joining(" "));
}
private String toDigit(int number) {
return switch ( dumpType ) {
case HEX -> String.format("%02x ", number & 0xff);
case XXD -> Integer.toBinaryString( ( 1 << 8 | ( number & 0xff ) ) ).substring(1);
};
}
private String printableCharacter(int number) {
return ( number >= 32 && number < 127 ) ? String.valueOf((char) number) : ".";
}
private String padding(String line) {
return String.format("%1$-" + dumpType.lineLength + "s", line);
}
private String toHex(int number) {
return String.format("%08x ", number);
}
private int counterStart, counterFinish;
private final int startIndex, length;
private final List<Byte> bytes;
private final DumpType dumpType;
}
private static enum DumpType {
HEX(16, 24, 50), XXD(6, 8, 55);
private DumpType(int aFactor, int aBlockLength, int aLineLength) {
factor = aFactor;
blockLength = aBlockLength;
lineLength = aLineLength;
}
private final int factor, blockLength, lineLength;
}
}
- Output:
Hex dump of the entire file: 00000000 ff fe 52 00 6f 00 73 00 65 00 74 00 74 00 61 00 |..R.o.s.e.t.t.a.| 00000010 20 00 43 00 6f 00 64 00 65 00 20 00 69 00 73 00 | .C.o.d.e. .i.s.| 00000020 20 00 61 00 20 00 70 00 72 00 6f 00 67 00 72 00 | .a. .p.r.o.g.r.| 00000030 61 00 6d 00 6d 00 69 00 6e 00 67 00 20 00 63 00 |a.m.m.i.n.g. .c.| 00000040 68 00 72 00 65 00 73 00 74 00 6f 00 6d 00 61 00 |h.r.e.s.t.o.m.a.| 00000050 74 00 68 00 79 00 20 00 73 00 69 00 74 00 65 00 |t.h.y. .s.i.t.e.| 00000060 20 00 3d d8 00 de 2e 00 | .=.....| 00000068 xxd dump of the entire file: 00000000 11111111 11111110 01010010 00000000 01101111 00000000 |..R.o.| 00000006 01110011 00000000 01100101 00000000 01110100 00000000 |s.e.t.| 0000000c 01110100 00000000 01100001 00000000 00100000 00000000 |t.a. .| 00000012 01000011 00000000 01101111 00000000 01100100 00000000 |C.o.d.| 00000018 01100101 00000000 00100000 00000000 01101001 00000000 |e. .i.| 0000001e 01110011 00000000 00100000 00000000 01100001 00000000 |s. .a.| 00000024 00100000 00000000 01110000 00000000 01110010 00000000 | .p.r.| 0000002a 01101111 00000000 01100111 00000000 01110010 00000000 |o.g.r.| 00000030 01100001 00000000 01101101 00000000 01101101 00000000 |a.m.m.| 00000036 01101001 00000000 01101110 00000000 01100111 00000000 |i.n.g.| 0000003c 00100000 00000000 01100011 00000000 01101000 00000000 | .c.h.| 00000042 01110010 00000000 01100101 00000000 01110011 00000000 |r.e.s.| 00000048 01110100 00000000 01101111 00000000 01101101 00000000 |t.o.m.| 0000004e 01100001 00000000 01110100 00000000 01101000 00000000 |a.t.h.| 00000054 01111001 00000000 00100000 00000000 01110011 00000000 |y. .s.| 0000005a 01101001 00000000 01110100 00000000 01100101 00000000 |i.t.e.| 00000060 00100000 00000000 00111101 11011000 00000000 11011110 | .=...| 00000066 00101110 00000000 |..| 00000068 Hex dump of the file from byte 20 to byte 94: 00000000 6f 00 64 00 65 00 20 00 69 00 73 00 20 00 61 00 |o.d.e. .i.s. .a.| 00000010 20 00 70 00 72 00 6f 00 67 00 72 00 61 00 6d 00 | .p.r.o.g.r.a.m.| 00000020 6d 00 69 00 6e 00 67 00 20 00 63 00 68 00 72 00 |m.i.n.g. .c.h.r.| 00000030 65 00 73 00 74 00 6f 00 6d 00 61 00 74 00 68 00 |e.s.t.o.m.a.t.h.| 00000040 79 00 20 00 73 00 69 00 74 00 65 |y. .s.i.t.e| 0000004b xxd dump of the file from byte 38 to byte 58: 00000000 01110000 00000000 01110010 00000000 01101111 00000000 |p.r.o.| 00000006 01100111 00000000 01110010 00000000 01100001 00000000 |g.r.a.| 0000000c 01101101 00000000 01101101 00000000 01101001 00000000 |m.m.i.| 00000012 01101110 00000000 01100111 |n.g| 00000015
JavaScript
// Generate UTF-16 LE bytes from a string.
function* utf16leBytes(str) {
// Little endian byte order mark.
yield 0xff;
yield 0xfe;
// Iterate code units.
let code_unit;
for (let i = 0; i < str.length; i++) {
code_unit = str.charCodeAt(i);
yield code_unit & 0xff;
yield code_unit >>> 8;
}
}
/**
* Generate sequences of length {@link n} from items in iterable {@link it}.
*/
function* groupBy(it, n) {
let chunk = [];
for (const item of it) {
chunk.push(item);
if (chunk.length == n) {
yield chunk;
chunk = [];
}
}
if (chunk.length) {
yield chunk;
}
}
/**
* @callback Formatter
* @param {Array<number>} chunk
* @returns {string} {@link chunk} formatted for output on one line.
*/
function canonicalFormatter(chunk) {
const bytesAsHex = chunk.map((byte) => byte.toString(16).padStart(2, "0"));
const hex = `${bytesAsHex.slice(0, 8).join(" ")} ${bytesAsHex
.slice(8)
.join(" ")}`.padEnd(48, " ");
const ascii = chunk
.map((byte) => (byte > 31 && byte < 127 ? String.fromCharCode(byte) : "."))
.join("");
return `${hex} |${ascii}|`;
}
/**
* @callback Formatter
* @param {Array<number>} chunk
* @returns {string} {@link chunk} formatted for output on one line.
*/
function binaryFormatter(chunk) {
const bits = chunk
.map((byte) => byte.toString(2).padStart(8, "0"))
.join(" ")
.padEnd(53, " ");
const ascii = chunk
.map((byte) => (byte > 31 && byte < 127 ? String.fromCharCode(byte) : "."))
.join("");
return `${bits} |${ascii}|`;
}
/**
* Generate a textual representation of bytes in {@link data} one line at a time.
*
* @param {Iterable<number>} data
* @param {number} skip
* @param {number} length
* @param {Formatter} formatter
* @param {number} chunkSize
*/
function* hexDumpLines(
data,
skip = 0,
length = Infinity,
formatter = canonicalFormatter,
chunkSize = 16
) {
const it = data[Symbol.iterator]();
for (let i = 0; i < skip; i++) {
it.next();
}
let offset = skip;
let byteCount = 0;
let line = "";
for (let chunk of groupBy(data, chunkSize)) {
// Discard excess bytes if we've overshot length.
if (byteCount + chunk.length > length) {
chunk = chunk.slice(0, length - byteCount);
}
line = formatter(chunk);
yield `${offset.toString(16).padStart(8, "0")} ${line}`;
offset += chunkSize;
byteCount += chunk.length;
if (byteCount >= length) {
break;
}
}
// Final byte count
yield (byteCount + skip).toString(16).padStart(8, "0");
}
/**
* Log a hex dump of {@link data} to the console.
*
* @param {Iterable<number>} data
* @param {number} skip
* @param {number} length
* @param {Formatter} formatter
* @param {number} chunkSize
*/
function consoleHexDump(
data,
skip = 0,
length = Infinity,
formatter = canonicalFormatter,
chunkSize = 16
) {
for (const line of hexDumpLines(data, skip, length, formatter, chunkSize)) {
console.log(line);
}
}
const exampleData = "Rosetta Code is a programming chrestomathy site 😀.";
consoleHexDump(utf16leBytes(exampleData));
console.log("");
consoleHexDump(utf16leBytes(exampleData), 20, 25);
console.log("");
consoleHexDump(utf16leBytes(exampleData), 0, Infinity, binaryFormatter, 6);
- Output:
00000000 ff fe 52 00 6f 00 73 00 65 00 74 00 74 00 61 00 |..R.o.s.e.t.t.a.| 00000010 20 00 43 00 6f 00 64 00 65 00 20 00 69 00 73 00 | .C.o.d.e. .i.s.| 00000020 20 00 61 00 20 00 70 00 72 00 6f 00 67 00 72 00 | .a. .p.r.o.g.r.| 00000030 61 00 6d 00 6d 00 69 00 6e 00 67 00 20 00 63 00 |a.m.m.i.n.g. .c.| 00000040 68 00 72 00 65 00 73 00 74 00 6f 00 6d 00 61 00 |h.r.e.s.t.o.m.a.| 00000050 74 00 68 00 79 00 20 00 73 00 69 00 74 00 65 00 |t.h.y. .s.i.t.e.| 00000060 20 00 3d d8 00 de 2e 00 | .=.....| 00000068 00000014 6f 00 64 00 65 00 20 00 69 00 73 00 20 00 61 00 |o.d.e. .i.s. .a.| 00000024 20 00 70 00 72 00 6f 00 67 | .p.r.o.g| 0000002d 00000000 11111111 11111110 01010010 00000000 01101111 00000000 |..R.o.| 00000006 01110011 00000000 01100101 00000000 01110100 00000000 |s.e.t.| 0000000c 01110100 00000000 01100001 00000000 00100000 00000000 |t.a. .| 00000012 01000011 00000000 01101111 00000000 01100100 00000000 |C.o.d.| 00000018 01100101 00000000 00100000 00000000 01101001 00000000 |e. .i.| 0000001e 01110011 00000000 00100000 00000000 01100001 00000000 |s. .a.| 00000024 00100000 00000000 01110000 00000000 01110010 00000000 | .p.r.| 0000002a 01101111 00000000 01100111 00000000 01110010 00000000 |o.g.r.| 00000030 01100001 00000000 01101101 00000000 01101101 00000000 |a.m.m.| 00000036 01101001 00000000 01101110 00000000 01100111 00000000 |i.n.g.| 0000003c 00100000 00000000 01100011 00000000 01101000 00000000 | .c.h.| 00000042 01110010 00000000 01100101 00000000 01110011 00000000 |r.e.s.| 00000048 01110100 00000000 01101111 00000000 01101101 00000000 |t.o.m.| 0000004e 01100001 00000000 01110100 00000000 01101000 00000000 |a.t.h.| 00000054 01111001 00000000 00100000 00000000 01110011 00000000 |y. .s.| 0000005a 01101001 00000000 01110100 00000000 01100101 00000000 |i.t.e.| 00000060 00100000 00000000 00111101 11011000 00000000 11011110 | .=...| 00000066 00101110 00000000 |..| 00000068
Julia
function baseddump(io::IO, data::Vector{UInt8}; base = 16, offset = 0, len = -1, displayadjust = 0)
@assert 2 <= base <= 16 "display base $base not supported"
datastop = len < 0 ? length(data) : min(offset + len, length(data))
bytes = data[begin+offset:datastop]
fullchunksize = base == 16 ? 16 : base > 8 ? 10 : base > 4 ? 8 : 6
padsize = base == 16 ? 2 : base == 2 ? 8 : base > 7 ? 3 : base > 3 ? 4 : 5
midpad = " "^(base != 2)
vl = (padsize + 1) * fullchunksize + length(midpad)
halflen, pos = fullchunksize ÷ 2, offset + displayadjust
for chunk in Iterators.partition(bytes, fullchunksize)
chunklen = length(chunk)
values = map(n -> string(n, base = base, pad = padsize) * " ", chunk)
s1 = join(values[begin:begin+min(halflen, chunklen)-1])
if chunklen > halflen
s1 *= midpad * join(values[begin+halflen:end])
end
s2 = prod(map(n -> n < 128 && isprint(Char(n)) ? Char(n) : '.', chunk))
println(io, string(pos, base = 16, pad = 8) * " " * rpad(s1, vl) * "|" * s2 * "|")
pos += chunklen
end
println(io, string(pos - offset - displayadjust, base = 16, pad = 8))
end
function baseddump(data; base = 16, offset = 0, len = -1)
return baseddump(vec(collect(reinterpret(UInt8, data))); base, offset, len)
end
function baseddump(filename::AbstractString; base = 16, offset = 0, len = -1)
fromio = open(filename)
flen = stat(fromio).size
len = len < 0 ? flen - offset : min(len, flen - offset)
offset != 0 && seek(fromio, offset)
data::Vector{UInt8} = read(fromio, len)
baseddump(data; base = base, offset = 0, displayadjust = offset)
close(fromio)
end
hexdump(data; offset = 0, len = -1) = baseddump(data; offset, len)
xxd(data; offset = 0, len = -1) = baseddump(data; base = 2, offset, len)
decdump(data; offset = 0, len = -1) = baseddump(data; base = 10, offset, len)
const tstr = b"Rosetta Code is a programming chrestomathy site 😀."
const utf16 = vcat(b"\xff\xfe", reinterpret(UInt8, transcode(UInt16, tstr)))
print("hexdump of utf-16 string "), display(String(tstr))
hexdump(utf16)
print("\nxxd of utf-16 string "), display(String(tstr))
xxd(utf16)
print("\ndecdump of utf-16 string "), display(String(tstr))
decdump(utf16)
println("\nbaseddump of utf-16 string bytes 16-56 from file:")
fname = tempname()
open(fname, "w") do fd; write(fd, utf16) end
baseddump(fname, offset = 16, len = 40)
- Output:
hexdump of utf-16 string "Rosetta Code is a programming chrestomathy site 😀." 00000000 ff fe 52 00 6f 00 73 00 65 00 74 00 74 00 61 00 |..R.o.s.e.t.t.a.| 00000010 20 00 43 00 6f 00 64 00 65 00 20 00 69 00 73 00 | .C.o.d.e. .i.s.| 00000020 20 00 61 00 20 00 70 00 72 00 6f 00 67 00 72 00 | .a. .p.r.o.g.r.| 00000030 61 00 6d 00 6d 00 69 00 6e 00 67 00 20 00 63 00 |a.m.m.i.n.g. .c.| 00000040 68 00 72 00 65 00 73 00 74 00 6f 00 6d 00 61 00 |h.r.e.s.t.o.m.a.| 00000050 74 00 68 00 79 00 20 00 73 00 69 00 74 00 65 00 |t.h.y. .s.i.t.e.| 00000060 20 00 3d d8 00 de 2e 00 | .=.....| 00000068 xxd of utf-16 string "Rosetta Code is a programming chrestomathy site 😀." 00000000 11111111 11111110 01010010 00000000 01101111 00000000 |..R.o.| 00000006 01110011 00000000 01100101 00000000 01110100 00000000 |s.e.t.| 0000000c 01110100 00000000 01100001 00000000 00100000 00000000 |t.a. .| 00000012 01000011 00000000 01101111 00000000 01100100 00000000 |C.o.d.| 00000018 01100101 00000000 00100000 00000000 01101001 00000000 |e. .i.| 0000001e 01110011 00000000 00100000 00000000 01100001 00000000 |s. .a.| 00000024 00100000 00000000 01110000 00000000 01110010 00000000 | .p.r.| 0000002a 01101111 00000000 01100111 00000000 01110010 00000000 |o.g.r.| 00000030 01100001 00000000 01101101 00000000 01101101 00000000 |a.m.m.| 00000036 01101001 00000000 01101110 00000000 01100111 00000000 |i.n.g.| 0000003c 00100000 00000000 01100011 00000000 01101000 00000000 | .c.h.| 00000042 01110010 00000000 01100101 00000000 01110011 00000000 |r.e.s.| 00000048 01110100 00000000 01101111 00000000 01101101 00000000 |t.o.m.| 0000004e 01100001 00000000 01110100 00000000 01101000 00000000 |a.t.h.| 00000054 01111001 00000000 00100000 00000000 01110011 00000000 |y. .s.| 0000005a 01101001 00000000 01110100 00000000 01100101 00000000 |i.t.e.| 00000060 00100000 00000000 00111101 11011000 00000000 11011110 | .=...| 00000066 00101110 00000000 |..| 00000068 decdump of utf-16 string "Rosetta Code is a programming chrestomathy site 😀." 00000000 255 254 082 000 111 000 115 000 101 000 |..R.o.s.e.| 0000000a 116 000 116 000 097 000 032 000 067 000 |t.t.a. .C.| 00000014 111 000 100 000 101 000 032 000 105 000 |o.d.e. .i.| 0000001e 115 000 032 000 097 000 032 000 112 000 |s. .a. .p.| 00000028 114 000 111 000 103 000 114 000 097 000 |r.o.g.r.a.| 00000032 109 000 109 000 105 000 110 000 103 000 |m.m.i.n.g.| 0000003c 032 000 099 000 104 000 114 000 101 000 | .c.h.r.e.| 00000046 115 000 116 000 111 000 109 000 097 000 |s.t.o.m.a.| 00000050 116 000 104 000 121 000 032 000 115 000 |t.h.y. .s.| 0000005a 105 000 116 000 101 000 032 000 061 216 |i.t.e. .=.| 00000064 000 222 046 000 |....| 00000068 baseddump of utf-16 string bytes 16-56 from file: 00000010 20 00 43 00 6f 00 64 00 65 00 20 00 69 00 73 00 | .C.o.d.e. .i.s.| 00000020 20 00 61 00 20 00 70 00 72 00 6f 00 67 00 72 00 | .a. .p.r.o.g.r.| 00000030 61 00 6d 00 6d 00 69 00 |a.m.m.i.| 00000028
Phix
with javascript_semantics
sequence utf16 = #FEFF & "Rosetta Code is a programming chrestomathy site " & {#d83d,#DE00,'.'}
function to2(integer i) return {and_bits(i,#FF),floor(i/#100)} end function
constant string s = flatten(apply(utf16,to2),"")
--or: (javascript incompatible)
--constant string s = get_text(filename) -- (if you have a suitable premade one to hand)
procedure hexdump(string s, integer start=0, finish=-1, bool bHex=true, bFinalSize=true)
s = s[start+1..finish]
integer ll = iff(bHex?16:6), ls = length(s)
string hbfmt = iff(bHex?"%02x ":"%08b "),
lnfmt = "%08x %s |%-" & sprintf("%d",ll) & "s|\n"
sequence lines = split_by(s,ll)
for l in lines do
string hb = " ", ascii = ""
for i,b in l do
hb &= sprintf(hbfmt,b)
if b<' ' or b>'~' then b = '.' end if
ascii &= b
if i=8 then hb &= ' ' end if
end for
hb = pad_tail(hb,iff(bHex?50:55))
printf(1,lnfmt,{start,hb,ascii})
start += length(l)
end for
if bFinalSize then
printf(1,"%08x\n",{ls})
end if
end procedure
printf(1,"Hexadecimal:\n")
hexdump(s)
printf(1,"\nBinary:\n")
hexdump(s,bHex:=false)
Although not shown, the intention is the outer calling code (last four lines) could call hexdump() to display one page at a time, with appropriate user input, and/or read s in chunks and pass a file offset instead of or as well as start, finish.
- Output:
Hexadecimal: 00000000 FF FE 52 00 6F 00 73 00 65 00 74 00 74 00 61 00 |..R.o.s.e.t.t.a.| 00000010 20 00 43 00 6F 00 64 00 65 00 20 00 69 00 73 00 | .C.o.d.e. .i.s.| 00000020 20 00 61 00 20 00 70 00 72 00 6F 00 67 00 72 00 | .a. .p.r.o.g.r.| 00000030 61 00 6D 00 6D 00 69 00 6E 00 67 00 20 00 63 00 |a.m.m.i.n.g. .c.| 00000040 68 00 72 00 65 00 73 00 74 00 6F 00 6D 00 61 00 |h.r.e.s.t.o.m.a.| 00000050 74 00 68 00 79 00 20 00 73 00 69 00 74 00 65 00 |t.h.y. .s.i.t.e.| 00000060 20 00 3D D8 00 DE 2E 00 | .=..... | 00000068 Binary: 00000000 11111111 11111110 01010010 00000000 01101111 00000000 |..R.o.| 00000006 01110011 00000000 01100101 00000000 01110100 00000000 |s.e.t.| 0000000C 01110100 00000000 01100001 00000000 00100000 00000000 |t.a. .| 00000012 01000011 00000000 01101111 00000000 01100100 00000000 |C.o.d.| 00000018 01100101 00000000 00100000 00000000 01101001 00000000 |e. .i.| 0000001E 01110011 00000000 00100000 00000000 01100001 00000000 |s. .a.| 00000024 00100000 00000000 01110000 00000000 01110010 00000000 | .p.r.| 0000002A 01101111 00000000 01100111 00000000 01110010 00000000 |o.g.r.| 00000030 01100001 00000000 01101101 00000000 01101101 00000000 |a.m.m.| 00000036 01101001 00000000 01101110 00000000 01100111 00000000 |i.n.g.| 0000003C 00100000 00000000 01100011 00000000 01101000 00000000 | .c.h.| 00000042 01110010 00000000 01100101 00000000 01110011 00000000 |r.e.s.| 00000048 01110100 00000000 01101111 00000000 01101101 00000000 |t.o.m.| 0000004E 01100001 00000000 01110100 00000000 01101000 00000000 |a.t.h.| 00000054 01111001 00000000 00100000 00000000 01110011 00000000 |y. .s.| 0000005A 01101001 00000000 01110100 00000000 01100101 00000000 |i.t.e.| 00000060 00100000 00000000 00111101 11011000 00000000 11011110 | .=...| 00000066 00101110 00000000 |.. | 00000068
PHP
<?php
// Output the contents of a file (or part of a file) in either hexadecimal or binary
function dump($filename, $mode, $offset=0, $length=null) {
$data = file_get_contents($filename, false, null, $offset, $length);
$c = '';
$h = '';
$a = $offset;
$output = '<pre>';
if ($mode == 'h') {
$linesize = 16;
for ($i = 0; $i < strlen($data); $i++) {
$x = substr($data, $i, 1);
$h .= bin2hex($x) . ' ';
if ($i % 8 == 7) {
$h .= ' ';
}
if (ord($x) >= 32 && ord($x) <= 126) {
$c .= $x;
}
else {
$c .= '.';
}
if ($i % $linesize == 15 || $i == strlen($data) - 1) {
$o = str_pad(dechex($a), 8, '0', STR_PAD_LEFT) . ' ';
$a += $linesize;
$h = $o . str_pad($h, 50, ' ', STR_PAD_RIGHT) . '|' . $c . '|';
$output .= $h . '<br>';
$c = '';
$h = '';
}
}
}
elseif ($mode == 'b') {
$linesize = 6;
for ($i = 0; $i < strlen($data); $i++) {
$x = substr($data, $i, 1);
$h .= str_pad(decbin(ord($x)), 8, '0', STR_PAD_LEFT) . ' ';
if (ord($x) >= 32 && ord($x) <= 126) {
$c .= $x;
}
else {
$c .= '.';
}
if ($i % $linesize == 5 || $i == strlen($data) - 1) {
$o = str_pad(dechex($a), 8, '0', STR_PAD_LEFT) . ' ';
$a += $linesize;
$h = $o . str_pad($h, 54, ' ', STR_PAD_RIGHT) . '|' . $c . '|';
$output .= $h . '<br>';
$c = '';
$h = '';
}
}
}
// final byte count
$output .=str_pad(dechex(strlen($data)), 8, '0', STR_PAD_LEFT) . ' ';
$output .= '</pre>';
return $output;
}
$x = dump("file1.txt", "h");
echo '<p>Hexadecimal dump of file' . $x . '</p>';
$x = dump("file1.txt", "h", 10, 20);
echo '<p>Hexadecimal dump of 20 bytes of file from offset 10' . $x . '</p>';
$x = dump("file1.txt", "b");
echo '<p>Binary dump of file1' . $x . '</p>';
?>
- Output:
Hexadecimal dump of file
00000000 ff fe 52 00 6f 00 73 00 65 00 74 00 74 00 61 00 |..R.o.s.e.t.t.a.| 00000010 20 00 43 00 6f 00 64 00 65 00 20 00 69 00 73 00 | .C.o.d.e. .i.s.| 00000020 20 00 61 00 20 00 70 00 72 00 6f 00 67 00 72 00 | .a. .p.r.o.g.r.| 00000030 61 00 6d 00 6d 00 69 00 6e 00 67 00 20 00 63 00 |a.m.m.i.n.g. .c.| 00000040 68 00 72 00 65 00 73 00 74 00 6f 00 6d 00 61 00 |h.r.e.s.t.o.m.a.| 00000050 74 00 68 00 79 00 20 00 73 00 69 00 74 00 65 00 |t.h.y. .s.i.t.e.| 00000060 20 00 3d d8 00 de 2e 00 | .=.....| 00000068
Hexadecimal dump of file from offset 10 for length of 20
0000000a 74 00 74 00 61 00 20 00 43 00 6f 00 64 00 65 00 |t.t.a. .C.o.d.e.| 0000001a 20 00 69 00 | .i.| 00000014
Binary dump of file
00000000 11111111 11111110 01010010 00000000 01101111 00000000 |..R.o.| 00000006 01110011 00000000 01100101 00000000 01110100 00000000 |s.e.t.| 0000000c 01110100 00000000 01100001 00000000 00100000 00000000 |t.a. .| 00000012 01000011 00000000 01101111 00000000 01100100 00000000 |C.o.d.| 00000018 01100101 00000000 00100000 00000000 01101001 00000000 |e. .i.| 0000001e 01110011 00000000 00100000 00000000 01100001 00000000 |s. .a.| 00000024 00100000 00000000 01110000 00000000 01110010 00000000 | .p.r.| 0000002a 01101111 00000000 01100111 00000000 01110010 00000000 |o.g.r.| 00000030 01100001 00000000 01101101 00000000 01101101 00000000 |a.m.m.| 00000036 01101001 00000000 01101110 00000000 01100111 00000000 |i.n.g.| 0000003c 00100000 00000000 01100011 00000000 01101000 00000000 | .c.h.| 00000042 01110010 00000000 01100101 00000000 01110011 00000000 |r.e.s.| 00000048 01110100 00000000 01101111 00000000 01101101 00000000 |t.o.m.| 0000004e 01100001 00000000 01110100 00000000 01101000 00000000 |a.t.h.| 00000054 01111001 00000000 00100000 00000000 01110011 00000000 |y. .s.| 0000005a 01101001 00000000 01110100 00000000 01100101 00000000 |i.t.e.| 00000060 00100000 00000000 00111101 11011000 00000000 11011110 | .=...| 00000066 00101110 00000000 |..| 00000068
Python
"""Display bytes in a file like hexdump or xxd."""
import abc
import math
from io import BufferedIOBase
from io import SEEK_END
from itertools import islice
from typing import Iterable
from typing import Iterator
from typing import Sequence
from typing import Tuple
from typing import TypeVar
READ_SIZE = 2048
class Formatter(abc.ABC):
"""Base class for hex dump formatters."""
@abc.abstractmethod
def format(self, data: Sequence[int]) -> str:
"""Return _data_ formatted for output on one line."""
@property
@abc.abstractmethod
def bytes_per_line(self) -> int:
"""The number of bytes to display per line of output."""
class CanonicalFormatter(Formatter):
bytes_per_line = 16
def format(self, data: Sequence[int]) -> str:
assert len(data) <= 16
hex = f"{bytes(data[:8]).hex(' ')} {bytes(data[8:]).hex(' ')}".ljust(48)
ascii_ = "".join(chr(b) if b > 31 and b < 127 else "." for b in data)
return f"{hex} |{ascii_}|"
class BinaryFormatter(Formatter):
bytes_per_line = 6
def format(self, data: Sequence[int]) -> str:
assert len(data) <= 6
bits = " ".join(bin(b)[2:].rjust(8, "0") for b in data).ljust(53)
ascii_ = "".join(chr(b) if b > 31 and b < 127 else "." for b in data)
return f"{bits} |{ascii_}|"
canonicalFormatter = CanonicalFormatter()
binaryFormatter = BinaryFormatter()
T = TypeVar("T")
def group(it: Iterable[T], n: int) -> Iterator[Tuple[T, ...]]:
"""Split iterable _it_ in to groups of size _n_.
The last group might contain less than _n_ items.
"""
_it = iter(it)
while True:
g = tuple(islice(_it, n))
if not g:
break
yield g
def hex_dump(
f: BufferedIOBase,
*,
skip: int = 0,
length: int = math.inf, # type: ignore
formatter: Formatter = canonicalFormatter,
) -> Iterator[str]:
"""Generate a textual representation of bytes in _f_, one line at a time."""
f.seek(skip)
offset = skip
byte_count = 0
previous_line = ""
squeezing = False # True if the last output line was squeezed
assert length > 0
while byte_count < length:
# Read at most READ_SIZE bytes at a time.
data = f.read(READ_SIZE)
# Stop if we've run out of data.
if not data:
break
# Discard excess bytes if we've overshot length.
if byte_count + len(data) > length:
data = data[: length - byte_count]
# One line per chunk
for chunk in group(data, formatter.bytes_per_line):
line = formatter.format(chunk)
if previous_line == line:
if squeezing is False:
squeezing = True
yield "*"
else:
previous_line = line
squeezing = False
yield f"{offset:0>8x} {line}"
offset += formatter.bytes_per_line
byte_count += len(chunk)
# Final byte count
bytes_in_f = f.seek(0, SEEK_END)
yield f"{min(byte_count + skip, bytes_in_f):0>8x}"
if __name__ == "__main__":
import argparse
parser = argparse.ArgumentParser(
prog="hex_dump.py",
description="Display bytes in a file.",
)
parser.add_argument(
"file",
type=argparse.FileType(mode="rb"),
metavar="FILE",
help="target file to dump",
)
parser.add_argument(
"-b",
"--binary",
action="store_true",
help="display bytes in binary instead of hex",
)
parser.add_argument(
"-s",
"--skip",
type=int,
default=0,
help="skip SKIP bytes from the beginning",
)
parser.add_argument(
"-n",
"--length",
type=int,
default=math.inf,
help="read up to LENGTH bytes",
)
args = parser.parse_args()
formatter = binaryFormatter if args.binary else canonicalFormatter
for line in hex_dump(
args.file,
formatter=formatter,
skip=args.skip,
length=args.length,
):
print(line)
- Output:
$ python hex_dump.py example_utf16.txt
00000000 ff fe 52 00 6f 00 73 00 65 00 74 00 74 00 61 00 |..R.o.s.e.t.t.a.| 00000010 20 00 43 00 6f 00 64 00 65 00 20 00 69 00 73 00 | .C.o.d.e. .i.s.| 00000020 20 00 61 00 20 00 70 00 72 00 6f 00 67 00 72 00 | .a. .p.r.o.g.r.| 00000030 61 00 6d 00 6d 00 69 00 6e 00 67 00 20 00 63 00 |a.m.m.i.n.g. .c.| 00000040 68 00 72 00 65 00 73 00 74 00 6f 00 6d 00 61 00 |h.r.e.s.t.o.m.a.| 00000050 74 00 68 00 79 00 20 00 73 00 69 00 74 00 65 00 |t.h.y. .s.i.t.e.| 00000060 20 00 3d d8 00 de 2e 00 | .=.....| 00000068
$ python hex_dump.py example_utf16.txt -s 20 -n 25
00000014 6f 00 64 00 65 00 20 00 69 00 73 00 20 00 61 00 |o.d.e. .i.s. .a.| 00000024 20 00 70 00 72 00 6f 00 67 | .p.r.o.g| 0000002d
$ python hex_dump.py example_utf16.txt -b
00000000 11111111 11111110 01010010 00000000 01101111 00000000 |..R.o.| 00000006 01110011 00000000 01100101 00000000 01110100 00000000 |s.e.t.| 0000000c 01110100 00000000 01100001 00000000 00100000 00000000 |t.a. .| 00000012 01000011 00000000 01101111 00000000 01100100 00000000 |C.o.d.| 00000018 01100101 00000000 00100000 00000000 01101001 00000000 |e. .i.| 0000001e 01110011 00000000 00100000 00000000 01100001 00000000 |s. .a.| 00000024 00100000 00000000 01110000 00000000 01110010 00000000 | .p.r.| 0000002a 01101111 00000000 01100111 00000000 01110010 00000000 |o.g.r.| 00000030 01100001 00000000 01101101 00000000 01101101 00000000 |a.m.m.| 00000036 01101001 00000000 01101110 00000000 01100111 00000000 |i.n.g.| 0000003c 00100000 00000000 01100011 00000000 01101000 00000000 | .c.h.| 00000042 01110010 00000000 01100101 00000000 01110011 00000000 |r.e.s.| 00000048 01110100 00000000 01101111 00000000 01101101 00000000 |t.o.m.| 0000004e 01100001 00000000 01110100 00000000 01101000 00000000 |a.t.h.| 00000054 01111001 00000000 00100000 00000000 01110011 00000000 |y. .s.| 0000005a 01101001 00000000 01110100 00000000 01100101 00000000 |i.t.e.| 00000060 00100000 00000000 00111101 11011000 00000000 11011110 | .=...| 00000066 00101110 00000000 |..| 00000068
Raku
The hexdump() routine expects a Blob. How you feed it the Blob is up to you. You may read a file in binary mode, encode a string, whatever. Using encoded strings here for a compact, self-contained example. Encoded in a few different ways for variety.
say my $string = 'Rosettacode is a programming crestomathy site 😀. 🍨 👨👩👦 ⚽ ¯\_(ツ)_/¯';
say "\nHex dump UTF-16BE, offset 0";
hexdump $string.encode("UTF-16BE");
say "\nHex dump UTF-16LE, offset 0";
hexdump $string.encode("UTF-16LE");
say "\nBinary dump UTF-8, offset 17";
hexdump $string.encode("UTF-8"), :bin, :17offset;
sub hexdump(Blob $blob, Int :$offset is copy = 0, :$bin = False) {
my ($fmt, $space, $batch) = $bin ?? ("%08b", ' ' x 8, 6) !! ("%02X", ' ', 16);
for $blob.skip($offset).batch($batch) {
my @h = flat $_».fmt($fmt), $space xx $batch;
@h[7] ~= ' ';
printf "%08X %s |%s|\n", $offset, @h[^$batch].Str,
$_».chr.join.subst(/<-print>|\t|\n/, '.', :g);
$offset += $batch;
}
}
- Output:
Rosettacode is a programming crestomathy site 😀. 🍨 👨👩👦 ⚽ ¯\_(ツ)_/¯ Hex dump UTF-16BE, offset 0 00000000 00 52 00 6F 00 73 00 65 00 74 00 74 00 61 00 63 |.R.o.s.e.t.t.a.c| 00000010 00 6F 00 64 00 65 00 20 00 69 00 73 00 20 00 61 |.o.d.e. .i.s. .a| 00000020 00 20 00 70 00 72 00 6F 00 67 00 72 00 61 00 6D |. .p.r.o.g.r.a.m| 00000030 00 6D 00 69 00 6E 00 67 00 20 00 63 00 72 00 65 |.m.i.n.g. .c.r.e| 00000040 00 73 00 74 00 6F 00 6D 00 61 00 74 00 68 00 79 |.s.t.o.m.a.t.h.y| 00000050 00 20 00 73 00 69 00 74 00 65 00 20 D8 3D DE 00 |. .s.i.t.e. Ø=Þ.| 00000060 00 2E 00 20 00 20 00 20 00 20 D8 3C DF 68 00 20 |... . . . Ø<ßh. | 00000070 D8 3D DC 68 20 0D D8 3D DC 69 20 0D D8 3D DC 66 |Ø=Üh .Ø=Üi .Ø=Üf| 00000080 00 20 26 BD 00 20 00 AF 00 5C 00 5F 00 28 30 C4 |. &½. .¯.\._.(0Ä| 00000090 00 29 00 5F 00 2F 00 AF |.)._./.¯| Hex dump UTF-16LE, offset 0 00000000 52 00 6F 00 73 00 65 00 74 00 74 00 61 00 63 00 |R.o.s.e.t.t.a.c.| 00000010 6F 00 64 00 65 00 20 00 69 00 73 00 20 00 61 00 |o.d.e. .i.s. .a.| 00000020 20 00 70 00 72 00 6F 00 67 00 72 00 61 00 6D 00 | .p.r.o.g.r.a.m.| 00000030 6D 00 69 00 6E 00 67 00 20 00 63 00 72 00 65 00 |m.i.n.g. .c.r.e.| 00000040 73 00 74 00 6F 00 6D 00 61 00 74 00 68 00 79 00 |s.t.o.m.a.t.h.y.| 00000050 20 00 73 00 69 00 74 00 65 00 20 00 3D D8 00 DE | .s.i.t.e. .=Ø.Þ| 00000060 2E 00 20 00 20 00 20 00 20 00 3C D8 68 DF 20 00 |.. . . . .<Øhß .| 00000070 3D D8 68 DC 0D 20 3D D8 69 DC 0D 20 3D D8 66 DC |=ØhÜ. =ØiÜ. =ØfÜ| 00000080 20 00 BD 26 20 00 AF 00 5C 00 5F 00 28 00 C4 30 | .½& .¯.\._.(.Ä0| 00000090 29 00 5F 00 2F 00 AF 00 |)._./.¯.| Binary dump UTF-8, offset 17 00000011 01110000 01110010 01101111 01100111 01110010 01100001 |progra| 00000017 01101101 01101101 01101001 01101110 01100111 00100000 |mming | 0000001D 01100011 01110010 01100101 01110011 01110100 01101111 |cresto| 00000023 01101101 01100001 01110100 01101000 01111001 00100000 |mathy | 00000029 01110011 01101001 01110100 01100101 00100000 11110000 |site ð| 0000002F 10011111 10011000 10000000 00101110 00100000 00100000 |.... | 00000035 00100000 00100000 11110000 10011111 10001101 10101000 | ð..¨| 0000003B 00100000 11110000 10011111 10010001 10101000 11100010 | ð..¨â| 00000041 10000000 10001101 11110000 10011111 10010001 10101001 |..ð..©| 00000047 11100010 10000000 10001101 11110000 10011111 10010001 |â..ð..| 0000004D 10100110 00100000 11100010 10011010 10111101 00100000 |¦ â.½ | 00000053 11000010 10101111 01011100 01011111 00101000 11100011 |¯\_(ã| 00000059 10000011 10000100 00101001 01011111 00101111 11000010 |..)_/Â| 0000005F 10101111 |¯|
Rust
use is_printable::IsPrintable;
use std::env;
use std::fs::File;
use std::io::{Read, Seek, SeekFrom::Start};
use std::process::ExitCode;
const BYTES_HEX: usize = 16;
const BYTES_BIN: usize = 6;
fn print_hex(data: &[u8], count: usize) {
for i in 0..count {
if i % 8 == 0 {
print!(" ");
}
print!(" {:02x}", data[i]);
}
for i in count..BYTES_HEX {
if i % 8 == 0 {
print!(" ");
}
print!(" ");
}
}
fn print_binary(data: &[u8], count: usize) {
print!(" ");
for i in 0..count {
let c = data[i];
print!(" ");
for j in (1..8).rev() {
let m = 1 << j;
print!("{}", if c & m != 0 { "1" } else { "0" });
}
}
for _i in count..BYTES_BIN {
print!(" ");
}
}
fn print_chars(data: &[u8], count: usize) {
for i in 0..count {
print!(
"{}",
if data[i] < 129 && (data[i] as char).to_string().is_printable() {
data[i] as char
} else {
'.'
}
);
}
}
fn usage(program: &str) {
eprintln!("usage: {} [-b] [-s skip] [-n length] filename", program);
}
fn usage_err(err: &str, arg: &str, program: &str) -> ExitCode {
if err != "" && arg != "" {
eprintln!("{} {}.", err, arg);
usage(program);
}
return ExitCode::FAILURE;
}
fn main() -> ExitCode {
let mut offset = 0_usize;
let mut max_length = std::u32::MAX as usize;
let mut binary = false;
let mut source: String = ": No file name provided".to_owned();
let args: Vec<String> = env::args().collect();
for (i, arg) in args.clone().into_iter().enumerate() {
if i == 0 {
continue;
}
if i == args.len() - 1 || arg[0..=0] != *"-" {
source = arg.to_owned();
break;
}
match arg.as_bytes()[1] as char {
's' => {
if i == args.len() - 1 {
return usage_err("", "", &args[0]);
}
offset = match usize::from_str_radix(&arg[2..], 10) {
Ok(k) => k,
_ => return usage_err("Invalid skip ", &arg, &args[0]),
};
}
'n' => {
if i == args.len() - 1 {
return usage_err("", "", &args[0]);
}
max_length = match usize::from_str_radix(&arg[2..], 10) {
Ok(k) => k,
_ => return usage_err("Invalid length ", &arg, &args[0]),
};
}
'b' => {
binary = true;
}
_ => return usage_err("", "", &args[0]),
}
}
let mut buf = [0_u8; BYTES_HEX];
let data = if binary {
&mut buf[0..BYTES_BIN]
} else {
&mut buf[..]
};
let mut file = match File::open(&source) {
Ok(f) => f,
_ => return usage_err("Cannot open to read", &source, &args[0]),
};
if offset > 0 {
if offset > file.metadata().unwrap().len() as usize {
offset = file.metadata().unwrap().len() as usize;
}
let _ = file.seek(Start(offset as u64));
}
let mut length = 0_usize;
while length < max_length {
let mut count = match file.read(data) {
Ok(num_read) => num_read,
_ => 0,
};
if count > max_length - length {
count = max_length - length;
}
if count == 0 {
println!();
break;
}
if binary {
print_binary(data, count);
} else {
print_hex(data, count);
}
print!(" |");
print_chars(data, count);
println!("|");
offset += count;
length += count;
}
return ExitCode::SUCCESS;
}
- Output:
ff fe 52 00 6f 00 73 00 65 00 74 00 74 00 61 00 |..R.o.s.e.t.t.a.| 20 00 43 00 6f 00 64 00 65 00 20 00 69 00 73 00 | .C.o.d.e. .i.s.| 20 00 61 00 20 00 70 00 72 00 6f 00 67 00 72 00 | .a. .p.r.o.g.r.| 61 00 6d 00 6d 00 69 00 6e 00 67 00 20 00 63 00 |a.m.m.i.n.g. .c.| 68 00 72 00 65 00 73 00 74 00 6f 00 6d 00 61 00 |h.r.e.s.t.o.m.a.| 74 00 68 00 79 00 20 00 73 00 69 00 74 00 65 00 |t.h.y. .s.i.t.e.| 20 00 3d d8 00 de 2e 00 | .=.....|
- > .\test1 -b hexdump_test_string.utf16
1111111 1111111 0101001 0000000 0110111 0000000 |..R.o.| 0111001 0000000 0110010 0000000 0111010 0000000 |s.e.t.| 0111010 0000000 0110000 0000000 0010000 0000000 |t.a. .| 0100001 0000000 0110111 0000000 0110010 0000000 |C.o.d.| 0110010 0000000 0010000 0000000 0110100 0000000 |e. .i.| 0111001 0000000 0010000 0000000 0110000 0000000 |s. .a.| 0010000 0000000 0111000 0000000 0111001 0000000 | .p.r.| 0110111 0000000 0110011 0000000 0111001 0000000 |o.g.r.| 0110000 0000000 0110110 0000000 0110110 0000000 |a.m.m.| 0110100 0000000 0110111 0000000 0110011 0000000 |i.n.g.| 0010000 0000000 0110001 0000000 0110100 0000000 | .c.h.| 0111001 0000000 0110010 0000000 0111001 0000000 |r.e.s.| 0111010 0000000 0110111 0000000 0110110 0000000 |t.o.m.| 0110000 0000000 0111010 0000000 0110100 0000000 |a.t.h.| 0111100 0000000 0010000 0000000 0111001 0000000 |y. .s.| 0110100 0000000 0111010 0000000 0110010 0000000 |i.t.e.| 0010000 0000000 0011110 1101100 0000000 1101111 | .=...| 0010111 0000000 |..|
Wren
This is only tested on Linux (Ubuntu 22.04).
As my text editor always adds a trailing \n, the method removes this before dumping the remainder.
import "io" for File
import "./seq" for Lst
import "./fmt" for Fmt
class Dumper {
static dump(fileName, base, start, length) {
if ([2, 3, 8, 10, 16].indexOf(base) == -1) Fiber.abort("Base %(base) is not supported.")
var bytes = File.read(fileName).bytes.toList
var bc = bytes.count
// remove final \n if present
if (bc > 0 && bytes[-1] == 10) {
bytes.removeAt(-1)
bc = bc - 1
} else if (bc > 1 && bytes[-1] == 0 && bytes[-2] == 10) {
bytes.removeAt(-1)
bytes.removeAt(-1)
bc = bc - 2
}
if (bc == 0) Fmt.print("$q is empty.", fileName)
if (start < 0 || start >= bc) Fiber.abort("Starting point is invalid.")
if (length < 1 || length > bc - start) length = bc - start
var end = start + length - 1
if (start > 0 || end < bc - 1) {
bytes = bytes[start..end]
bc = end - start + 1
}
var rowLens = {2: 6, 3: 8, 8: 10, 10: 10, 16: 16}
var rl = rowLens[base]
var hrl = rl / 2
var sp = (base < 8) ? " " : " "
var baseFmts = {2: "$08b", 3: "$06t", 8: "$03o", 10: "$03d", 16: "$02x"}
var bf = baseFmts[base]
var bl = Num.fromString(bf[2])
var rows = Lst.chunks(bytes, rl)
var rc = rows.count
Fmt.print("Dump of $q in base $d from byte index $d to $d:", fileName, base, start, end)
for (i in 0...rc) {
var line = rows[i]
var lc = line.count
var ascii = List.filled(lc, 0)
for (b in 0...lc) {
var c = line[b]
if (c >= 32 && c < 127) {
ascii[b] = String.fromByte(c)
} else {
ascii[b] = "."
}
}
var text = "|" + ascii.join() + "|"
var offset = start + i * rl
if (i < rc-1 || lc == rl) {
var fmt = "$08x %(bf)$s%(bf) $s"
Fmt.print(fmt, offset, line[0...hrl], sp, line[hrl..-1], text)
} else {
var extra = " " * ((bl+1) * (rl - lc))
if (lc <= hrl) {
var fmt = "$08x %(bf)$s$s $s"
Fmt.print(fmt, offset, line[0..-1], sp, extra, text)
} else {
var fmt = "$08x %(bf)$s%(bf)$s $s"
Fmt.print(fmt, offset, line[0...hrl], sp, line[hrl..-1], extra, text)
}
}
}
Fmt.print("$08x", start + bc)
}
static dump(fileName, base, start) { dump(fileName, base, start, -1) }
static dump(fileName, base) { dump(fileName, base, 0, -1) }
}
var fileName = "example_utf16.txt"
for (base in [16, 10, 8, 3, 2]) {
Dumper.dump(fileName, base)
System.print()
}
Dumper.dump(fileName, 16, 2, 24)
- Output:
Dump of "example_utf16.txt" in base 16 from byte index 0 to 103: 00000000 ff fe 52 00 6f 00 73 00 65 00 74 00 74 00 61 00 |..R.o.s.e.t.t.a.| 00000010 20 00 43 00 6f 00 64 00 65 00 20 00 69 00 73 00 | .C.o.d.e. .i.s.| 00000020 20 00 61 00 20 00 70 00 72 00 6f 00 67 00 72 00 | .a. .p.r.o.g.r.| 00000030 61 00 6d 00 6d 00 69 00 6e 00 67 00 20 00 63 00 |a.m.m.i.n.g. .c.| 00000040 68 00 72 00 65 00 73 00 74 00 6f 00 6d 00 61 00 |h.r.e.s.t.o.m.a.| 00000050 74 00 68 00 79 00 20 00 73 00 69 00 74 00 65 00 |t.h.y. .s.i.t.e.| 00000060 20 00 3d d8 00 de 2e 00 | .=.....| 00000068 Dump of "example_utf16.txt" in base 10 from byte index 0 to 103: 00000000 255 254 082 000 111 000 115 000 101 000 |..R.o.s.e.| 0000000a 116 000 116 000 097 000 032 000 067 000 |t.t.a. .C.| 00000014 111 000 100 000 101 000 032 000 105 000 |o.d.e. .i.| 0000001e 115 000 032 000 097 000 032 000 112 000 |s. .a. .p.| 00000028 114 000 111 000 103 000 114 000 097 000 |r.o.g.r.a.| 00000032 109 000 109 000 105 000 110 000 103 000 |m.m.i.n.g.| 0000003c 032 000 099 000 104 000 114 000 101 000 | .c.h.r.e.| 00000046 115 000 116 000 111 000 109 000 097 000 |s.t.o.m.a.| 00000050 116 000 104 000 121 000 032 000 115 000 |t.h.y. .s.| 0000005a 105 000 116 000 101 000 032 000 061 216 |i.t.e. .=.| 00000064 000 222 046 000 |....| 00000068 Dump of "example_utf16.txt" in base 8 from byte index 0 to 103: 00000000 377 376 122 000 157 000 163 000 145 000 |..R.o.s.e.| 0000000a 164 000 164 000 141 000 040 000 103 000 |t.t.a. .C.| 00000014 157 000 144 000 145 000 040 000 151 000 |o.d.e. .i.| 0000001e 163 000 040 000 141 000 040 000 160 000 |s. .a. .p.| 00000028 162 000 157 000 147 000 162 000 141 000 |r.o.g.r.a.| 00000032 155 000 155 000 151 000 156 000 147 000 |m.m.i.n.g.| 0000003c 040 000 143 000 150 000 162 000 145 000 | .c.h.r.e.| 00000046 163 000 164 000 157 000 155 000 141 000 |s.t.o.m.a.| 00000050 164 000 150 000 171 000 040 000 163 000 |t.h.y. .s.| 0000005a 151 000 164 000 145 000 040 000 075 330 |i.t.e. .=.| 00000064 000 336 056 000 |....| 00000068 Dump of "example_utf16.txt" in base 3 from byte index 0 to 103: 00000000 100110 100102 010001 000000 011010 000000 011021 000000 |..R.o.s.| 00000008 010202 000000 011022 000000 011022 000000 010121 000000 |e.t.t.a.| 00000010 001012 000000 002111 000000 011010 000000 010201 000000 | .C.o.d.| 00000018 010202 000000 001012 000000 010220 000000 011021 000000 |e. .i.s.| 00000020 001012 000000 010121 000000 001012 000000 011011 000000 | .a. .p.| 00000028 011020 000000 011010 000000 010211 000000 011020 000000 |r.o.g.r.| 00000030 010121 000000 011001 000000 011001 000000 010220 000000 |a.m.m.i.| 00000038 011002 000000 010211 000000 001012 000000 010200 000000 |n.g. .c.| 00000040 010212 000000 011020 000000 010202 000000 011021 000000 |h.r.e.s.| 00000048 011022 000000 011010 000000 011001 000000 010121 000000 |t.o.m.a.| 00000050 011022 000000 010212 000000 011111 000000 001012 000000 |t.h.y. .| 00000058 011021 000000 010220 000000 011022 000000 010202 000000 |s.i.t.e.| 00000060 001012 000000 002021 022000 000000 022020 001201 000000 | .=.....| 00000068 Dump of "example_utf16.txt" in base 2 from byte index 0 to 103: 00000000 11111111 11111110 01010010 00000000 01101111 00000000 |..R.o.| 00000006 01110011 00000000 01100101 00000000 01110100 00000000 |s.e.t.| 0000000c 01110100 00000000 01100001 00000000 00100000 00000000 |t.a. .| 00000012 01000011 00000000 01101111 00000000 01100100 00000000 |C.o.d.| 00000018 01100101 00000000 00100000 00000000 01101001 00000000 |e. .i.| 0000001e 01110011 00000000 00100000 00000000 01100001 00000000 |s. .a.| 00000024 00100000 00000000 01110000 00000000 01110010 00000000 | .p.r.| 0000002a 01101111 00000000 01100111 00000000 01110010 00000000 |o.g.r.| 00000030 01100001 00000000 01101101 00000000 01101101 00000000 |a.m.m.| 00000036 01101001 00000000 01101110 00000000 01100111 00000000 |i.n.g.| 0000003c 00100000 00000000 01100011 00000000 01101000 00000000 | .c.h.| 00000042 01110010 00000000 01100101 00000000 01110011 00000000 |r.e.s.| 00000048 01110100 00000000 01101111 00000000 01101101 00000000 |t.o.m.| 0000004e 01100001 00000000 01110100 00000000 01101000 00000000 |a.t.h.| 00000054 01111001 00000000 00100000 00000000 01110011 00000000 |y. .s.| 0000005a 01101001 00000000 01110100 00000000 01100101 00000000 |i.t.e.| 00000060 00100000 00000000 00111101 11011000 00000000 11011110 | .=...| 00000066 00101110 00000000 |..| 00000068 Dump of "example_utf16.txt" in base 16 from byte index 2 to 25: 00000002 52 00 6f 00 73 00 65 00 74 00 74 00 61 00 20 00 |R.o.s.e.t.t.a. .| 00000012 43 00 6f 00 64 00 65 00 |C.o.d.e.| 0000001a
XPL0
Works for both MS-DOS and RPi Linux.
int Offset, Length, Limit, Byte;
char FileName(80);
func GetByte; \Return a byte from input file
int Return;
[Return:= Byte;
Byte:= ChIn(3); \one-byte look-ahead detects EOF
return Return;
];
proc DumpHex(I); \Show line of hex and its ASCII, starting at offset I
int I, J;
char Line(16);
[HexOut(0, I); Text(0, " ");
SetHexDigits(2);
for J:= 0 to 15 do
[Line(J):= GetByte;
if GetErr and I+J < Limit then Limit:= I+J;
if I+J < Limit then
HexOut(0, Line(J))
else Text(0, " ");
ChOut(0, ^ );
if (J&7) = 7 then ChOut(0, ^ );
];
SetHexDigits(8); \restore default number of digits
ChOut(0, ^|); \display corresponding ASCII characters
for J:= 0 to 15 do
if I+J < Limit then
ChOut(0, if Line(J)<=$1F or Line(J)>=$7F then ^. else Line(J));
ChOut(0, ^|); CrLf(0);
];
func OpenInFile; \Open file for input; return 'true' if success
int FD; \file descriptor
[FD:= FOpen(FileName, 0);
FSet(FD, ^i); \associate device 3 with file; use small buffer (i)
OpenI(3);
return GetErr = 0;
];
func GetFileName; \Get FileName from command line, and set any switches
int C, I; \returns 'true' if no errors
[FileName(0):= 0;
C:= ChIn(8);
loop [while C = $20 do C:= ChIn(8); \skip leading spaces (for MS-DOS)
if C = ^- then
[case ChIn(8) of
^s: Offset:= IntIn(8);
^n: Length:= IntIn(8)
other return false; \Error
Backup; \in case number was terminated by CR or EOF
C:= ChIn(8);
]
else if C = $0D\CR\ or C = $1A\EOF\ then quit
else [I:= 0;
repeat FileName(I):= C;
I:= I+1;
C:= ChIn(8);
until C <= $20;
FileName(I):= 0; \terminate string
];
];
return true;
];
int I;
[Trap(false); \don't abort program on errors
Offset:= 0; Length:= -1>>1;
if not GetFileName then
[Text(0, "Unrecognized switch. Use -s offset, -n length"); exit];
if not OpenInFile(FileName) then
[Text(0, "File not found"); exit];
Byte:= ChIn(3); \look ahead
Limit:= Offset + Length;
if Limit < 0 then Limit:= -1>>1;
for I:= 0 to Offset-1 do \skip any offset bytes
[GetByte; if GetErr then exit];
repeat DumpHex(I);
I:= I + 16;
until I >= Limit;
HexOut(0, Limit); CrLf(0);
]
- Output:
hexdump examp16.txt 00000000 FF FE 52 00 6F 00 73 00 65 00 74 00 74 00 61 00 |..R.o.s.e.t.t.a.| 00000010 20 00 43 00 6F 00 64 00 65 00 20 00 69 00 73 00 | .C.o.d.e. .i.s.| 00000020 20 00 61 00 20 00 70 00 72 00 6F 00 67 00 72 00 | .a. .p.r.o.g.r.| 00000030 61 00 6D 00 6D 00 69 00 6E 00 67 00 20 00 63 00 |a.m.m.i.n.g. .c.| 00000040 68 00 72 00 65 00 73 00 74 00 6F 00 6D 00 61 00 |h.r.e.s.t.o.m.a.| 00000050 74 00 68 00 79 00 20 00 73 00 69 00 74 00 65 00 |t.h.y. .s.i.t.e.| 00000060 20 00 3D D8 00 DE 2E 00 | .=.....| 00000068 hexdump -s 20 examp16.txt -n 20 00000014 6F 00 64 00 65 00 20 00 69 00 73 00 20 00 61 00 |o.d.e. .i.s. .a.| 00000024 20 00 70 00 | .p.| 00000028