Topological order
foo
foo/bar
foo/bar/baz
foo-fleem
foo-fleem/morx
Simple version
/* Put re-ordered character from
* string sa into ca */
if (*sa == '/')
ca = 1;
else if (*sa > 0 && *sa < '/')
ca = *sa + 1;
else
ca = *sa;
Single Instruction
Multiple Data
Some 128-bit SIMD registers
four 32-bit integers
data:image/s3,"s3://crabby-images/46fd0/46fd03d4f98013a8b081205a779b7a5aa40977e4" alt=""
eight 16-bit integers
data:image/s3,"s3://crabby-images/1e35f/1e35f87448bc85154adbd63237bc7b9b9204d2db" alt=""
sixteen bytes
data:image/s3,"s3://crabby-images/4e44f/4e44f8f3cf8e1aee133ee71c6b6506d77e926595" alt=""
movdqa (%rdi), %xmm0
paddusb (%rsi), %xmm0
movdqa %xmm0, (%rdi)
data:image/s3,"s3://crabby-images/8c37e/8c37ecded89c863a93b0c8d8a876f62f2558ce69" alt=""
becomes
we already know this tune
movdqa (%rdi), %xmm0
paddusb (%rsi), %xmm0
movdqa %xmm0, (%rdi)
Constructing if-then-else
from
AND, XOR, and OR
if (*sa == '/')
ca = 1;
else
ca = *sa;
xmm1 before pcmpeqb
data:image/s3,"s3://crabby-images/02924/029249805148e08492fd8b81332b3ff4e14ed3ad" alt=""
xmm7
data:image/s3,"s3://crabby-images/cad44/cad441922bc673f9d552e804de67ab5d20c20e97" alt=""
xmm1 after pcmpeqb
data:image/s3,"s3://crabby-images/cb7a1/cb7a15bf6cdf8d55abc384affa810e1956d78ee1" alt=""
xmm6
data:image/s3,"s3://crabby-images/768f4/768f48e0253a363ace21b1ebce9aac28de1771c3" alt=""
movdqa %xmm1, %xmm2
pand %xmm6, %xmm2
xmm2
xmm5
xmm1 before pxor
data:image/s3,"s3://crabby-images/cb7a1/cb7a15bf6cdf8d55abc384affa810e1956d78ee1" alt=""
pxor %xmm5, %xmm1
xmm5 after pxor
xmm0 before pand
data:image/s3,"s3://crabby-images/02924/029249805148e08492fd8b81332b3ff4e14ed3ad" alt=""
xmm1
data:image/s3,"s3://crabby-images/18a51/18a51f11c84b6312cf589fc9218fba104fd99e3f" alt=""
pand %xmm1, %xmm0
xmm0 after pand
xmm0
xmm2
data:image/s3,"s3://crabby-images/6e39e/6e39e010beb70f016611bb3b7f6f938ee575fe8a" alt=""
por %xmm2, %xmm0
xmm0, after por
xmm0
xmm1
pcmpistri %xmm0, %xmm1
rcx register gets 7
carry flag and zero flag get set
pshufb
Bonus slide
Extracting a byte
xmm5
data:image/s3,"s3://crabby-images/8b53d/8b53d00c6195c2000a376d18b9ed7ab145b608c8" alt=""
add $1, %rcx
movq %rcx, %xmm4
data:image/s3,"s3://crabby-images/3533e/3533e0b0decb1260c61f416637931b18555c9610" alt=""
paddb %xmm5, %xmm4
data:image/s3,"s3://crabby-images/63522/635228c716d538dfe3815b2c96d5015dc0581541" alt=""
pshufb %xmm4, %xmm0
movq %xmm0, %rax