import base64
import os.path
from random import randbytes

import pandas as pd
import matplotlib.pyplot as plt

# From pyca/cryptography
from cryptography.hazmat.primitives import padding
from cryptography.hazmat.primitives.ciphers import Cipher, algorithms, modes

def xor(x, y):
    """Return the byte-wise XOR of x and y.

    The result is as long as the shorter of the two inputs; any excess
    bytes of the longer input are ignored.
    """
    return bytes(map(int.__xor__, x, y))

mask32 = 0xFFFFFFFF

def lrot32(n, k):
    """Left rotate the low 32 bits of n by k bits.

    Bits of n above bit 31 are discarded before rotating, and the
    rotate count is reduced modulo 32, so any integer k is accepted (a
    negative k therefore rotates right).
    """
    n &= mask32  # keep stray high bits out of the rotated result
    k %= 32      # avoids a negative shift count below when k > 32
    return ((n << k) | (n >> (32-k))) & mask32

def inv32(n):
    """Return the bitwise complement of n, truncated to 32 bits."""
    flipped = n ^ mask32
    return flipped & mask32

def pad_pkcs7(text):
    """Return text with PKCS#7 padding for a 128-bit block size appended."""
    pkcs7 = padding.PKCS7(128).padder()
    body = pkcs7.update(text)
    return body + pkcs7.finalize()

def unpad_pkcs7(text):
    """Return text with its PKCS#7 padding (128-bit block size) removed."""
    pkcs7 = padding.PKCS7(128).unpadder()
    body = pkcs7.update(text)
    return body + pkcs7.finalize()

def aes_128_ecb_encrypt(ptext, key):
    """Encrypt ptext with AES-128 in ECB mode.

    N.B.: performs no padding; ptext is handed to the cipher as is.
    """
    cipher = Cipher(algorithms.AES128(key), modes.ECB())
    encryptor = cipher.encryptor()
    body = encryptor.update(ptext)
    return body + encryptor.finalize()

def aes_128_ecb_decrypt(ctext, key):
    """Decrypt ctext with AES-128 in ECB mode and strip the PKCS#7 padding."""
    cipher = Cipher(algorithms.AES128(key), modes.ECB())
    decryptor = cipher.decryptor()
    padded = decryptor.update(ctext) + decryptor.finalize()
    return unpad_pkcs7(padded)

def aes_128_cbc_encrypt(ptext, key, iv):
    """PKCS#7-pad ptext and encrypt it with AES-128 in CBC mode."""
    cipher = Cipher(algorithms.AES128(key), modes.CBC(iv))
    encryptor = cipher.encryptor()
    body = encryptor.update(pad_pkcs7(ptext))
    return body + encryptor.finalize()

def aes_128_cbc_decrypt(ctext, key, iv):
    """Decrypt ctext with AES-128 in CBC mode and strip the PKCS#7 padding."""
    cipher = Cipher(algorithms.AES128(key), modes.CBC(iv))
    decryptor = cipher.decryptor()
    padded = decryptor.update(ctext) + decryptor.finalize()
    return unpad_pkcs7(padded)

def aes_128_ctr_crypt(text, key, nonce, offset=0):
    """Encrypt or decrypt text with AES-128 in CTR mode (the same operation).

    Each keystream block is the ECB encryption of nonce followed by an
    8-byte little-endian block counter.  offset is the counter value of
    the first keystream block used.
    """
    block_count = (len(text) + 15) // 16  # keystream blocks needed
    keystream = bytearray()
    for counter in range(offset, offset + block_count):
        counter_block = nonce + counter.to_bytes(8, "little")
        keystream += aes_128_ecb_encrypt(counter_block, key)
    return xor(text, keystream[:len(text)])

def A(n):
    """Return a byte string consisting of n copies of the letter "A"."""
    letter = bytes([0x41])  # b"A"
    return letter * n

def hamming_distance(x, y):
    """Count the positions at which x and y hold different elements.

    Only the positions both sequences have in common are compared; the
    tail of the longer sequence is ignored.
    """
    differing = 0
    for left, right in zip(x, y):
        if left != right:
            differing += 1
    return differing


# Secret key and nonce shared by the "server side" functions below.
# Drawn from the operating system's CSPRNG rather than the random
# module, whose Mersenne Twister output is predictable and not meant
# for key material.
random_key = os.urandom(16)
random_nonce = os.urandom(8)

def edit(ctext, key, nonce, offset, new_text):
    """Return ctext with the bytes at offset replaced by encrypted new_text.

    new_text is encrypted with the part of the CTR keystream that
    starts at byte position offset, then spliced over the corresponding
    ciphertext bytes.
    """
    # CTR mode has no real block structure: the plaintext is simply
    # XOR-ed with a keystream.  Blocks only matter for locating the
    # right keystream position, so encrypt from the start of the
    # containing block with filler in front and drop the filler again.
    first_block, skip = divmod(offset, 16)
    aligned = A(skip) + new_text
    patch = aes_128_ctr_crypt(aligned, key, nonce, first_block)[skip:]
    head = ctext[:offset]
    tail = ctext[offset+len(new_text):]
    return head + patch + tail

def attack_edit(ctext, offset, new_text):
    """Edit ctext under the secret key and nonce, which the caller never sees."""
    return edit(
        ctext=ctext,
        key=random_key,
        nonce=random_nonce,
        offset=offset,
        new_text=new_text,
    )

# Read the base64 input inside a context manager so that the file
# handle is closed deterministically
with open("07.in") as f:
    encoded = f.read()

# Decrypt the ECB-encrypted input and re-encrypt it in CTR mode under
# the secret key and nonce
ciphertext = aes_128_ctr_crypt(
    aes_128_ecb_decrypt(base64.b64decode(encoded), b"YELLOW SUBMARINE"),
    random_key,
    random_nonce
)

# "Editing" the whole ciphertext to contain the ciphertext itself XORs
# it with the same keystream a second time, which hands back the
# plaintext
plaintext = attack_edit(ciphertext, 0, new_text=ciphertext)
print(plaintext.decode("ASCII").strip())

I'm back and I'm ringin' the bell 
A rockin' on the mike while the fly girls yell 
In ecstasy in the back of me 
Well that's my DJ Deshay cuttin' all them Z's 
Hittin' hard and the girlies goin' crazy 
Vanilla's on the mike, man I'm not lazy. 

I'm lettin' my drug kick in 
It controls my mouth and I begin 
To just let it flow, let my concepts go 
My posse's to the side yellin', Go Vanilla Go! 

Smooth 'cause that's the way I will be 
And if you don't give a damn, then 
Why you starin' at me 
So get off 'cause I control the stage 
There's no dissin' allowed 
I'm in my own phase 
The girlies sa y they love me and that is ok 
And I can dance better than any kid n' play 

Stage 2 -- Yea the one ya' wanna listen to 
It's off my head so let the beat play through 
So I can funk it up and make it sound good 
1-2-3 Yo -- Knock on some wood 
For good luck, I like my rhymes atrocious 
Supercalafragilisticexpialidocious 
I'm an effect and that you can bet 
I can take a fly girl and make her wet. 

I'm like Samson -- Samson to Delilah 
There's no denyin', You can try to hang 
But you'll keep tryin' to get my style 
Over and over, practice makes perfect 
But not if you're a loafer. 

You'll get nowhere, no place, no time, no girls 
Soon -- Oh my God, homebody, you probably eat 
Spaghetti with a spoon! Come on and say it! 

VIP. Vanilla Ice yep, yep, I'm comin' hard like a rhino 
Intoxicating so you stagger like a wino 
So punks stop trying and girl stop cryin' 
Vanilla Ice is sellin' and you people are buyin' 
'Cause why the freaks are jockin' like Crazy Glue 
Movin' and groovin' trying to sing along 
All through the ghetto groovin' this here song 
Now you're amazed by the VIP posse. 

Steppin' so hard like a German Nazi 
Startled by the bases hittin' ground 
There's no trippin' on mine, I'm just gettin' down 
Sparkamatic, I'm hangin' tight like a fanatic 
You trapped me once and I thought that 
You might have it 
So step down and lend me your ear 
'89 in my time! You, '90 is my year. 

You're weakenin' fast, YO! and I can tell it 
Your body's gettin' hot, so, so I can smell it 
So don't be mad and don't be sad 
'Cause the lyrics belong to ICE, You can call me Dad 
You're pitchin' a fit, so step back and endure 
Let the witch doctor, Ice, do the dance to cure 
So come up close and don't be square 
You wanna battle me -- Anytime, anywhere 

You thought that I was weak, Boy, you're dead wrong 
So come on, everybody and sing this song 

Say -- Play that funky music Say, go white boy, go white boy go 
play that funky music Go white boy, go white boy, go 
Lay down and boogie and play that funky music till you die. 

Play that funky music Come on, Come on, let me hear 
Play that funky music white boy you say it, say it 
Play that funky music A little louder now 
Play that funky music, white boy Come on, Come on, Come on 
Play that funky music


# Fixed text that fun1 places before and after the quoted user data
# prior to encryption
prefix = b"comment1=cooking%20MCs;userdata="
suffix = b";comment2=%20like%20a%20pound%20of%20bacon"

def fun1(userdata):
    """Quote ";" and "=" in userdata, wrap it in prefix/suffix, CTR-encrypt."""
    quoted = userdata.replace(b";", b"%3B").replace(b"=", b"%3D")
    cookie = prefix + quoted + suffix
    return aes_128_ctr_crypt(cookie, random_key, random_nonce)

def fun2(ctext):
    """Return whether the CTR decryption of ctext contains ";admin=true;"."""
    decrypted = aes_128_ctr_crypt(ctext, random_key, random_nonce)
    return b";admin=true;" in decrypted

# fun1 quotes ";" and "=" in the user data, so the admin marker cannot
# be injected directly
ciphertext = fun1(b"the ;admin=true; in this string will be quoted away")

print(fun2(ciphertext))

False


# CTR bitflipping: XOR-ing the ciphertext with (known plaintext XOR
# desired plaintext) changes the decrypted text from the former to the
# latter.  Here the first n bytes of the known prefix are overwritten.
replacement_text = b";admin=true;"
n = len(replacement_text)
delta = xor(prefix[:n], replacement_text)
new_ciphertext = xor(ciphertext[:n], delta) + ciphertext[n:]
print(fun2(new_ciphertext))

True


def fun1(userdata):
    """Quote ";" and "=" in userdata, wrap it in prefix/suffix, CBC-encrypt.

    The secret key doubles as the IV.
    """
    # Back to CBC mode
    quoted = userdata.replace(b";", b"%3B").replace(b"=", b"%3D")
    cookie = prefix + quoted + suffix
    return aes_128_cbc_encrypt(cookie, key=random_key, iv=random_key)

def fun3(ctext):
    """CBC-decrypt ctext (IV = key); return (all bytes below 128?, plaintext)."""
    ptext = aes_128_cbc_decrypt(ctext, key=random_key, iv=random_key)
    is_ascii = not any(byte >= 128 for byte in ptext)
    return (is_ascii, ptext)

# Replace ciphertext blocks 2 and 3 so that the message starts with
# C1, 0, C1.  CBC decryption then yields P1' = D(C1) XOR IV and
# P3' = D(C1) XOR 0, hence P1' XOR P3' = IV, which here is the key.
ciphertext = bytearray(fun1(A(48)))
ciphertext[16:32] = bytes(16)
ciphertext[32:48] = ciphertext[:16]

# The tampered plaintext is expected to contain bytes >= 128, in which
# case fun3 hands it back flagged as invalid
is_valid, plaintext = fun3(bytes(ciphertext))
assert not is_valid

recovered_key = xor(plaintext[:16], plaintext[32:48])
recovered_key == random_key

True


def sha1(message, starting_hash=None, starting_offset=0):
    """Return the SHA-1 digest of message as a 40-character hex string.

    The two optional parameters exist for length-extension attacks:

    starting_hash -- hex digest whose five 32-bit words replace the
        standard initial state.
    starting_offset -- byte offset into the padded message at which
        chunk processing starts; earlier chunks are skipped.

    The padding is always computed from the length of the whole of
    message, whatever starting_offset is.
    """

    # Initialize hash
    if starting_hash is not None:
        h0, h1, h2, h3, h4 = (
            int(starting_hash[i:i+8], 16) for i in range(0, 40, 8)
        )
    else:
        h0 = 0x67452301
        h1 = 0xEFCDAB89
        h2 = 0x98BADCFE
        h3 = 0x10325476
        h4 = 0xC3D2E1F0

    # Pad message and append message length in bits (8 bytes,
    # big-endian) so that message is a multiple of 64 bytes in length
    oml = len(message)  # original message length
    n = 63 - (oml+8)%64
    message = message + b"\x80" + bytes(n) + int.to_bytes(oml*8, 8, "big")

    # For each chunk
    for i in range(starting_offset, len(message), 64):

        # Create 80-word "message schedule": the 16 big-endian words of
        # the chunk, extended by rotated XORs of earlier words
        w = [
            int.from_bytes(message[i+j:i+j+4], "big")
            for j in range(0, 64, 4)
        ]
        for j in range(16, 80):
            w.append(lrot32(w[j-3] ^ w[j-8] ^ w[j-14] ^ w[j-16], 1))

        # Initialize chunk hash from running hash
        a, b, c, d, e = h0, h1, h2, h3, h4

        # 80 steps in four groups of 20, each group with its own
        # mixing function f and additive constant k
        for j in range(80):
            if j < 20:
                f = (b & c) | (inv32(b) & d)
                k = 0x5A827999
            elif j < 40:
                f = b ^ c ^ d
                k = 0x6ED9EBA1
            elif j < 60:
                f = (b & c) | (b & d) | (c & d)
                k = 0x8F1BBCDC
            else:
                f = b ^ c ^ d
                k = 0xCA62C1D6
            temp = (lrot32(a, 5) + f + e + k + w[j]) & mask32
            a, b, c, d, e = temp, a, lrot32(b, 30), c, d

        # Add chunk hash back into running hash
        h0 = (h0 + a) & mask32
        h1 = (h1 + b) & mask32
        h2 = (h2 + c) & mask32
        h3 = (h3 + d) & mask32
        h4 = (h4 + e) & mask32

    return "%08x%08x%08x%08x%08x" % (h0, h1, h2, h3, h4)

# Show that the hashes are not just different, but very different

def hash_distance(message_1, message_2):
    """Return "<d>/40", d being the number of differing SHA-1 hex digits."""
    digest_1 = sha1(message_1)
    digest_2 = sha1(message_2)
    differing = hamming_distance(digest_1, digest_2)
    return f"{differing}/40"

# In turn: same key with a changed message, changed key with the same
# message, and both changed
print(hash_distance(random_key + b"message", random_key + b"MESSAGE"))
print(hash_distance(random_key + b"message", b"different key" + b"message"))
print(hash_distance(random_key + b"MESSAGE", b"different key" + b"message"))

38/40
39/40
37/40


message = b"comment1=cooking%20MCs;userdata=foo;comment2=%20like%20a%20pound%20of%20bacon"

# Recreate the padding added internally by SHA-1 (here we use
# knowledge of the length of the key).  N.B.: the result is called
# glue_padding, not padding, so that it does not rebind the `padding`
# module imported from cryptography, which pad_pkcs7 and unpad_pkcs7
# look up each time they are called.
oml = len(random_key) + len(message)
n = 63 - (oml+8)%64
glue_padding = b"\x80" + bytes(n) + int.to_bytes(oml*8, 8, "big")

# Hash the original message (which includes hashing the padding) as
# would be done by the server and as would be returned to the client
h_original = sha1(random_key + message)

# The attack message
attack_message = message + glue_padding + b";admin=true"

# Now craft a hash, knowing only the length of the key but not the key
# itself, by picking up where SHA-1 left off before
h_fake = sha1(
    A(len(random_key)) + attack_message,
    h_original,
    len(random_key)+len(message)+len(glue_padding)
)

# Hash the attack message as would be done by the server and check,
# would we fool the server?
h_attack = sha1(random_key + attack_message)
h_fake == h_attack

True


def md4(message, starting_hash=None, starting_offset=0):
    """Return the MD4 digest of message as a 32-character hex string.

    The two optional parameters exist for length-extension attacks:

    starting_hash -- hex digest whose four little-endian 32-bit words
        replace the standard initial state.
    starting_offset -- byte offset into the padded message at which
        chunk processing starts; earlier chunks are skipped.

    The padding is always computed from the length of the whole of
    message, whatever starting_offset is.
    """

    def F(x, y, z):
        return (x & y) | (inv32(x) & z)

    def G(x, y, z):
        return (x & y) | (x & z) | (y & z)

    def H(x, y, z):
        return x ^ y ^ z

    # One entry per round: mixing function, the four rotate amounts
    # (cycled through), the order in which the 16 block words are
    # consumed, and the additive constant
    rounds = (
        (F, (3, 7, 11, 19),
         (0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15),
         0),
        (G, (3, 5, 9, 13),
         (0, 4, 8, 12, 1, 5, 9, 13, 2, 6, 10, 14, 3, 7, 11, 15),
         0x5A827999),
        (H, (3, 9, 11, 15),
         (0, 8, 4, 12, 2, 10, 6, 14, 1, 9, 5, 13, 3, 11, 7, 15),
         0x6ED9EBA1),
    )

    # Initialize hash
    if starting_hash is not None:
        h = [
            int.from_bytes(bytes.fromhex(starting_hash[i:i+8]), "little")
            for i in range(0, 32, 8)
        ]
    else:
        h = [0x67452301, 0xEFCDAB89, 0x98BADCFE, 0x10325476]

    # Pad message and append message length in bits (8 bytes,
    # little-endian) so that message is a multiple of 64 bytes in
    # length
    oml = len(message)  # original message length
    pad_len = 63 - (oml+8)%64
    message = (
        message + b"\x80" + bytes(pad_len) + int.to_bytes(oml*8, 8, "little")
    )

    # For each chunk
    for start in range(starting_offset, len(message), 64):

        # Create 16-word block
        X = [
            int.from_bytes(message[start+j:start+j+4], "little")
            for j in range(0, 64, 4)
        ]

        # Initialize chunk hash from running hash
        ch = h.copy()

        for func, shifts, word_order, constant in rounds:
            for step in range(16):
                # The register being updated moves backwards by one
                # each step (a, d, c, b, a, ...); the other three, in
                # cyclic order, feed the mixing function
                a, b, c, d = ((idx - step) % 4 for idx in range(4))
                total = (
                    ch[a] + func(ch[b], ch[c], ch[d])
                    + X[word_order[step]] + constant
                )
                ch[a] = lrot32(total & mask32, shifts[step % 4])

        # Add chunk hash back into running hash
        h = [(x + y) & mask32 for x, y in zip(h, ch)]

    return b"".join(int.to_bytes(x, 4, "little") for x in h).hex()


message = b"comment1=cooking%20MCs;userdata=foo;comment2=%20like%20a%20pound%20of%20bacon"

# Recreate the padding added internally by MD4 (here we use
# knowledge of the length of the key).  N.B.: the result is called
# glue_padding, not padding, so that it does not rebind the `padding`
# module imported from cryptography, which pad_pkcs7 and unpad_pkcs7
# look up each time they are called.
oml = len(random_key) + len(message)
n = 63 - (oml+8)%64
glue_padding = b"\x80" + bytes(n) + int.to_bytes(oml*8, 8, "little")

# Hash the original message (which includes hashing the padding) as
# would be done by the server and as would be returned to the client
h_original = md4(random_key + message)

# The attack message
attack_message = message + glue_padding + b";admin=true"

# Now craft a hash, knowing only the length of the key but not the key
# itself, by picking up where MD4 left off before
h_fake = md4(
    A(len(random_key)) + attack_message,
    h_original,
    len(random_key)+len(message)+len(glue_padding)
)

# Hash the attack message as would be done by the server and check,
# would we fool the server?
h_attack = md4(random_key + attack_message)
h_fake == h_attack

True


M = 10    # maximum number of comparisons to test
N = 1000  # sample size

# Collect the timing data only once; later runs reuse the CSV file
if not os.path.exists("31-timing-data-50ms.csv"):

    # IMPORTS

    import csv
    from http.server import HTTPServer, BaseHTTPRequestHandler
    from threading import Thread
    # perf_counter is the clock intended for measuring short intervals;
    # unlike time() it is unaffected by system clock adjustments
    from time import perf_counter, sleep
    from urllib.parse import urlparse, parse_qs

    import requests

    # SERVER

    delay = 50  # milliseconds

    class handler(BaseHTTPRequestHandler):

        def do_GET(self):
            url = urlparse(self.path)
            if url.path == "/test":
                # Simulated early-exit comparison against an all-"A"
                # signature: one delay per character examined, stopping
                # at the first mismatch
                s = parse_qs(url.query)["signature"][0]
                for c in s:
                    sleep(delay/1000)
                    if c != "A":
                        break
            elif url.path == "/exit":
                # Shut down from a separate thread, after a pause, so
                # that this request can still be answered
                def shutdown():
                    sleep(1)
                    self.server.shutdown()
                Thread(target=shutdown).start()
            self.send_response(200)
            self.end_headers()

        def log_message(self, *args, **kwargs):
            # Suppress per-request logging
            pass

    Thread(
        target=lambda: HTTPServer(("", 8000), handler).serve_forever(),
        daemon=True
    ).start()

    # CLIENT

    # newline="" is what the csv module asks for when writing; without
    # it, platforms that translate "\n" end up with blank rows
    with open("31-timing-data-50ms.csv", "w", newline="") as f:
        fw = csv.writer(f)
        fw.writerow(["num_correct_chars", "time"])
        for num_correct_chars in range(M):
            s = "A"*num_correct_chars + "B"*(40-num_correct_chars)
            for _ in range(N):
                start = perf_counter()
                requests.get(f"http://localhost:8000/test?signature={s}")
                elapsed = perf_counter() - start
                fw.writerow([num_correct_chars, elapsed])

    requests.get("http://localhost:8000/exit")

# Plot the data

df = pd.read_csv("31-timing-data-50ms.csv")

def plot_timing_data():
    """Plot one kernel density estimate of request time per number of
    correct characters (0 to M-1), using the global data frame df."""
    for count in range(M):
        samples = df[df.num_correct_chars == count]
        samples.time.plot.kde()
    plt.xlabel(f"Total comparison time, 1-{M} comparisons (s)")
    plt.show()

plot_timing_data()


def print_timing_statistics(num_digits_guessed=1, data=None,
                            max_comparisons=None, sample_size=None,
                            signature_length=40):
    """Print how reliably the timing data separates comparison counts.

    The first figure is the fraction of sample pairs, one sample with n
    correct characters and one with n + num_digits_guessed, in which
    the former took less time.  The second figure raises the first to
    the power signature_length // num_digits_guessed - 1.

    num_digits_guessed -- number of digits guessed at a time.
    data -- frame with num_correct_chars and time columns; defaults to
        the global df.  It is not modified.
    max_comparisons -- number of distinct num_correct_chars values
        (0 to max_comparisons - 1); defaults to the global M.
    sample_size -- samples per num_correct_chars value; defaults to the
        global N.
    signature_length -- number of digits in a full signature.
    """
    if data is None:
        data = df
    if max_comparisons is None:
        max_comparisons = M
    if sample_size is None:
        sample_size = N
    delta = num_digits_guessed

    # Walk the samples from fastest to slowest.  When a sample with n
    # correct characters comes up, every (n+delta) sample not yet seen
    # is slower than it, i.e. forms a correctly ordered pair.
    ordered = data.sort_values("time")
    seen = [0]*max_comparisons  # seen[n] = samples with n correct chars so far
    s = 0
    for n in ordered.num_correct_chars:
        if n >= max_comparisons:
            continue
        if n < max_comparisons-delta:
            s += sample_size - seen[n+delta]
        # Count every sample, including those of the top delta groups:
        # they are the slower partner in a pair and must not be left at
        # zero, or those pairs would always score as distinguishable
        seen[n] += 1
    p_1 = s/((max_comparisons-delta)*sample_size*sample_size)
    p_success = p_1**(signature_length//delta-1)
    print(
        "P(can distinguish number of comparisons performed)",
        f"= {round(p_1*100, 3)}%"
    )
    print(f"P(overall success) = {round(p_success*100, 3)}%")

# Statistics for the data currently in df, guessing one digit at a time
print_timing_statistics()

P(can distinguish number of comparisons performed) = 99.989%
P(overall success) = 99.568%


def hmac(key, message):
    """Return the HMAC-SHA1 of message under key as a hex string."""
    block_size = 64  # bytes

    # Keys longer than a block are hashed; shorter ones are zero-padded
    if len(key) > block_size:
        key = bytes.fromhex(sha1(key))
    if len(key) < block_size:
        key = key + bytes(block_size - len(key))

    outer_key = xor(key, b"\x5c"*block_size)
    inner_key = xor(key, b"\x36"*block_size)
    inner_digest = bytes.fromhex(sha1(inner_key + message))
    return sha1(outer_key + inner_digest)

def insecure_compare(a, b):
    """Return the length of the matching prefix of a and b.

    The comparison stops at the first mismatch, or at the end of the
    shorter sequence (so a b shorter than a no longer raises
    IndexError).
    """
    n = 0
    for x, y in zip(a, b):
        if x != y:
            break
        n += 1
    return n

def verify_signature(file, signature):
    """Check signature against the HMAC of file under the secret key.

    Returns (comparison time, result of comparison).  The simulated
    comparison time is the number of characters examined: the length
    of the matching prefix plus one.  The result is True only for a
    signature that matches the expected digest over its full length,
    so an empty or truncated signature is rejected.
    """
    expected = hmac(random_key, file)
    n = insecure_compare(signature, expected)
    is_match = n == len(expected) and len(signature) == len(expected)
    return (n+1, is_match)

file = b"foo"

# Recover the signature of file one hex digit at a time, using only the
# comparison time leaked by verify_signature
signature = ["0"]*40  # signature that will be guessed digit by digit
for i in range(len(signature)):
    def probe(i, digit):
        # Try digit at position i (this modifies the shared guess) and
        # record what verify_signature reports for it
        signature[i] = digit
        time, is_correct = verify_signature(file, "".join(signature))
        return {"time": time, "is_correct": is_correct, "digit": digit}
    r = [probe(i, digit) for digit in "0123456789abcdef"]
    if any(t["is_correct"] for t in r):
        # Complete match: probing left the last candidate in place, so
        # put the matching digit back and stop
        signature[i] = [t for t in r if t["is_correct"]][0]["digit"]
        break
    else:
        # The digit with the longest comparison time is the one that
        # extended the matching prefix
        signature[i] = max(r, key=lambda t: t["time"])["digit"]

# Did we correctly guess the signature?
"".join(signature) == hmac(random_key, file)

True


# Switch to the data set in 31-timing-data-1ms.csv; plot_timing_data and
# print_timing_statistics read the global df
df = pd.read_csv("31-timing-data-1ms.csv")
plot_timing_data()


print_timing_statistics()

P(can distinguish number of comparisons performed) = 85.977%
P(overall success) = 0.276%


# Same data, but guessing two digits at a time, i.e. telling n
# comparisons apart from n+2
print_timing_statistics(num_digits_guessed=2)

P(can distinguish number of comparisons performed) = 96.387%
P(overall success) = 49.697%

Set 4: Stream crypto and randomness

Preliminaries

Challenge 25: Break "random access read/write" AES CTR

Challenge 26: CTR bitflipping

Challenge 27: Recover the key from CBC with IV=Key

Challenge 28: Implement a SHA-1 keyed MAC

Challenge 29: Break a SHA-1 keyed MAC using length extension

Challenge 30: Break an MD4 keyed MAC using length extension

Challenge 31: Implement and break HMAC-SHA1 with an artificial timing leak

Challenge 32: Break HMAC-SHA1 with a slightly less artificial timing leak