← All Duels

grok-4.20-0309-reasoning_vs_gpt-5.4-mini.jsonl — 10 puzzles

grok-4.20-0309-reasoning
1
vs
gpt-5.4-mini
-2
#1 Solved
def mystery(x):
    """Tell whether ``x`` is a sum of two distinct positive cubes in more than one way.

    Only values whose exact type is ``int`` and that are strictly positive
    are considered; anything else yields ``False``.  The cube bases are
    searched over every pair ``1 <= small < large < 20``.

    Returns:
        ``True`` when at least two such pairs satisfy
        ``small**3 + large**3 == x``, otherwise ``False``.
    """
    if not (type(x) == int and x > 0):
        return False

    bound = 20  # exclusive upper limit for both cube bases
    ways = sum(
        1
        for small in range(1, bound)
        for large in range(small + 1, bound)
        if small**3 + large**3 == x
    )
    return ways > 1
1729
1729
Proposer: grok-4.20-0309-reasoning Solver: gpt-5.4-mini
0 vs 0
#2 Solved
def mystery(x):
    """Validate an 8-character ASCII string against a byte table and a checksum.

    The input must be exactly a ``str`` of length 8 containing only ASCII
    characters.  It is rejected when its first and last characters are
    equal, or when the characters at positions 2 and 5 are equal.

    Each character code ``c`` at position ``p`` is then mapped to
    ``((c + p*p + 7) ^ (13*p + 41)) & 255`` and must equal the expected
    byte for that position.  Finally the position-weighted sum of the
    character codes (weights 1..8) must be congruent to 56 modulo 113.

    Returns:
        ``True`` if every check passes, otherwise ``False``.
    """
    if not (type(x) is str and len(x) == 8 and x.isascii()):
        return False

    codes = list(map(ord, x))

    # Two cheap structural rejections; XOR of two codes is zero exactly
    # when the codes are equal.
    if codes[0] == codes[-1]:
        return False
    if codes[2] == codes[5]:
        return False

    # Literal values of the original shift expressions:
    # (7<<4)-19, (3<<3)-9, (3<<3)+2, (5<<2)+3, 10*10+1, (16<<4)-5,
    # (15<<4)+2, (15<<4)-1.
    expected = (93, 15, 26, 23, 101, 251, 242, 239)

    for pos, code in enumerate(codes):
        mixed = ((code + pos * pos + 7) ^ (13 * pos + 41)) & 255
        if mixed != expected[pos]:
            return False

    weighted = 0
    for weight, code in enumerate(codes, start=1):
        weighted += weight * code
    return weighted % 113 == 56
"m1N7!qZ3"
"m1N7!qZ3"
Proposer: gpt-5.4-mini Solver: grok-4.20-0309-reasoning
0 vs 0
#3 Solved
def mystery(x):
    """Check whether an 8-character ASCII string hashes to a fixed value.

    The input must be exactly a ``str`` of length 8 containing only ASCII
    characters.  Its hash is the base-31 polynomial of its character codes
    (first character has the highest power) reduced modulo ``2**32``.

    Returns:
        ``True`` when that hash equals 1875867417, otherwise ``False``.
    """
    if not (type(x) is str and len(x) == 8 and x.isascii()):
        return False

    # Closed form of the iterative ``s = (s * 31 + code) % 2**32`` fold:
    # the last character carries 31**0, the one before it 31**1, and so on.
    digest = sum(
        ord(ch) * 31**power for power, ch in enumerate(reversed(x))
    ) % (1 << 32)
    return digest == 1875867417
"\x00\x02\x03\x10\x06\x12\x07\x05"
"enigma42"
Proposer: grok-4.20-0309-reasoning Solver: gpt-5.4-mini
0 vs 0
#4 Solved
def mystery(x):
    """Validate a 10-character printable string against a scrambled byte table.

    The input must be exactly a ``str`` of length 10 whose character codes
    all lie in 33..126.  Each position ``k`` is mixed with its cyclic
    predecessor and with the character two places ahead (cyclically); the
    mixed bytes are then read in the order ``(3*k + 1) % 10``, masked with
    ``(37*k + 11) & 255`` and compared with the expected table.  The
    position-weighted sum of the codes (weights 1..10) must also be
    congruent to 40 modulo 101.

    Returns:
        ``True`` if both the table and the checksum match, else ``False``.
    """
    if not (type(x) is str and len(x) == 10 and x.isascii()):
        return False

    codes = [ord(ch) for ch in x]
    if not all(33 <= code <= 126 for code in codes):
        return False

    size = 10
    # codes[k - 1] wraps to the last element for k == 0 via negative indexing.
    mixed = [
        ((codes[k] + codes[k - 1] + 7 * k + 19) ^ (codes[(k + 2) % size] >> 1)) & 255
        for k in range(size)
    ]

    expected = (183, 161, 179, 207, 21, 91, 29, 141, 171, 181)
    for k, want in enumerate(expected):
        got = mixed[(k * 3 + 1) % size] ^ ((37 * k + 11) & 255)
        if got != want:
            return False

    weighted = sum(weight * code for weight, code in enumerate(codes, start=1))
    return weighted % 101 == 40
"AAAAAAAAAA"
"AAAAAAAAAA"
Proposer: gpt-5.4-mini Solver: grok-4.20-0309-reasoning
0 vs 0
#5 Solver Failed
def mystery(x):
    """Validate an 8-character printable string against a scrambled byte table.

    The input must be exactly a ``str`` of length 8 whose character codes
    all lie in 33..126.  For each position ``k`` the code is tripled,
    combined with the code two places behind (cyclically) and ``11*k``,
    XOR-ed with twice the code three places ahead (cyclically), offset by
    7 and truncated to a byte.  Those bytes are read in the order
    ``(5*k + 3) % 8``, masked with ``(19*k + 7) & 255`` and compared with
    the expected table.  The position-weighted sum of the codes
    (weights 1..8) must also be congruent to 100 modulo 113.

    Returns:
        ``True`` if both the table and the checksum match, else ``False``.
    """
    if not (type(x) is str and len(x) == 8 and x.isascii()):
        return False

    codes = list(map(ord, x))
    if min(codes) < 33 or max(codes) > 126:
        return False

    size = len(codes)
    stage = []
    for k, code in enumerate(codes):
        behind = codes[(k - 2) % size]
        ahead = codes[(k + 3) % size]
        blended = (code * 3 + behind + 11 * k) ^ (ahead * 2)
        stage.append((blended + 7) & 255)

    expected = [10, 122, 161, 170, 97, 173, 102, 17]
    scrambled = [
        stage[(k * 5 + 3) % size] ^ ((19 * k + 7) & 255) for k in range(size)
    ]
    if scrambled != expected:
        return False

    weighted = sum(weight * code for weight, code in enumerate(codes, start=1))
    return weighted % 113 == 100
None
"C0d3R3v!"
Proposer: grok-4.20-0309-reasoning Solver: gpt-5.4-mini
1 vs 0
#6 Solved
def mystery(x):
    """Validate an 11-character printable string via a three-stage byte transform.

    The input must be exactly a ``str`` of length 11 whose character codes
    all lie in 33..126.

    Stage 1 combines each code with twice its cyclic predecessor, three
    times its cyclic successor and ``5*k``, truncated to a byte.
    Stage 2 reads stage 1 in the order ``(4*k + 3) % 11`` and XORs with
    ``11*k + 29``, truncated to a byte.
    Stage 3 reads stage 2 in the order ``(7*k + 2) % 11`` and adds
    ``13*k``, truncated to a byte; the result must equal the expected table.

    In addition the plain sum of the codes must be congruent to 2 modulo 19
    and the position-weighted sum (weights 1..11) to 44 modulo 97.

    Returns:
        ``True`` if all three conditions hold, otherwise ``False``.
    """
    if not (type(x) is str and len(x) == 11 and x.isascii()):
        return False

    codes = [ord(ch) for ch in x]
    if not all(33 <= code <= 126 for code in codes):
        return False

    size = 11
    positions = range(size)

    first = []
    for k in positions:
        neighbours = 2 * codes[(k - 1) % size] + 3 * codes[(k + 1) % size]
        first.append((codes[k] + neighbours + 5 * k) & 255)

    second = []
    for k in positions:
        second.append((first[(k * 4 + 3) % size] ^ (11 * k + 29)) & 255)

    third = []
    for k in positions:
        third.append((second[(k * 7 + 2) % size] + 13 * k) & 255)

    if third != [245, 113, 185, 232, 217, 232, 22, 244, 76, 232, 2]:
        return False
    if sum(codes) % 19 != 2:
        return False
    weighted = sum(weight * code for weight, code in enumerate(codes, start=1))
    return weighted % 97 == 44
"!!!!!!!!!!!"
"!!!!!!!!!!!"
Proposer: gpt-5.4-mini Solver: grok-4.20-0309-reasoning
1 vs 0
#7 Solved
def mystery(x):
    """Validate a 10-character printable string via a three-stage byte transform.

    The input must be exactly a ``str`` of length 10 whose character codes
    all lie in 33..126.

    Stage 1 combines five times each code with twice its cyclic
    predecessor, three times its cyclic successor and ``7*k``, truncated to
    a byte.
    Stage 2 reads stage 1 in the order ``(3*k + 2) % 10`` and XORs with
    ``13*k + 37``, truncated to a byte.
    Stage 3 reads stage 2 at index ``(5*k + 1) % 10`` (which only ever
    takes the values 1 and 6) and adds ``11*k + 5``, truncated to a byte;
    the result must equal the expected table.

    In addition the plain sum of the codes must be congruent to 12 modulo
    23 and the position-weighted sum (weights 1..10) to 20 modulo 101.

    Returns:
        ``True`` if all three conditions hold, otherwise ``False``.
    """
    if not (type(x) is str and len(x) == 10 and x.isascii()):
        return False

    codes = list(map(ord, x))
    if min(codes) < 33 or max(codes) > 126:
        return False

    size = 10

    def stage_one(k):
        before = codes[(k - 1) % size]
        after = codes[(k + 1) % size]
        return (codes[k] * 5 + before * 2 + after * 3 + k * 7) & 255

    def stage_two(k):
        return (stage_one((k * 3 + 2) % size) ^ (13 * k + 37)) & 255

    def stage_three(k):
        return (stage_two((k * 5 + 1) % size) + 11 * k + 5) & 255

    expected = (91, 29, 113, 51, 135, 73, 157, 95, 179, 117)
    for k, want in enumerate(expected):
        if stage_three(k) != want:
            return False

    if sum(codes) % 23 != 12:
        return False
    weighted = sum(weight * code for weight, code in enumerate(codes, start=1))
    return weighted % 101 == 20
'+!!!"R!!-"'
"42isanswer"
Proposer: grok-4.20-0309-reasoning Solver: gpt-5.4-mini
1 vs 0
#8 Sample Solution Wrong
def mystery(x):
    """Validate a 7-character printable string via a three-stage byte transform.

    The input must be exactly a ``str`` of length 7 whose character codes
    all lie in 33..126.

    Stage 1 combines each code with three times its cyclic predecessor,
    five times its cyclic successor and ``17*k + 11``, XORs that with seven
    times the code three places ahead (cyclically), and truncates to a byte.
    Stage 2 reads stage 1 in the order ``(3*k + 2) % 7`` and XORs with
    ``(29*k + 41) & 255``.
    Stage 3 combines five times stage 2 at ``(2*k + 1) % 7`` with stage 2
    at ``(k + 3) % 7`` and ``7*k``, XORs with ``0xA5`` and truncates to a
    byte; the result must equal the expected table.

    In addition the plain sum of the codes must be congruent to 67 modulo
    97 and the position-weighted sum (weights 1..7) to 2 modulo 101.

    Returns:
        ``True`` if all three conditions hold, otherwise ``False``.
    """
    if not (type(x) is str and len(x) == 7 and x.isascii()):
        return False

    codes = [ord(ch) for ch in x]
    if not all(33 <= code <= 126 for code in codes):
        return False

    size = 7
    positions = range(size)

    first = []
    for k in positions:
        linear = (
            codes[k]
            + 3 * codes[(k - 1) % size]
            + 5 * codes[(k + 1) % size]
            + 17 * k
            + 11
        )
        first.append((linear ^ (7 * codes[(k + 3) % size])) & 255)

    second = [first[(k * 3 + 2) % size] ^ ((29 * k + 41) & 255) for k in positions]

    third = []
    for k in positions:
        combined = second[(k * 2 + 1) % size] * 5 + second[(k + 3) % size] + 7 * k
        third.append((combined ^ 0xA5) & 255)

    if third != [44, 85, 59, 62, 46, 180, 14]:
        return False
    if sum(codes) % 97 != 67:
        return False
    weighted = sum(weight * code for weight, code in enumerate(codes, start=1))
    return weighted % 101 == 2
"AAAAAAA"
Proposer: gpt-5.4-mini Solver: grok-4.20-0309-reasoning
1 vs -1
#9 Solved
def mystery(x):
    """Validate an 8-character printable string via a three-stage byte transform.

    The input must be exactly a ``str`` of length 8 whose character codes
    all lie in 33..126.

    Stage 1 combines each code with twice its cyclic predecessor, three
    times its cyclic successor and ``5*k``, truncated to a byte.
    Stage 2 reads stage 1 in the order ``(3*k + 2) % 8`` and XORs with
    ``11*k + 37``, truncated to a byte.
    Stage 3 reads stage 2 in the order ``(5*k + 1) % 8`` and adds ``13*k``,
    truncated to a byte; the result must equal the expected table.

    In addition the plain sum of the codes must be congruent to 2 modulo 17
    and the position-weighted sum (weights 1..8) to 24 modulo 101.

    Returns:
        ``True`` if all three conditions hold, otherwise ``False``.
    """
    if not (type(x) is str and len(x) == 8 and x.isascii()):
        return False

    codes = list(map(ord, x))
    if min(codes) < 33 or max(codes) > 126:
        return False

    size = 8
    expected = (251, 142, 174, 63, 231, 240, 220, 87)

    first = [0] * size
    for k, code in enumerate(codes):
        before = codes[(k - 1) % size]
        after = codes[(k + 1) % size]
        first[k] = (code + 2 * before + 3 * after + 5 * k) & 255

    second = [0] * size
    for k in range(size):
        second[k] = (first[(k * 3 + 2) % size] ^ (11 * k + 37)) & 255

    for k, want in enumerate(expected):
        if (second[(k * 5 + 1) % size] + 13 * k) & 255 != want:
            return False

    if sum(codes) % 17 != 2:
        return False
    weighted = sum(weight * code for weight, code in enumerate(codes, start=1))
    return weighted % 101 == 24
"42puzzle"
"42puzzle"
Proposer: grok-4.20-0309-reasoning Solver: gpt-5.4-mini
1 vs -1
#10 Sample Solution Wrong
def mystery(x):
    """Validate a 9-character printable string via a two-stage byte transform.

    The input must be exactly a ``str`` of length 9 whose character codes
    all lie in 33..126.

    Stage 1 combines three times each code with five times its cyclic
    predecessor, seven times its cyclic successor and ``11*k``, XORs that
    with half (integer shift) of the code three places ahead (cyclically),
    and truncates to a byte.
    Stage 2 reads stage 1 in the order ``(4*k + 2) % 9`` and XORs with
    ``(19*k + 37) & 255``; the result must equal the expected table.

    In addition the plain sum of the codes must be congruent to 30 modulo
    127 and the position-weighted sum (weights 1..9) to 19 modulo 131.

    Returns:
        ``True`` if all three conditions hold, otherwise ``False``.
    """
    if not (type(x) is str and len(x) == 9 and x.isascii()):
        return False

    codes = [ord(ch) for ch in x]
    if min(codes) < 33 or max(codes) > 126:
        return False

    size = 9

    def blend(k):
        linear = (
            codes[k] * 3
            + codes[(k - 1) % size] * 5
            + codes[(k + 1) % size] * 7
            + 11 * k
        )
        return (linear ^ (codes[(k + 3) % size] >> 1)) & 255

    expected = (170, 72, 197, 41, 243, 156, 244, 142, 245)
    for k, want in enumerate(expected):
        got = blend((k * 4 + 2) % size) ^ ((19 * k + 37) & 255)
        if got != want:
            return False

    if sum(codes) % 127 != 30:
        return False
    weighted = sum(weight * code for weight, code in enumerate(codes, start=1))
    return weighted % 131 == 19
"K3!mP7@tR"
Proposer: gpt-5.4-mini Solver: grok-4.20-0309-reasoning
1 vs -2