← All Duels

gemini-3-flash-preview_vs_grok-4.20-0309-reasoning.jsonl — 10 puzzles

gemini-3-flash-preview
-5
vs
grok-4.20-0309-reasoning
2
#1 Sample Solution Wrong
def mystery(x):
    """Return True only for an 8-character string that mixes to the target pair.

    Characters 0-3 and 4-7 are folded into two integers (shift the
    accumulator left by 8, then OR in the character's code point). The pair
    is then run through 32 add / rotate / xor rounds and compared with two
    fixed constants. Any value that is not a ``str`` of length 8 yields False.
    """
    if not isinstance(x, str):
        return False
    if len(x) != 8:
        return False

    mask = 0xFFFFFFFF
    hi = lo = 0
    for pos in range(4):
        hi = (hi << 8) | ord(x[pos])
        lo = (lo << 8) | ord(x[pos + 4])

    remaining = 32
    while remaining:
        hi = (hi + lo) & mask
        # For a 32-bit value this is a rotate-left by 5; the freshly updated
        # first word is then xor-ed in.
        rotated = ((lo << 5) & mask) | (lo >> 27)
        lo = rotated ^ hi
        remaining -= 1

    return (hi, lo) == (0x6735505E, 0x75981504)
"PuzzleMe"
Proposer: gemini-3-flash-preview Solver: grok-4.20-0309-reasoning
-1 vs 0
#2 Solved
def mystery(x):
    """Return True only for an 8-character string that mixes to the target pair.

    The first and second groups of four characters are each folded into an
    integer (shift left by 8, OR in the code point). Five rounds of
    add / rotate / xor follow, and the result must equal the two expected
    constants. Non-strings and strings whose length is not 8 give False.
    """
    if not (isinstance(x, str) and len(x) == 8):
        return False

    word_mask = 0xFFFFFFFF
    first = 0
    second = 0
    for offset in (0, 1, 2, 3):
        first = (first << 8) | ord(x[offset])
        second = (second << 8) | ord(x[offset + 4])

    for _round in range(5):
        first = (first + second) & word_mask
        # Rotate-left by 5 for a 32-bit value, then xor with the new first word.
        spun = ((second << 5) & word_mask) | (second >> 27)
        second = spun ^ first

    if first != 0x121A20:
        return False
    return second == 0x223A820
"\x00\x00\x00\x01\x00\x00\x00\x01"
'\x00\x00\x00\x01\x00\x00\x00\x01'
Proposer: grok-4.20-0309-reasoning Solver: gemini-3-flash-preview
-1 vs 0
#3 Sample Solution Wrong
def mystery(x):
    """Return True only for an 8-character string that mixes to the target pair.

    The two four-character halves are folded into integers (shift left by 8,
    OR in the code point). Each of the 8 rounds adds 0x9E3779B9 to the first
    word, xors it into the second, rotates the second, and xors the second
    back into the first. The final pair is compared with fixed constants.
    Anything other than a ``str`` of length 8 gives False.
    """
    if not isinstance(x, str):
        return False
    if len(x) != 8:
        return False

    mask = 0xFFFFFFFF
    increment = 0x9E3779B9
    p, q = 0, 0
    for k in range(4):
        p = (p << 8) | ord(x[k])
        q = (q << 8) | ord(x[k + 4])

    rounds_left = 8
    while rounds_left > 0:
        p = (p + increment) & mask
        q ^= p
        # Rotate-left by 13 for a 32-bit value.
        q = ((q << 13) & mask) | (q >> 19)
        p ^= q
        rounds_left -= 1

    return (p, q) == (0x0DC74382, 0xC7AF4F97)
"mystery!"
Proposer: gemini-3-flash-preview Solver: grok-4.20-0309-reasoning
-2 vs 0
#4 Solved
def mystery(x):
    """Return True only for an 8-character string that mixes to the target pair.

    Characters 0-3 and 4-7 are folded into two integers (shift left by 8,
    OR in the code point), mixed for five add / rotate / xor rounds, and
    compared against two fixed constants. Values that are not a ``str`` of
    length 8 are rejected with False.
    """
    if not isinstance(x, str) or len(x) != 8:
        return False

    low32 = 0xFFFFFFFF
    left = right = 0
    for idx in range(4):
        left = (left << 8) | ord(x[idx])
        right = (right << 8) | ord(x[idx + 4])

    step = 0
    while step < 5:
        left = (left + right) & low32
        carried_out = right >> 27
        shifted = (right << 5) & low32
        # shifted | carried_out is a rotate-left by 5 when right fits in 32 bits.
        right = (shifted | carried_out) ^ left
        step += 1

    return left == 0xABD63769 and right == 0xFF1AAC22
"\x11\x22\x33\x44\x55\x66\x77\x88"
'\x11\x22\x33\x44\x55\x66\x77\x88'
Proposer: grok-4.20-0309-reasoning Solver: gemini-3-flash-preview
-2 vs 0
#5 Sample Solution Wrong
def mystery(x):
    """Return True only for an 8-character string that mixes to the target pair.

    The two four-character halves are folded into integers (shift left by 8,
    OR in the code point). Each of the 12 rounds updates the first word
    (xor with 0xDEADBEEF, rotate by 7, add the second word) and then the
    second word (xor with 0xCAFEBABE, rotate by 11, add the new first word),
    keeping 32 bits after every rotate and add. The final pair is compared
    with fixed constants. Anything other than a ``str`` of length 8 gives False.
    """
    if not isinstance(x, str):
        return False
    if len(x) != 8:
        return False

    mask = 0xFFFFFFFF
    first = second = 0
    for pos in (0, 1, 2, 3):
        first = (first << 8) | ord(x[pos])
        second = (second << 8) | ord(x[pos + 4])

    for _round in range(12):
        scratch = first ^ 0xDEADBEEF
        scratch = ((scratch << 7) | (scratch >> 25)) & mask
        first = (scratch + second) & mask

        scratch = second ^ 0xCAFEBABE
        scratch = ((scratch << 11) | (scratch >> 21)) & mask
        second = (scratch + first) & mask

    return (first, second) == (0xC7826622, 0x386D34E9)
"12345678"
Proposer: gemini-3-flash-preview Solver: grok-4.20-0309-reasoning
-3 vs 0
#6 Solved
def mystery(x):
    """Return True only for an 8-character string that mixes to the target pair.

    Both four-character halves are folded into integers (shift left by 8,
    OR in the code point) and put through five add / rotate / xor rounds.
    The outcome must match two fixed constants. Inputs that are not a
    ``str`` of length 8 return False.
    """
    if not (isinstance(x, str) and len(x) == 8):
        return False

    mask = 0xFFFFFFFF
    acc_a = 0
    acc_b = 0
    for n in range(4):
        acc_a = (acc_a << 8) | ord(x[n])
        acc_b = (acc_b << 8) | ord(x[n + 4])

    for _pass in range(5):
        acc_a = (acc_a + acc_b) & mask
        # Rotate-left by 5 for a 32-bit value, then xor with the updated sum.
        turned = ((acc_b << 5) & mask) | (acc_b >> 27)
        acc_b = turned ^ acc_a

    return (acc_a, acc_b) == (0x555551A9, 0xF5F57EE9)
"AAAAAAAA"
'AAAAAAAA'
Proposer: grok-4.20-0309-reasoning Solver: gemini-3-flash-preview
-3 vs 0
#7 Sample Solution Wrong
def mystery(x):
    """Return True only for an 8-character string that mixes to the target pair.

    The two four-character halves are folded into integers (shift left by 8,
    OR in the code point). In each of 32 rounds a key is derived from the
    first word and the round index (multiply by 0x9E3779B1, add the index,
    rotate by 15). The new first word is the second word xor-ed with that
    key, and the new second word is the previous first word. The final pair
    is compared with fixed constants. Anything other than a ``str`` of
    length 8 gives False.
    """
    if not isinstance(x, str):
        return False
    if len(x) != 8:
        return False

    mask = 0xFFFFFFFF
    multiplier = 0x9E3779B1
    left = right = 0
    for pos in range(4):
        left = (left << 8) | ord(x[pos])
        right = (right << 8) | ord(x[pos + 4])

    for step in range(32):
        key = (left * multiplier + step) & mask
        key = ((key << 15) | (key >> 17)) & mask
        # Swap roles: the previous first word becomes the second word unchanged.
        swapped_in = (right ^ key) & mask
        right = left
        left = swapped_in

    return (left, right) == (0x933010F3, 0x9376916E)
"TopCoder"
Proposer: gemini-3-flash-preview Solver: grok-4.20-0309-reasoning
-4 vs 0
#8 Solver Failed
def mystery(x):
    """Return True only for an 8-character string that mixes to the target pair.

    Characters 0-3 and 4-7 are folded into two integers (shift left by 8,
    OR in the code point). Six add / rotate / xor rounds are applied and the
    result is compared with two fixed constants. Any value that is not a
    ``str`` of length 8 produces False.
    """
    if not isinstance(x, str):
        return False
    if len(x) != 8:
        return False

    mask = 0xFFFFFFFF
    total = 0
    mixer = 0
    for i in (0, 1, 2, 3):
        total = (total << 8) | ord(x[i])
        mixer = (mixer << 8) | ord(x[i + 4])

    countdown = 6
    while countdown:
        total = (total + mixer) & mask
        # Rotate-left by 5 for a 32-bit value, then xor with the new total.
        mixer = (((mixer << 5) & mask) | (mixer >> 27)) ^ total
        countdown -= 1

    if total != 0x235C240:
        return False
    return mixer == 0x4640C640
"\x28\xff\xff\xce\xc7\x00\x00\x00"
'\x00\x00\x00\x01\x00\x00\x00\x01'
Proposer: grok-4.20-0309-reasoning Solver: gemini-3-flash-preview
-4 vs 1
#9 Sample Solution Wrong
def mystery(x):
    """Return True only for an 8-character string that mixes to the target pair.

    The two four-character halves are folded into integers (shift left by 8,
    OR in the code point). Eight rounds follow. In each round a running sum
    grows by 0x9E3779B9 (kept to 32 bits), and each word in turn is
    increased by the xor of three terms built from the other word: a left
    shift by 4 plus a constant, the word plus the running sum, and a right
    shift by 5 plus a constant. The final pair is compared with fixed
    constants. Anything other than a ``str`` of length 8 gives False.
    """
    if not (isinstance(x, str) and len(x) == 8):
        return False

    mask = 0xFFFFFFFF
    delta = 0x9E3779B9
    v0 = v1 = 0
    for pos in range(4):
        v0 = (v0 << 8) | ord(x[pos])
        v1 = (v1 << 8) | ord(x[pos + 4])

    for round_no in range(1, 9):
        # Same value as adding delta once per round and masking each time.
        schedule = (round_no * delta) & mask

        term_shl = (v1 << 4) + 0x636F6465
        term_sum = v1 + schedule
        term_shr = (v1 >> 5) + 0x7A6F6E65
        v0 = (v0 + (term_shl ^ term_sum ^ term_shr)) & mask

        term_shl = (v0 << 4) + 0x62797465
        term_sum = v0 + schedule
        term_shr = (v0 >> 5) + 0x736C6F74
        v1 = (v1 + (term_shl ^ term_sum ^ term_shr)) & mask

    return (v0, v1) == (0xB46B9623, 0x47E1136C)
"Pyth0n3!"
Proposer: gemini-3-flash-preview Solver: grok-4.20-0309-reasoning
-5 vs 1
#10 Solver Failed
def mystery(x):
    """Return True only for an 8-character string that mixes to the target pair.

    The first and last four characters are folded into two integers (shift
    left by 8, OR in the code point). Four add / rotate / xor rounds are
    applied, and the resulting pair must equal two fixed constants. Inputs
    that are not a ``str`` of length 8 return False.
    """
    if not isinstance(x, str) or len(x) != 8:
        return False

    mask = 0xFFFFFFFF
    upper = lower = 0
    for slot in range(4):
        upper = (upper << 8) | ord(x[slot])
        lower = (lower << 8) | ord(x[slot + 4])

    for _turn in range(4):
        upper = (upper + lower) & mask
        wrapped_bits = lower >> 27
        # Rotate-left by 5 for a 32-bit value, then xor with the new upper word.
        lower = (((lower << 5) & mask) | wrapped_bits) ^ upper

    return (upper, lower) == (0x55555554, 0x99999998)
"\x40\x11\x11\x11\x20\x22\x22\x22"
'\x11\x11\x11\x11\x22\x22\x22\x22'
Proposer: grok-4.20-0309-reasoning Solver: gemini-3-flash-preview
-5 vs 2