← All Duels

gemini-3.1-pro-preview_vs_grok-4-fast-reasoning.jsonl — 10 puzzles

gemini-3.1-pro-preview
2
vs
grok-4-fast-reasoning
0
#1 Solver Failed
def mystery(x):
    """Return True when 6 * x equals x with its last digit moved to the front.

    Only values whose exact type is ``int`` and that are greater than 10 are
    considered; every other input yields False.
    """
    if type(x) is int and x > 10:
        digits = str(x)
        # Rotate right by one position: last digit first, then the rest.
        rotated = int(digits[-1] + digits[:-1])
        return rotated == 6 * x
    return False
101694915254237288135593220338983050847457627118644067796
1016949152542372881355932203389830508474576271186440677966
Proposer: gemini-3.1-pro-preview Solver: grok-4-fast-reasoning
1 vs 0
#2 Solved
def mystery(x):
    """Return True when 4 * x equals x with its last digit moved to the front.

    Inputs that are not exactly of type ``int``, or that do not exceed 9999,
    are rejected with False.
    """
    if type(x) is not int:
        return False
    if x <= 9999:
        return False
    text = str(x)
    tail, body = text[-1], text[:-1]
    return int(tail + body) == 4 * x
102564
102564
Proposer: grok-4-fast-reasoning Solver: gemini-3.1-pro-preview
1 vs 0
#3 Solver Failed
def mystery(x):
    """Return True when 3 * x equals x with its first two digits moved to the end.

    Only values whose exact type is ``int`` and that are at least 10**50 are
    considered; every other input yields False.
    """
    lower_bound = 10**50
    if type(x) is int and x >= lower_bound:
        digits = str(x)
        head, rest = digits[:2], digits[2:]
        # Left rotation by two positions.
        return int(rest + head) == x * 3
    return False
1030927835051546391752577319587628865979381443298969072164948536082474226804123711340206185567010
13 * (10**96 - 1) // 97
Proposer: gemini-3.1-pro-preview Solver: grok-4-fast-reasoning
2 vs 0
#4 Solved
def mystery(x):
    """Return True when the decimal digits of x, reversed, spell 9 * x.

    Inputs that are not exactly of type ``int``, or that are below 10**18,
    are rejected with False.
    """
    if type(x) is not int:
        return False
    if x < 10**18:
        return False
    mirrored = "".join(reversed(str(x)))
    return x * 9 == int(mirrored)
10891089108910891089
1099999999999999989
Proposer: grok-4-fast-reasoning Solver: gemini-3.1-pro-preview
2 vs 0
#5 Solved
def mystery(x):
    # Self-evaluating-string check: returns True when x is a string that,
    # evaluated as a Python expression, compares equal to x itself.
    # Documentation is kept in comments (not a docstring) so that nothing
    # new becomes reachable at runtime from the evaluated expression.

    # Only exact `str` inputs of at most 300 characters are considered.
    if type(x) is not str or len(x) > 300:
        return False
    # Reject any input containing a quote character or one of these
    # substrings.
    if any(c in x for c in ['"', "'", 'chr', 'eval', 'exec', 'import']):
        return False
    try:
        # NOTE(review): eval() runs caller-supplied text. It is called without
        # explicit namespaces, so the expression can see this function's
        # local `x` (the bare expression `x` therefore evaluates to the input).
        return eval(x) == x
    except:
        # Bare except: anything raised while evaluating or comparing is
        # treated as a rejection rather than propagated.
        return False
"x"
"(lambda t: bytes(t).decode() % (t,))((40, 108, 97, 109, 98, 100, 97, 32, 116, 58, 32, 98, 121, 116, 101, 115, 40, 116, 41, 46, 100, 101, 99, 111, 100, 101, 40, 41, 32, 37, 37, 32, 40, 116, 44, 41, 41, 40, 37, 115, 41))"
Proposer: gemini-3.1-pro-preview Solver: grok-4-fast-reasoning
2 vs 0
#6 Solved
def mystery(x):
    """Return True when doubling x equals x with its last digit moved to the front.

    Only values whose exact type is ``int`` and that are at least 10**17 are
    considered; every other input yields False.
    """
    if not (type(x) is int and x >= 10**17):
        return False
    shown = str(x)
    shifted = shown[-1:] + shown[:-1]
    return int(shifted) == x + x
105263157894736842
105263157894736842
Proposer: grok-4-fast-reasoning Solver: gemini-3.1-pro-preview
2 vs 0
#7 Solved
def mystery(x):
    """Return True when x ends in 6 and x**x agrees with x modulo 10**40.

    Inputs that are not exactly of type ``int``, or that do not exceed 10**40,
    are rejected with False.
    """
    modulus = 10**40
    if type(x) is not int or x <= modulus:
        return False
    # Both conditions must hold, so the cheap last-digit test can go first.
    if x % 10 != 6:
        return False
    return pow(x, x, modulus) == x % modulus
10**40 + 2**40 * pow(2**40, -1, 5**40)
pow(2**40, -1, 5**40) * 2**40 + 10**40
Proposer: gemini-3.1-pro-preview Solver: grok-4-fast-reasoning
2 vs 0
#8 Solved
def mystery(x):
    """Return True when 5 * x equals x with its last digit moved to the front.

    Only values whose exact type is ``int`` and that are at least 10**17 are
    considered; every other input yields False.
    """
    if type(x) is int:
        if x >= 10**17:
            digits = str(x)
            return int(f"{digits[-1]}{digits[:-1]}") == 5 * x
    return False
142857142857142857
142857142857142857
Proposer: grok-4-fast-reasoning Solver: gemini-3.1-pro-preview
2 vs 0
#9 Solved
def mystery(x):
    """Return True for a self-describing list of exactly 60 ints.

    The list passes when, for every index i in 0..59, the element at i equals
    two plus the number of times the value i occurs in the list. Inputs that
    are not exactly a ``list`` of length 60, or that contain any element
    whose exact type is not ``int``, yield False.
    """
    if type(x) is not list or len(x) != 60:
        return False
    for item in x:
        if type(item) is not int:
            return False
    for idx in range(60):
        if x[idx] != x.count(idx) + 2:
            return False
    return True
[2, 2, 60, 3] + [2] * 56
[2, 2, 58, 4, 3, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 3, 2]
Proposer: gemini-3.1-pro-preview Solver: grok-4-fast-reasoning
2 vs 0
#10 Solved
def mystery(x):
    """Return True when 3 * x equals x with its last digit moved to the front.

    Inputs that are not exactly of type ``int``, or that are below 10**27,
    are rejected with False.
    """
    threshold = 10**27
    if type(x) is not int or x < threshold:
        return False
    # Split the decimal digits into everything-but-last and the last one.
    *leading, last = str(x)
    return 3 * x == int(last + "".join(leading))
1034482758620689655172413793
1034482758620689655172413793
Proposer: grok-4-fast-reasoning Solver: gemini-3.1-pro-preview
2 vs 0