← All Duels

gemini-3.1-pro-preview_vs_grok-4.20-0309-reasoning.jsonl — 10 puzzles

gemini-3.1-pro-preview
0
vs
grok-4.20-0309-reasoning
-3
#1 Solved
def mystery(x):
    """Return whether ``x`` is an expression that evaluates to its own reversal.

    ``x`` must be exactly a ``str`` of at most 80 characters that contains
    none of the banned substrings. It is then evaluated as a Python
    expression; the result is truthy only when the evaluated value equals
    ``x`` reversed and ``x`` is not a palindrome. Any ``Exception`` raised
    during evaluation or comparison yields ``False``.
    """
    if type(x) is not str or len(x) > 80:
        return False

    # NOTE: the eval below can see this function's locals, so ``banned`` keeps
    # its name and list type, and no extra local is bound before eval runs.
    banned = ["eval", "exec", "import", "chr", "getattr", "compile", "sys", "open", "read"]
    if any(map(x.__contains__, banned)):
        return False

    try:
        # NOTE(review): eval on caller-supplied text; the substring filter
        # above is the only restriction applied before evaluation.
        outcome = eval(x)
        mirrored = x[::-1]
        return outcome == mirrored and x != mirrored
    except Exception:
        return False
"(lambda x:(x%repr(x))[::-1])('(lambda x:(x%%repr(x))[::-1])(%s)')"
"(lambda s: (s % s)[::-1])('(lambda s: (s %% s)[::-1])(%r)')"
Proposer: gemini-3.1-pro-preview Solver: grok-4.20-0309-reasoning
0 vs 0
#2 Sample Solution Wrong
def mystery(x):
    """Check a set of arithmetic identities on a very large float.

    Returns ``False`` unless ``x`` is exactly a ``float``, its string form is
    not ``nan``/``inf``/``-inf`` (case-insensitively), and ``abs(x)`` is at
    least ``1e300``. The remaining conditions are evaluated inside a ``try``;
    any ``Exception`` yields ``False``.

    Note: for a finite float ``x - x`` is ``0.0``, so ``1 / (x - x)`` raises
    ``ZeroDivisionError``, which is caught and reported as ``False``.
    """
    if type(x) is not float:
        return False

    rendered = str(x).lower()
    if rendered == "nan" or rendered == "inf" or rendered == "-inf":
        return False
    if abs(x) < 1e300:
        return False

    try:
        if (1 / (x - x)) != 0:
            return False
        if x != x * 2:
            return False
        return x != x + 1
    except Exception:
        return False
1e999
Proposer: grok-4.20-0309-reasoning Solver: gemini-3.1-pro-preview
0 vs -1
#3 Solved
def mystery(x):
    """Return whether ``x`` spells 1337 without using ASCII number characters.

    ``x`` must be exactly a ``str`` of length 4 that contains none of the
    characters in ``"0123456789.eE+- "``, must convert via ``float`` to
    ``1337.0``, and its code points must sum to 9638. A string that ``float``
    rejects yields ``False``.
    """
    if type(x) is not str:
        return False

    forbidden = "0123456789.eE+- "
    if not set(forbidden).isdisjoint(x) or len(x) != 4:
        return False

    try:
        parsed = float(x)
    except Exception:
        return False

    codepoint_total = sum(map(ord, x))
    return parsed == 1337.0 and codepoint_total == 9638
"१३३७"
'१३३७'
Proposer: gemini-3.1-pro-preview Solver: grok-4.20-0309-reasoning
0 vs -1
#4 Solved
def mystery(x):
    """Return whether the float ``x`` satisfies three absorbing identities.

    ``x`` must be exactly a ``float`` and ``abs(x)`` must not be below
    ``1e300``. The result is ``True`` only when ``x == x + 1``,
    ``1 / x == 0`` and ``x * x == x`` all hold; the checks run in that order
    and stop at the first failure. Any ``Exception`` yields ``False``.
    """
    if type(x) is not float or abs(x) < 1e300:
        return False

    try:
        if x != x + 1:
            return False
        if 1 / x != 0:
            return False
        return x * x == x
    except Exception:
        return False
float('inf')
1e309
Proposer: grok-4.20-0309-reasoning Solver: gemini-3.1-pro-preview
0 vs -1
#5 Sample Solution Wrong
def mystery(x):
    """Return ``True`` only if evaluating the identifier ``x`` is a SyntaxError.

    ``x`` must be exactly a ``str`` of at most 5 characters that
    ``str.isidentifier`` accepts and ``keyword.iskeyword`` rejects. The string
    is then evaluated: a ``SyntaxError`` yields ``True``; any other
    ``Exception``, or a successful evaluation, yields ``False``.
    """
    if type(x) is not str or len(x) > 5:
        return False

    import keyword
    if not x.isidentifier() or keyword.iskeyword(x):
        return False

    try:
        eval(x)
    except SyntaxError:
        return True
    except Exception:
        pass
    return False
"\uff49\uff46"
Proposer: gemini-3.1-pro-preview Solver: grok-4.20-0309-reasoning
-1 vs -1
#6 Sample Solution Wrong
def mystery(x):
    """Compare the reciprocal of a zero-valued float against zero.

    Returns ``False`` when ``x`` is not exactly a ``float`` or does not
    compare equal to 0. Otherwise returns ``(1 / x) < 0``.

    Note: the division runs only when ``x == 0`` and is not guarded, so it
    raises ``ZeroDivisionError`` to the caller.
    """
    if type(x) is float and x == 0:
        return (1 / x) < 0
    return False
-0.0
Proposer: grok-4.20-0309-reasoning Solver: gemini-3.1-pro-preview
-1 vs -2
#7 Solved
def mystery(x):
    """Return whether a 2-character string changes length under case mapping.

    ``x`` must be exactly a ``str`` of length 2 whose ``lower()`` and
    ``upper()`` forms each have length 3, and whose ``casefold()`` and
    ``title()`` forms each have length 4.
    """
    if type(x) is not str or len(x) != 2:
        return False

    observed_lengths = (
        len(x.lower()),
        len(x.upper()),
        len(x.casefold()),
        len(x.title()),
    )
    return observed_lengths == (3, 3, 4, 4)
"ßİ"
"\u00df\u0130"
Proposer: gemini-3.1-pro-preview Solver: grok-4.20-0309-reasoning
-1 vs -2
#8 Solved
def mystery(x):
    """Return whether the float ``x`` satisfies four identities.

    ``x`` must be exactly a ``float`` and ``abs(x)`` must not be below
    ``1e300``. The result is ``True`` only when ``x == x + 1``, ``x < 0``,
    ``x * x == -x`` and ``x / x != x / x`` all hold; the checks run in that
    order and stop at the first failure. Any ``Exception`` yields ``False``.
    """
    if type(x) is not float or abs(x) < 1e300:
        return False

    try:
        if x != x + 1:
            return False
        if not (x < 0):
            return False
        if x * x != -x:
            return False
        # True only when x / x is a value that is unequal to itself.
        return x / x != x / x
    except Exception:
        return False
float('-inf')
float('-inf')
Proposer: grok-4.20-0309-reasoning Solver: gemini-3.1-pro-preview
-1 vs -2
#9 Solver Failed
def mystery(x):
    """Return whether ``x`` is a non-integral float with one specific hash.

    ``x`` must be exactly a ``float`` for which ``is_integer()`` is false, and
    ``hash(x)`` must equal 623748548390934259.
    """
    is_fractional_float = type(x) is float and not x.is_integer()
    return is_fractional_float and hash(x) == 623748548390934259
(1 + 2251799813805811 / 2**52) * 2**-885
120563.2705078125
Proposer: gemini-3.1-pro-preview Solver: grok-4.20-0309-reasoning
0 vs -2
#10 Sample Solution Wrong
def mystery(x):
    """Check reciprocal-based identities on a float whose double is zero.

    Returns ``False`` unless ``x`` is exactly a ``float`` and ``x * 2 == 0``.
    The remaining conditions are evaluated in order inside a ``try``; any
    ``Exception`` yields ``False``.

    Note: every remaining condition that is reached divides by ``x``; a
    ``ZeroDivisionError`` from those divisions is caught and reported as
    ``False``.
    """
    if type(x) is not float or x * 2 != 0:
        return False

    try:
        if not (1 / x < 0):
            return False
        if x != -x:
            return False
        if not (x / x != x / x):
            return False
        return 1 + (1 / x) == (1 / x)
    except Exception:
        return False
-0.0
Proposer: grok-4.20-0309-reasoning Solver: gemini-3.1-pro-preview
0 vs -3