{
  "generated": "2026-05-05T18:35:18.447710+00:00",
  "models": [
    {
      "key": "claude-opus-4-7",
      "label": "Claude Opus 4.7",
      "run_id": "65ab97ac_cli_claude_claude-opus-4-7_20260427_183924",
      "model": "cli/claude:claude-opus-4-7",
      "judge_model": "cli/codex:gpt-5.5:high",
      "judge_models": [
        "cli/codex:gpt-5.5:high",
        "cli/claude:claude-opus-4-7",
        "cli/gemini:gemini-3.1-pro-preview"
      ],
      "language": "wgsl",
      "runtime": "wgpu"
    },
    {
      "key": "gemini-3.1-pro-preview",
      "label": "Gemini 3.1-pro-preview",
      "run_id": "f995b01e_cli_gemini_20260427_184028",
      "model": "cli/gemini",
      "judge_model": "cli/codex:gpt-5.5:high",
      "judge_models": [
        "cli/codex:gpt-5.5:high",
        "cli/claude:claude-opus-4-7",
        "cli/gemini:gemini-3.1-pro-preview"
      ],
      "language": "wgsl",
      "runtime": "wgpu"
    },
    {
      "key": "codex-gpt-5.5-high",
      "label": "Codex GPT-5.5 high",
      "run_id": "68ca3b4b_cli_codex_gpt-5.5_high_20260428_170724",
      "model": "cli/codex:gpt-5.5:high",
      "judge_model": "cli/codex:gpt-5.5:high",
      "judge_models": [
        "cli/codex:gpt-5.5:high",
        "cli/claude:claude-opus-4-7",
        "cli/gemini:gemini-3.1-pro-preview"
      ],
      "language": "wgsl",
      "runtime": "wgpu"
    }
  ],
  "problems": [
    "braid_word_reduction_ribbons",
    "cellular_potts_tissue_folding",
    "coxeter_reflection_kaleidoscope",
    "crystal_dislocation_network",
    "differentiable_rendering_ambiguity_landscape",
    "earthquake_fault_slip_wavefronts",
    "error_correcting_code_decoding_landscape",
    "fractal_drum_eigenfunctions",
    "mean_curvature_flow_surgery",
    "minimal_surface_knot_boundaries",
    "navier_stokes_vortex_reconnection",
    "ocean_eddy_lcs",
    "optimal_transport_mass_flow_tubes",
    "polyrhythm_phase_torus",
    "protein_folding_energy_landscape",
    "qec_threshold_phase_diagram",
    "reaction_diffusion_nonorientable_surfaces",
    "riemann_surface_covering_sheets",
    "spinodal_decomposition_3d",
    "topological_quantum_code_defect_braiding",
    "reproduce_image",
    "reproduce_image_andrew_pons",
    "reproduce_image_fabrice_villard",
    "reproduce_image_jason_leung",
    "reproduce_image_javier_penas",
    "reproduce_image_mark_basarab",
    "reproduce_image_photoholgic",
    "reproduce_image_rayul",
    "reproduce_image_sebastien_gabriel",
    "reproduce_image_tim_stief",
    "ackermann_function_growth",
    "al_khwarizmi_geometric_algebra",
    "apollonian_gasket",
    "apollonius_conic_sections",
    "archimedean_spiral_galaxy",
    "archimedes_spiral",
    "barbell_dumbbell_shape",
    "binary_tree_fractal",
    "brahmagupta_cyclic_quadrilaterals",
    "braided_rope",
    "butterfly_curve",
    "calabi_yau_manifold",
    "capsule_shape",
    "cardioid_limacon_collection",
    "catenoid_helicoid_minimal",
    "chinese_remainder_sunzi",
    "chinese_remainder_theorem",
    "chladni_patterns",
    "complex_analysis_stained_glass",
    "compound_polyhedra_stella_octangula",
    "conformal_spiral_mapping",
    "costa_minimal_surface",
    "crystal_lattice_diffraction",
    "cycloid_wave_patterns",
    "cylindrical_bend_deformation",
    "differential_equations_water",
    "dna_double_helix",
    "epicycloids",
    "euler_polyhedron_formula",
    "euler_polyhedron_platonic",
    "fermat_parabolic_spiral",
    "five_pointed_star_polygon",
    "fourier_architectural_blueprint",
    "fourier_epicycles_drawing",
    "fractal_loxodromic_patterns",
    "fractal_tree_2d",
    "gauss_complex_plane",
    "geometric_cube",
    "glass_sphere_red_core",
    "group_theory_kaleidoscope",
    "gyroscopic_nested_rings",
    "helical_twist_deformation",
    "helical_twisted_cube_advanced",
    "holographic_interference",
    "hopf_fibration_base_loops",
    "hyper_menger_cube_3sphere",
    "hyperbolic_heat_kernel",
    "icosahedron_wireframe",
    "klein_bottle",
    "lissajous_curve_garden",
    "logarithmic_spiral_motion",
    "lorenz_attractor_poincare",
    "loxodromic_sphere_spirals",
    "mandala_circles",
    "mandelbulb_fractal",
    "menger_cube_fractal",
    "menger_sponge_fractal",
    "mobius_strip_half_twist",
    "mobius_strip_triple_twist",
    "mobius_transformation_3d",
    "number_theory_music",
    "octagram_star_polygon",
    "parametric_gear_train",
    "parametric_seashell",
    "penrose_tiling_p3",
    "phyllotaxis_spiral",
    "poincare_disc",
    "prime_crystal_lattice",
    "probability_weather_patterns",
    "quantum_probability_waves",
    "ramanujan_mock_theta",
    "reaction_diffusion_patterns",
    "regular_dodecahedron",
    "regular_icosahedron",
    "regular_octahedron",
    "regular_tetrahedron",
    "riemann_surface_branch_cuts",
    "riemann_zeta_zeros",
    "rose_curves",
    "rotating_hypercube_projection",
    "rounded_box",
    "schwarzschild_black_hole",
    "sierpinski_tetrahedron",
    "sierpinski_triangle_6_iterations",
    "spherical_inversion_mapping",
    "spinning_gear_assembly",
    "spinning_vortex_funnel",
    "spiral_staircase_tower",
    "stella_octangula",
    "superformula_explorer",
    "taper_shear_transformation",
    "topology_fabric_texture",
    "torus_donut_parametric",
    "trefoil_alexander_polynomial",
    "trigonometric_mandalas",
    "truncated_icosahedron",
    "twisted_stellated_polyhedron",
    "voronoi_diagram",
    "wave_deformation_field",
    "weierstrass_function"
  ],
  "problem_categories": {
    "ackermann_function_growth": "Number Theory & Algebra",
    "al_khwarizmi_geometric_algebra": "Historical Mathematics",
    "apollonian_gasket": "Fractals & Recursion",
    "apollonius_conic_sections": "Historical Mathematics",
    "archimedean_spiral_galaxy": "Parametric Curves & Spirals",
    "archimedes_spiral": "Parametric Curves & Spirals",
    "barbell_dumbbell_shape": "Classical Geometry",
    "binary_tree_fractal": "Fractals & Recursion",
    "brahmagupta_cyclic_quadrilaterals": "Historical Mathematics",
    "braid_word_reduction_ribbons": "Frontier",
    "braided_rope": "Topology & Knot Theory",
    "butterfly_curve": "Parametric Curves & Spirals",
    "calabi_yau_manifold": "Differential Geometry",
    "capsule_shape": "Classical Geometry",
    "cardioid_limacon_collection": "Parametric Curves & Spirals",
    "catenoid_helicoid_minimal": "Differential Geometry",
    "cellular_potts_tissue_folding": "Frontier",
    "chinese_remainder_sunzi": "Historical Mathematics",
    "chinese_remainder_theorem": "Historical Mathematics",
    "chladni_patterns": "Physics & Simulations",
    "complex_analysis_stained_glass": "Complex Analysis & Visualization",
    "compound_polyhedra_stella_octangula": "Classical Geometry",
    "conformal_spiral_mapping": "Advanced Topology",
    "costa_minimal_surface": "Differential Geometry",
    "coxeter_reflection_kaleidoscope": "Frontier",
    "crystal_dislocation_network": "Frontier",
    "crystal_lattice_diffraction": "Deformations & Transformations",
    "cycloid_wave_patterns": "Parametric Curves & Spirals",
    "cylindrical_bend_deformation": "Deformations & Transformations",
    "differentiable_rendering_ambiguity_landscape": "Frontier",
    "differential_equations_water": "Cross-Disciplinary",
    "dna_double_helix": "Topology & Knot Theory",
    "earthquake_fault_slip_wavefronts": "Frontier",
    "epicycloids": "Parametric Curves & Spirals",
    "error_correcting_code_decoding_landscape": "Frontier",
    "euler_polyhedron_formula": "Historical Mathematics",
    "euler_polyhedron_platonic": "Historical Mathematics",
    "fermat_parabolic_spiral": "Parametric Curves & Spirals",
    "five_pointed_star_polygon": "Classical Geometry",
    "fourier_architectural_blueprint": "Cross-Disciplinary",
    "fourier_epicycles_drawing": "Cross-Disciplinary",
    "fractal_drum_eigenfunctions": "Frontier",
    "fractal_loxodromic_patterns": "Cross-Disciplinary",
    "fractal_tree_2d": "Fractals & Recursion",
    "gauss_complex_plane": "Historical Mathematics",
    "geometric_cube": "Classical Geometry",
    "glass_sphere_red_core": "Physics & Simulations",
    "group_theory_kaleidoscope": "Number Theory & Algebra",
    "gyroscopic_nested_rings": "Topology & Knot Theory",
    "helical_twist_deformation": "Deformations & Transformations",
    "helical_twisted_cube_advanced": "Topology & Knot Theory",
    "holographic_interference": "Complex Analysis & Visualization",
    "hopf_fibration_base_loops": "Differential Geometry",
    "hyper_menger_cube_3sphere": "Fractals & Recursion",
    "hyperbolic_heat_kernel": "Cross-Disciplinary",
    "icosahedron_wireframe": "Classical Geometry",
    "klein_bottle": "Differential Geometry",
    "lissajous_curve_garden": "Parametric Curves & Spirals",
    "logarithmic_spiral_motion": "Parametric Curves & Spirals",
    "lorenz_attractor_poincare": "Physics & Simulations",
    "loxodromic_sphere_spirals": "Physics & Simulations",
    "mandala_circles": "Fractals & Recursion",
    "mandelbulb_fractal": "Deformations & Transformations",
    "mean_curvature_flow_surgery": "Frontier",
    "menger_cube_fractal": "Fractals & Recursion",
    "menger_sponge_fractal": "Fractals & Recursion",
    "minimal_surface_knot_boundaries": "Frontier",
    "mobius_strip_half_twist": "Differential Geometry",
    "mobius_strip_triple_twist": "Differential Geometry",
    "mobius_transformation_3d": "Advanced Topology",
    "navier_stokes_vortex_reconnection": "Frontier",
    "number_theory_music": "Cross-Disciplinary",
    "ocean_eddy_lcs": "Frontier",
    "octagram_star_polygon": "Cross-Disciplinary",
    "optimal_transport_mass_flow_tubes": "Frontier",
    "parametric_gear_train": "Deformations & Transformations",
    "parametric_seashell": "Parametric Curves & Spirals",
    "penrose_tiling_p3": "Advanced Topology",
    "phyllotaxis_spiral": "Fractals & Recursion",
    "poincare_disc": "Advanced Topology",
    "polyrhythm_phase_torus": "Frontier",
    "prime_crystal_lattice": "Number Theory & Algebra",
    "probability_weather_patterns": "Cross-Disciplinary",
    "protein_folding_energy_landscape": "Frontier",
    "qec_threshold_phase_diagram": "Frontier",
    "quantum_probability_waves": "Complex Analysis & Visualization",
    "ramanujan_mock_theta": "Complex Analysis & Visualization",
    "reaction_diffusion_nonorientable_surfaces": "Frontier",
    "reaction_diffusion_patterns": "Physics & Simulations",
    "regular_dodecahedron": "Classical Geometry",
    "regular_icosahedron": "Classical Geometry",
    "regular_octahedron": "Classical Geometry",
    "regular_tetrahedron": "Classical Geometry",
    "reproduce_image": "Image Reproduction",
    "reproduce_image_andrew_pons": "Image Reproduction",
    "reproduce_image_fabrice_villard": "Image Reproduction",
    "reproduce_image_jason_leung": "Image Reproduction",
    "reproduce_image_javier_penas": "Image Reproduction",
    "reproduce_image_mark_basarab": "Image Reproduction",
    "reproduce_image_photoholgic": "Image Reproduction",
    "reproduce_image_rayul": "Image Reproduction",
    "reproduce_image_sebastien_gabriel": "Image Reproduction",
    "reproduce_image_tim_stief": "Image Reproduction",
    "riemann_surface_branch_cuts": "Historical Mathematics",
    "riemann_surface_covering_sheets": "Frontier",
    "riemann_zeta_zeros": "Complex Analysis & Visualization",
    "rose_curves": "Parametric Curves & Spirals",
    "rotating_hypercube_projection": "Advanced Topology",
    "rounded_box": "Classical Geometry",
    "schwarzschild_black_hole": "Physics & Simulations",
    "sierpinski_tetrahedron": "Fractals & Recursion",
    "sierpinski_triangle_6_iterations": "Fractals & Recursion",
    "spherical_inversion_mapping": "Advanced Topology",
    "spinning_gear_assembly": "Topology & Knot Theory",
    "spinning_vortex_funnel": "Physics & Simulations",
    "spinodal_decomposition_3d": "Frontier",
    "spiral_staircase_tower": "Topology & Knot Theory",
    "stella_octangula": "Classical Geometry",
    "superformula_explorer": "Parametric Curves & Spirals",
    "taper_shear_transformation": "Deformations & Transformations",
    "topological_quantum_code_defect_braiding": "Frontier",
    "topology_fabric_texture": "Cross-Disciplinary",
    "torus_donut_parametric": "Classical Geometry",
    "trefoil_alexander_polynomial": "Cross-Disciplinary",
    "trigonometric_mandalas": "Deformations & Transformations",
    "truncated_icosahedron": "Classical Geometry",
    "twisted_stellated_polyhedron": "Advanced Topology",
    "voronoi_diagram": "Deformations & Transformations",
    "wave_deformation_field": "Physics & Simulations",
    "weierstrass_function": "Complex Analysis & Visualization"
  },
  "problem_groups": {
    "Frontier": [
      "braid_word_reduction_ribbons",
      "cellular_potts_tissue_folding",
      "coxeter_reflection_kaleidoscope",
      "crystal_dislocation_network",
      "differentiable_rendering_ambiguity_landscape",
      "earthquake_fault_slip_wavefronts",
      "error_correcting_code_decoding_landscape",
      "fractal_drum_eigenfunctions",
      "mean_curvature_flow_surgery",
      "minimal_surface_knot_boundaries",
      "navier_stokes_vortex_reconnection",
      "ocean_eddy_lcs",
      "optimal_transport_mass_flow_tubes",
      "polyrhythm_phase_torus",
      "protein_folding_energy_landscape",
      "qec_threshold_phase_diagram",
      "reaction_diffusion_nonorientable_surfaces",
      "riemann_surface_covering_sheets",
      "spinodal_decomposition_3d",
      "topological_quantum_code_defect_braiding"
    ],
    "Reconstruction": [
      "reproduce_image",
      "reproduce_image_andrew_pons",
      "reproduce_image_fabrice_villard",
      "reproduce_image_jason_leung",
      "reproduce_image_javier_penas",
      "reproduce_image_mark_basarab",
      "reproduce_image_photoholgic",
      "reproduce_image_rayul",
      "reproduce_image_sebastien_gabriel",
      "reproduce_image_tim_stief"
    ],
    "Rest": [
      "ackermann_function_growth",
      "al_khwarizmi_geometric_algebra",
      "apollonian_gasket",
      "apollonius_conic_sections",
      "archimedean_spiral_galaxy",
      "archimedes_spiral",
      "barbell_dumbbell_shape",
      "binary_tree_fractal",
      "brahmagupta_cyclic_quadrilaterals",
      "braided_rope",
      "butterfly_curve",
      "calabi_yau_manifold",
      "capsule_shape",
      "cardioid_limacon_collection",
      "catenoid_helicoid_minimal",
      "chinese_remainder_sunzi",
      "chinese_remainder_theorem",
      "chladni_patterns",
      "complex_analysis_stained_glass",
      "compound_polyhedra_stella_octangula",
      "conformal_spiral_mapping",
      "costa_minimal_surface",
      "crystal_lattice_diffraction",
      "cycloid_wave_patterns",
      "cylindrical_bend_deformation",
      "differential_equations_water",
      "dna_double_helix",
      "epicycloids",
      "euler_polyhedron_formula",
      "euler_polyhedron_platonic",
      "fermat_parabolic_spiral",
      "five_pointed_star_polygon",
      "fourier_architectural_blueprint",
      "fourier_epicycles_drawing",
      "fractal_loxodromic_patterns",
      "fractal_tree_2d",
      "gauss_complex_plane",
      "geometric_cube",
      "glass_sphere_red_core",
      "group_theory_kaleidoscope",
      "gyroscopic_nested_rings",
      "helical_twist_deformation",
      "helical_twisted_cube_advanced",
      "holographic_interference",
      "hopf_fibration_base_loops",
      "hyper_menger_cube_3sphere",
      "hyperbolic_heat_kernel",
      "icosahedron_wireframe",
      "klein_bottle",
      "lissajous_curve_garden",
      "logarithmic_spiral_motion",
      "lorenz_attractor_poincare",
      "loxodromic_sphere_spirals",
      "mandala_circles",
      "mandelbulb_fractal",
      "menger_cube_fractal",
      "menger_sponge_fractal",
      "mobius_strip_half_twist",
      "mobius_strip_triple_twist",
      "mobius_transformation_3d",
      "number_theory_music",
      "octagram_star_polygon",
      "parametric_gear_train",
      "parametric_seashell",
      "penrose_tiling_p3",
      "phyllotaxis_spiral",
      "poincare_disc",
      "prime_crystal_lattice",
      "probability_weather_patterns",
      "quantum_probability_waves",
      "ramanujan_mock_theta",
      "reaction_diffusion_patterns",
      "regular_dodecahedron",
      "regular_icosahedron",
      "regular_octahedron",
      "regular_tetrahedron",
      "riemann_surface_branch_cuts",
      "riemann_zeta_zeros",
      "rose_curves",
      "rotating_hypercube_projection",
      "rounded_box",
      "schwarzschild_black_hole",
      "sierpinski_tetrahedron",
      "sierpinski_triangle_6_iterations",
      "spherical_inversion_mapping",
      "spinning_gear_assembly",
      "spinning_vortex_funnel",
      "spiral_staircase_tower",
      "stella_octangula",
      "superformula_explorer",
      "taper_shear_transformation",
      "topology_fabric_texture",
      "torus_donut_parametric",
      "trefoil_alexander_polynomial",
      "trigonometric_mandalas",
      "truncated_icosahedron",
      "twisted_stellated_polyhedron",
      "voronoi_diagram",
      "wave_deformation_field",
      "weierstrass_function"
    ]
  },
  "scores": {
    "braid_word_reduction_ribbons": {
      "claude-opus-4-7": {
        "scores": [
          83,
          86,
          82,
          86,
          85
        ],
        "total": 422,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            78,
            84,
            76,
            83,
            74
          ],
          "cli/claude:claude-opus-4-7": [
            72,
            74,
            70,
            76,
            80
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          46,
          64,
          35,
          69,
          60
        ],
        "total": 274,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            56,
            82,
            43,
            78,
            70
          ],
          "cli/claude:claude-opus-4-7": [
            62,
            64,
            52,
            68,
            74
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            20,
            45,
            10,
            60,
            35
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "cellular_potts_tissue_folding": {
      "claude-opus-4-7": {
        "scores": [
          82,
          78,
          82,
          78,
          84
        ],
        "total": 404,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            84,
            76,
            82,
            78,
            80
          ],
          "cli/claude:claude-opus-4-7": [
            65,
            62,
            68,
            60,
            72
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            98,
            96,
            97,
            97,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          10,
          32,
          9,
          16,
          13
        ],
        "total": 80,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            12,
            45,
            7,
            18,
            10
          ],
          "cli/claude:claude-opus-4-7": [
            8,
            22,
            9,
            15,
            15
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            30,
            10,
            15,
            15
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          64,
          64,
          64,
          64,
          69
        ],
        "total": 325,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            82,
            84,
            79,
            81,
            74
          ],
          "cli/claude:claude-opus-4-7": [
            70,
            74,
            68,
            72,
            72
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            40,
            35,
            45,
            40,
            60
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "coxeter_reflection_kaleidoscope": {
      "claude-opus-4-7": {
        "scores": [
          85,
          85,
          85,
          84,
          83
        ],
        "total": 422,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            78,
            76,
            80,
            74,
            70
          ],
          "cli/claude:claude-opus-4-7": [
            78,
            80,
            76,
            78,
            80
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          3,
          6,
          2,
          5,
          7
        ],
        "total": 23,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            5,
            8,
            3,
            7,
            6
          ],
          "cli/claude:claude-opus-4-7": [
            3,
            5,
            2,
            3,
            4
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            1,
            5,
            1,
            5,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          4,
          5,
          4,
          4,
          5
        ],
        "total": 22,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            3,
            5,
            2,
            3,
            2
          ],
          "cli/claude:claude-opus-4-7": [
            4,
            5,
            4,
            4,
            4
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            5,
            5,
            5,
            5,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "crystal_dislocation_network": {
      "claude-opus-4-7": {
        "scores": [
          87,
          87,
          85,
          84,
          88
        ],
        "total": 431,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            84,
            86,
            82,
            79,
            81
          ],
          "cli/claude:claude-opus-4-7": [
            80,
            76,
            80,
            76,
            83
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            96,
            100,
            92,
            98,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          76,
          77,
          72,
          68,
          72
        ],
        "total": 365,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            76,
            70,
            69,
            66
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            62,
            60,
            58,
            65
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            88,
            92,
            85,
            78,
            85
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          60,
          44,
          57,
          45,
          70
        ],
        "total": 276,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            68,
            58,
            66,
            55,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            48,
            40,
            45,
            40,
            52
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            65,
            35,
            60,
            40,
            85
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "differentiable_rendering_ambiguity_landscape": {
      "claude-opus-4-7": {
        "scores": [
          13,
          18,
          9,
          10,
          10
        ],
        "total": 60,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            12,
            28,
            10,
            14,
            12
          ],
          "cli/claude:claude-opus-4-7": [
            18,
            15,
            12,
            10,
            12
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            5,
            5,
            5
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          68,
          64,
          68,
          61,
          72
        ],
        "total": 333,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            61,
            70,
            58,
            70
          ],
          "cli/claude:claude-opus-4-7": [
            38,
            42,
            40,
            38,
            52
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            90,
            95,
            88,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          43,
          54,
          45,
          52,
          56
        ],
        "total": 250,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            78,
            73,
            84,
            68,
            70
          ],
          "cli/claude:claude-opus-4-7": [
            42,
            40,
            40,
            38,
            48
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            50,
            10,
            50,
            50
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "earthquake_fault_slip_wavefronts": {
      "claude-opus-4-7": {
        "scores": [
          32,
          64,
          29,
          36,
          32
        ],
        "total": 193,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            48,
            66,
            38,
            45,
            42
          ],
          "cli/claude:claude-opus-4-7": [
            22,
            40,
            20,
            28,
            30
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            25,
            85,
            30,
            35,
            25
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          75,
          73,
          77,
          67,
          76
        ],
        "total": 368,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            77,
            79,
            78,
            72,
            70
          ],
          "cli/claude:claude-opus-4-7": [
            58,
            55,
            62,
            50,
            72
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            90,
            85,
            90,
            80,
            85
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          74,
          79,
          74,
          75,
          80
        ],
        "total": 382,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            78,
            82,
            76,
            80,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            48,
            58,
            50,
            52,
            70
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            96,
            95,
            94,
            98
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "error_correcting_code_decoding_landscape": {
      "claude-opus-4-7": {
        "scores": [
          85,
          83,
          85,
          82,
          88
        ],
        "total": 423,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            82,
            78,
            80,
            76,
            78
          ],
          "cli/claude:claude-opus-4-7": [
            78,
            72,
            80,
            72,
            85
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            96,
            98,
            96,
            98,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          77,
          59,
          80,
          61,
          78
        ],
        "total": 355,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            70,
            58,
            74,
            56,
            68
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            55,
            70,
            58,
            72
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            92,
            65,
            95,
            68,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          70,
          73,
          74,
          62,
          62
        ],
        "total": 341,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            78,
            82,
            70,
            73,
            68
          ],
          "cli/claude:claude-opus-4-7": [
            78,
            72,
            76,
            68,
            78
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            55,
            65,
            75,
            45,
            40
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "fractal_drum_eigenfunctions": {
      "claude-opus-4-7": {
        "scores": [
          81,
          73,
          83,
          73,
          82
        ],
        "total": 392,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            76,
            72,
            80,
            70,
            68
          ],
          "cli/claude:claude-opus-4-7": [
            76,
            71,
            74,
            70,
            82
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            90,
            75,
            95,
            80,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          60,
          55,
          58,
          55,
          68
        ],
        "total": 296,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            62,
            78,
            55,
            72,
            63
          ],
          "cli/claude:claude-opus-4-7": [
            32,
            38,
            28,
            34,
            40
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            50,
            90,
            60,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      }
    },
    "mean_curvature_flow_surgery": {
      "claude-opus-4-7": {
        "scores": [
          15,
          19,
          17,
          21,
          26
        ],
        "total": 98,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            8,
            18,
            5,
            12,
            8
          ],
          "cli/claude:claude-opus-4-7": [
            22,
            28,
            20,
            27,
            30
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            15,
            10,
            25,
            25,
            40
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          82,
          83,
          83,
          82,
          82
        ],
        "total": 412,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            80,
            82,
            78,
            82,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            67,
            72,
            66,
            74
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            98,
            100,
            98,
            98,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          51,
          47,
          50,
          47,
          62
        ],
        "total": 257,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            68,
            70,
            66,
            71
          ],
          "cli/claude:claude-opus-4-7": [
            30,
            32,
            26,
            30,
            45
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            50,
            40,
            55,
            45,
            70
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "minimal_surface_knot_boundaries": {
      "claude-opus-4-7": {
        "scores": [
          8,
          12,
          6,
          7,
          13
        ],
        "total": 46,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            10,
            18,
            4,
            6,
            12
          ],
          "cli/claude:claude-opus-4-7": [
            5,
            8,
            5,
            6,
            12
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            10,
            15
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          32,
          31,
          25,
          27,
          48
        ],
        "total": 163,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            43,
            42,
            31,
            39,
            48
          ],
          "cli/claude:claude-opus-4-7": [
            32,
            25,
            28,
            22,
            35
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            20,
            25,
            15,
            20,
            60
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          45,
          46,
          37,
          40,
          63
        ],
        "total": 231,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            66,
            52,
            61,
            60
          ],
          "cli/claude:claude-opus-4-7": [
            22,
            28,
            20,
            25,
            40
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            55,
            45,
            40,
            35,
            90
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "navier_stokes_vortex_reconnection": {
      "claude-opus-4-7": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          8,
          13,
          6,
          7,
          7
        ],
        "total": 41,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            5,
            18,
            2,
            4,
            3
          ],
          "cli/claude:claude-opus-4-7": [
            8,
            10,
            5,
            8,
            7
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          75,
          73,
          74,
          68,
          74
        ],
        "total": 364,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            74,
            82,
            68,
            73,
            70
          ],
          "cli/claude:claude-opus-4-7": [
            62,
            60,
            58,
            60,
            68
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            90,
            78,
            95,
            72,
            85
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "ocean_eddy_lcs": {
      "claude-opus-4-7": {
        "scores": [
          77,
          73,
          77,
          70,
          79
        ],
        "total": 376,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            68,
            70,
            62,
            64
          ],
          "cli/claude:claude-opus-4-7": [
            62,
            55,
            62,
            52,
            72
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            98,
            95,
            98,
            95,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          84,
          79,
          85,
          79,
          82
        ],
        "total": 409,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            76,
            72,
            78,
            70,
            68
          ],
          "cli/claude:claude-opus-4-7": [
            78,
            70,
            78,
            72,
            78
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            98,
            96,
            98,
            94,
            99
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          72,
          69,
          74,
          66,
          70
        ],
        "total": 351,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            74,
            73,
            78,
            70,
            66
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            58,
            48,
            54,
            60
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            90,
            75,
            95,
            75,
            85
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "optimal_transport_mass_flow_tubes": {
      "claude-opus-4-7": {
        "scores": [
          12,
          16,
          9,
          10,
          11
        ],
        "total": 58,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            16,
            24,
            8,
            10,
            9
          ],
          "cli/claude:claude-opus-4-7": [
            10,
            15,
            8,
            9,
            10
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            10,
            15
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          11,
          18,
          7,
          8,
          9
        ],
        "total": 53,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            18,
            35,
            8,
            10,
            12
          ],
          "cli/claude:claude-opus-4-7": [
            4,
            8,
            3,
            3,
            5
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          70,
          64,
          75,
          59,
          71
        ],
        "total": 339,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            84,
            76,
            83,
            72,
            78
          ],
          "cli/claude:claude-opus-4-7": [
            42,
            45,
            48,
            40,
            55
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            70,
            95,
            65,
            80
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "polyrhythm_phase_torus": {
      "claude-opus-4-7": {
        "scores": [
          80,
          77,
          81,
          74,
          81
        ],
        "total": 393,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            84,
            88,
            82,
            86,
            76
          ],
          "cli/claude:claude-opus-4-7": [
            62,
            55,
            60,
            50,
            72
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            88,
            100,
            85,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          57,
          67,
          47,
          59,
          62
        ],
        "total": 292,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            55,
            68,
            42,
            58,
            52
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            48,
            45,
            45,
            58
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            65,
            85,
            55,
            75,
            75
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          87,
          82,
          89,
          80,
          88
        ],
        "total": 426,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            84,
            80,
            88,
            77,
            78
          ],
          "cli/claude:claude-opus-4-7": [
            83,
            82,
            80,
            78,
            86
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            85,
            100,
            85,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "protein_folding_energy_landscape": {
      "claude-opus-4-7": {
        "scores": [
          45,
          24,
          40,
          25,
          26
        ],
        "total": 160,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            37,
            42,
            34,
            35,
            24
          ],
          "cli/claude:claude-opus-4-7": [
            14,
            16,
            22,
            14,
            18
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            15,
            65,
            25,
            35
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          46,
          58,
          57,
          56,
          52
        ],
        "total": 269,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            67,
            74,
            62,
            70,
            55
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            50,
            58,
            48,
            50
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            20,
            50,
            50,
            50,
            50
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          59,
          75,
          57,
          76,
          61
        ],
        "total": 328,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            84,
            68,
            82,
            70
          ],
          "cli/claude:claude-opus-4-7": [
            55,
            58,
            48,
            62,
            58
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            50,
            82,
            55,
            85,
            55
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "qec_threshold_phase_diagram": {
      "claude-opus-4-7": {
        "scores": [
          72,
          78,
          79,
          67,
          65
        ],
        "total": 361,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            78,
            78,
            70,
            58
          ],
          "cli/claude:claude-opus-4-7": [
            58,
            62,
            60,
            55,
            58
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            95,
            98,
            75,
            80
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          86,
          84,
          86,
          84,
          86
        ],
        "total": 426,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            86,
            82,
            88,
            84,
            76
          ],
          "cli/claude:claude-opus-4-7": [
            74,
            76,
            72,
            74,
            82
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            98,
            95,
            98,
            95,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "reaction_diffusion_nonorientable_surfaces": {
      "claude-opus-4-7": {
        "scores": [
          32,
          68,
          24,
          58,
          42
        ],
        "total": 224,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            42,
            73,
            34,
            59,
            45
          ],
          "cli/claude:claude-opus-4-7": [
            28,
            50,
            22,
            40,
            45
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            25,
            80,
            15,
            75,
            35
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          47,
          73,
          49,
          69,
          72
        ],
        "total": 310,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            76,
            52,
            70,
            60
          ],
          "cli/claude:claude-opus-4-7": [
            38,
            52,
            34,
            48,
            62
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            45,
            90,
            60,
            90,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          61,
          58,
          65,
          56,
          78
        ],
        "total": 318,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            64,
            67,
            66,
            65,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            55,
            66,
            48,
            58,
            68
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            65,
            40,
            80,
            45,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "riemann_surface_covering_sheets": {
      "claude-opus-4-7": {
        "scores": [
          80,
          79,
          74,
          77,
          81
        ],
        "total": 391,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            74,
            78,
            67,
            76,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            72,
            62,
            62,
            60,
            74
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            98,
            93,
            96,
            98
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          38,
          39,
          41,
          41,
          51
        ],
        "total": 210,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            68,
            70,
            62,
            66,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            30,
            32,
            30,
            32,
            40
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            15,
            15,
            30,
            25,
            40
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "spinodal_decomposition_3d": {
      "claude-opus-4-7": {
        "scores": [
          83,
          79,
          86,
          79,
          77
        ],
        "total": 404,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            82,
            78,
            81,
            77,
            80
          ],
          "cli/claude:claude-opus-4-7": [
            74,
            62,
            78,
            66,
            70
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            92,
            96,
            98,
            95,
            80
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          64,
          54,
          57,
          50,
          73
        ],
        "total": 298,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            60,
            45,
            48,
            62
          ],
          "cli/claude:claude-opus-4-7": [
            48,
            42,
            40,
            38,
            68
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            60,
            85,
            65,
            90
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          69,
          52,
          62,
          52,
          79
        ],
        "total": 314,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            78,
            72,
            76,
            70,
            73
          ],
          "cli/claude:claude-opus-4-7": [
            58,
            44,
            56,
            46,
            68
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            70,
            40,
            55,
            40,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "topological_quantum_code_defect_braiding": {
      "claude-opus-4-7": {
        "scores": [
          68,
          76,
          63,
          68,
          57
        ],
        "total": 332,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            76,
            81,
            74,
            78,
            66
          ],
          "cli/claude:claude-opus-4-7": [
            42,
            56,
            28,
            40,
            26
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            92,
            88,
            85,
            78
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          76,
          71,
          79,
          68,
          72
        ],
        "total": 366,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            82,
            84,
            80,
            78,
            70
          ],
          "cli/claude:claude-opus-4-7": [
            55,
            48,
            62,
            50,
            62
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            90,
            80,
            95,
            75,
            85
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          71,
          72,
          70,
          73,
          71
        ],
        "total": 357,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            76,
            84,
            72,
            82,
            70
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            56,
            54,
            60,
            62
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            75,
            85,
            78,
            80
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "reproduce_image": {
      "claude-opus-4-7": {
        "scores": [
          47,
          56,
          63,
          67,
          40
        ],
        "total": 273,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            42,
            55,
            58,
            63,
            35
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            74,
            72,
            72,
            64
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            30,
            40,
            60,
            65,
            20
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          45,
          60,
          59,
          59,
          43
        ],
        "total": 266,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            74,
            78,
            76,
            70
          ],
          "cli/claude:claude-opus-4-7": [
            8,
            52,
            15,
            40,
            5
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            55,
            55,
            85,
            60,
            55
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "reproduce_image_andrew_pons": {
      "claude-opus-4-7": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "gemini-3.1-pro-preview": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          39,
          48,
          48,
          52,
          38
        ],
        "total": 225,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            36,
            47,
            42,
            50,
            32
          ],
          "cli/claude:claude-opus-4-7": [
            20,
            38,
            18,
            32,
            18
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            60,
            60,
            85,
            75,
            65
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "reproduce_image_fabrice_villard": {
      "claude-opus-4-7": {
        "scores": [
          43,
          52,
          64,
          53,
          42
        ],
        "total": 254,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            70,
            63,
            68,
            55
          ],
          "cli/claude:claude-opus-4-7": [
            40,
            55,
            38,
            52,
            45
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            30,
            30,
            90,
            40,
            25
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          20,
          24,
          14,
          24,
          9
        ],
        "total": 91,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            5,
            12,
            15,
            10,
            4
          ],
          "cli/claude:claude-opus-4-7": [
            5,
            10,
            6,
            8,
            5
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            50,
            50,
            20,
            54,
            19
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          23,
          28,
          31,
          29,
          25
        ],
        "total": 136,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            28,
            35,
            42,
            34,
            25
          ],
          "cli/claude:claude-opus-4-7": [
            22,
            30,
            20,
            28,
            25
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            20,
            20,
            30,
            25,
            25
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "reproduce_image_jason_leung": {
      "claude-opus-4-7": {
        "scores": [
          19,
          38,
          31,
          29,
          20
        ],
        "total": 137,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            20,
            58,
            32,
            42,
            24
          ],
          "cli/claude:claude-opus-4-7": [
            18,
            32,
            22,
            25,
            20
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            20,
            25,
            40,
            20,
            15
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          37,
          51,
          61,
          45,
          31
        ],
        "total": 225,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            38,
            61,
            48,
            58,
            32
          ],
          "cli/claude:claude-opus-4-7": [
            38,
            52,
            50,
            48,
            35
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            35,
            40,
            85,
            30,
            25
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          29,
          53,
          32,
          40,
          27
        ],
        "total": 181,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            34,
            55,
            42,
            48,
            30
          ],
          "cli/claude:claude-opus-4-7": [
            22,
            40,
            20,
            32,
            25
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            30,
            65,
            35,
            40,
            25
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "reproduce_image_javier_penas": {
      "claude-opus-4-7": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          31,
          38,
          56,
          43,
          26
        ],
        "total": 194,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            30,
            36,
            45,
            40,
            24
          ],
          "cli/claude:claude-opus-4-7": [
            32,
            42,
            34,
            43,
            28
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            30,
            35,
            90,
            45,
            25
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          37,
          38,
          53,
          39,
          32
        ],
        "total": 199,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            25,
            42,
            55,
            50,
            24
          ],
          "cli/claude:claude-opus-4-7": [
            32,
            38,
            30,
            36,
            32
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            55,
            35,
            75,
            30,
            40
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "reproduce_image_mark_basarab": {
      "claude-opus-4-7": {
        "scores": [
          40,
          40,
          48,
          42,
          44
        ],
        "total": 214,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            48,
            43,
            55,
            46,
            42
          ],
          "cli/claude:claude-opus-4-7": [
            42,
            48,
            50,
            45,
            55
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            30,
            30,
            40,
            35,
            35
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          42,
          39,
          55,
          41,
          42
        ],
        "total": 219,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            47,
            45,
            60,
            48,
            43
          ],
          "cli/claude:claude-opus-4-7": [
            35,
            38,
            40,
            35,
            42
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            45,
            35,
            65,
            40,
            40
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          27,
          32,
          26,
          32,
          27
        ],
        "total": 144,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            35,
            47,
            39,
            46,
            38
          ],
          "cli/claude:claude-opus-4-7": [
            22,
            28,
            20,
            26,
            22
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            25,
            20,
            20,
            25,
            20
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "reproduce_image_photoholgic": {
      "claude-opus-4-7": {
        "scores": [
          34,
          38,
          39,
          40,
          33
        ],
        "total": 184,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            35,
            42,
            38,
            45,
            36
          ],
          "cli/claude:claude-opus-4-7": [
            42,
            48,
            38,
            46,
            44
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            25,
            25,
            40,
            30,
            20
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          52,
          58,
          57,
          58,
          59
        ],
        "total": 284,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            42,
            58,
            50,
            56,
            44
          ],
          "cli/claude:claude-opus-4-7": [
            45,
            55,
            40,
            52,
            48
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            70,
            60,
            80,
            65,
            85
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          47,
          49,
          57,
          53,
          53
        ],
        "total": 259,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            52,
            61,
            55,
            60,
            54
          ],
          "cli/claude:claude-opus-4-7": [
            30,
            42,
            32,
            45,
            34
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            60,
            45,
            85,
            55,
            70
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "reproduce_image_rayul": {
      "claude-opus-4-7": {
        "scores": [
          58,
          64,
          65,
          63,
          56
        ],
        "total": 306,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            43,
            50,
            58,
            48,
            42
          ],
          "cli/claude:claude-opus-4-7": [
            45,
            58,
            48,
            55,
            45
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            85,
            90,
            85,
            80
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          58,
          58,
          63,
          61,
          55
        ],
        "total": 295,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            43,
            56,
            58,
            57,
            47
          ],
          "cli/claude:claude-opus-4-7": [
            40,
            52,
            45,
            50,
            38
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            90,
            65,
            85,
            75,
            80
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      }
    },
    "reproduce_image_sebastien_gabriel": {
      "claude-opus-4-7": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "gemini-3.1-pro-preview": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          46,
          56,
          52,
          50,
          41
        ],
        "total": 245,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            55,
            68,
            72,
            64,
            52
          ],
          "cli/claude:claude-opus-4-7": [
            42,
            55,
            45,
            50,
            40
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            40,
            45,
            40,
            35,
            30
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "reproduce_image_tim_stief": {
      "claude-opus-4-7": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          42,
          31,
          49,
          35,
          47
        ],
        "total": 204,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            45,
            38,
            50,
            42,
            48
          ],
          "cli/claude:claude-opus-4-7": [
            30,
            25,
            32,
            22,
            38
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            50,
            30,
            65,
            40,
            55
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          33,
          30,
          39,
          31,
          30
        ],
        "total": 163,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            38,
            43,
            48,
            42,
            35
          ],
          "cli/claude:claude-opus-4-7": [
            26,
            28,
            30,
            27,
            25
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            35,
            20,
            40,
            25,
            30
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "ackermann_function_growth": {
      "claude-opus-4-7": {
        "scores": [
          56,
          53,
          24,
          54,
          55
        ],
        "total": 242,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            36,
            42,
            16,
            45,
            39
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            58,
            32,
            62,
            55
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            80,
            60,
            25,
            55,
            70
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          40,
          45,
          36,
          44,
          38
        ],
        "total": 203,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            28,
            46,
            15,
            35,
            30
          ],
          "cli/claude:claude-opus-4-7": [
            22,
            30,
            18,
            28,
            20
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            70,
            60,
            75,
            70,
            65
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          50,
          71,
          31,
          58,
          59
        ],
        "total": 269,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            43,
            68,
            18,
            58,
            43
          ],
          "cli/claude:claude-opus-4-7": [
            42,
            55,
            30,
            50,
            48
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            65,
            90,
            45,
            65,
            85
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "al_khwarizmi_geometric_algebra": {
      "claude-opus-4-7": {
        "scores": [
          19,
          60,
          26,
          45,
          22
        ],
        "total": 172,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            18,
            72,
            22,
            34,
            20
          ],
          "cli/claude:claude-opus-4-7": [
            8,
            32,
            5,
            30,
            6
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            30,
            75,
            50,
            70,
            40
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          5,
          14,
          3,
          8,
          3
        ],
        "total": 33,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            8,
            28,
            5,
            10,
            4
          ],
          "cli/claude:claude-opus-4-7": [
            5,
            10,
            3,
            8,
            4
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            2,
            5,
            1,
            5,
            1
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          23,
          44,
          20,
          30,
          20
        ],
        "total": 137,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            44,
            67,
            39,
            50,
            35
          ],
          "cli/claude:claude-opus-4-7": [
            14,
            26,
            10,
            16,
            10
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            40,
            10,
            25,
            15
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "apollonian_gasket": {
      "claude-opus-4-7": {
        "scores": [
          29,
          51,
          18,
          30,
          30
        ],
        "total": 158,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            38,
            62,
            22,
            39,
            43
          ],
          "cli/claude:claude-opus-4-7": [
            28,
            52,
            22,
            32,
            26
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            20,
            40,
            10,
            20,
            20
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          39,
          82,
          31,
          56,
          42
        ],
        "total": 250,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            45,
            88,
            42,
            63,
            49
          ],
          "cli/claude:claude-opus-4-7": [
            38,
            62,
            30,
            40,
            32
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            35,
            95,
            20,
            65,
            45
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          19,
          47,
          11,
          22,
          16
        ],
        "total": 115,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            35,
            78,
            18,
            42,
            28
          ],
          "cli/claude:claude-opus-4-7": [
            8,
            22,
            5,
            5,
            6
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            15,
            40,
            10,
            20,
            15
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "apollonius_conic_sections": {
      "claude-opus-4-7": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          59,
          64,
          66,
          61,
          45
        ],
        "total": 295,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            70,
            78,
            62,
            73,
            48
          ],
          "cli/claude:claude-opus-4-7": [
            28,
            38,
            40,
            30,
            22
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            80,
            75,
            95,
            80,
            65
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          77,
          77,
          80,
          79,
          77
        ],
        "total": 390,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            78,
            73,
            82,
            74
          ],
          "cli/claude:claude-opus-4-7": [
            62,
            55,
            68,
            58,
            58
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            98,
            98,
            98,
            98,
            98
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "archimedean_spiral_galaxy": {
      "claude-opus-4-7": {
        "scores": [
          69,
          71,
          68,
          61,
          66
        ],
        "total": 335,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            76,
            52,
            48,
            54
          ],
          "cli/claude:claude-opus-4-7": [
            62,
            55,
            68,
            50,
            58
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            88,
            82,
            85,
            84,
            86
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          86,
          83,
          89,
          77,
          83
        ],
        "total": 418,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            85,
            82,
            88,
            72,
            78
          ],
          "cli/claude:claude-opus-4-7": [
            74,
            68,
            78,
            58,
            70
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          2,
          7,
          1,
          2,
          2
        ],
        "total": 14,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            4,
            18,
            1,
            3,
            2
          ],
          "cli/claude:claude-opus-4-7": [
            2,
            3,
            2,
            3,
            2
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            1,
            1,
            1,
            1,
            1
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "archimedes_spiral": {
      "claude-opus-4-7": {
        "scores": [
          21,
          43,
          17,
          30,
          16
        ],
        "total": 127,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            38,
            67,
            28,
            45,
            31
          ],
          "cli/claude:claude-opus-4-7": [
            10,
            28,
            8,
            20,
            8
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            15,
            35,
            15,
            25,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          3,
          16,
          1,
          6,
          2
        ],
        "total": 28,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            4,
            36,
            1,
            10,
            2
          ],
          "cli/claude:claude-opus-4-7": [
            3,
            8,
            2,
            4,
            2
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            1,
            5,
            1,
            5,
            1
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          39,
          54,
          35,
          48,
          35
        ],
        "total": 211,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            54,
            76,
            45,
            70,
            48
          ],
          "cli/claude:claude-opus-4-7": [
            28,
            40,
            26,
            34,
            28
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            35,
            45,
            35,
            40,
            30
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "barbell_dumbbell_shape": {
      "claude-opus-4-7": {
        "scores": [
          42,
          51,
          41,
          42,
          40
        ],
        "total": 216,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            8,
            22,
            5,
            7,
            5
          ],
          "cli/claude:claude-opus-4-7": [
            22,
            35,
            18,
            28,
            20
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            95,
            100,
            90,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          68,
          37,
          80,
          46,
          55
        ],
        "total": 286,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            76,
            42,
            78,
            46,
            58
          ],
          "cli/claude:claude-opus-4-7": [
            42,
            25,
            68,
            32,
            38
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            45,
            95,
            60,
            70
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "binary_tree_fractal": {
      "claude-opus-4-7": {
        "scores": [
          29,
          25,
          32,
          18,
          27
        ],
        "total": 131,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            2,
            8,
            1,
            1,
            1
          ],
          "cli/claude:claude-opus-4-7": [
            4,
            8,
            10,
            4,
            4
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            80,
            60,
            85,
            50,
            75
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          35,
          30,
          58,
          21,
          35
        ],
        "total": 179,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            35,
            42,
            28,
            30,
            25
          ],
          "cli/claude:claude-opus-4-7": [
            40,
            28,
            52,
            22,
            30
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            30,
            20,
            95,
            10,
            50
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          19,
          15,
          37,
          14,
          29
        ],
        "total": 114,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            5,
            1,
            8,
            1,
            4
          ],
          "cli/claude:claude-opus-4-7": [
            2,
            3,
            3,
            2,
            2
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            50,
            40,
            100,
            40,
            80
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "brahmagupta_cyclic_quadrilaterals": {
      "claude-opus-4-7": {
        "scores": [
          70,
          84,
          87,
          76,
          53
        ],
        "total": 370,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            66,
            84,
            82,
            72,
            48
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            74,
            84,
            62,
            52
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            75,
            95,
            95,
            95,
            60
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          69,
          66,
          81,
          72,
          60
        ],
        "total": 348,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            74,
            82,
            76,
            78,
            63
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            50,
            68,
            52,
            48
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            80,
            65,
            100,
            85,
            70
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          33,
          35,
          34,
          32,
          34
        ],
        "total": 168,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            2,
            4,
            1,
            1,
            1
          ],
          "cli/claude:claude-opus-4-7": [
            2,
            2,
            2,
            2,
            2
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            98,
            100,
            94,
            98
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "braided_rope": {
      "claude-opus-4-7": {
        "scores": [
          64,
          67,
          69,
          59,
          64
        ],
        "total": 323,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            80,
            77,
            78,
            75,
            76
          ],
          "cli/claude:claude-opus-4-7": [
            78,
            80,
            85,
            82,
            80
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            35,
            45,
            45,
            20,
            35
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          81,
          86,
          82,
          72,
          78
        ],
        "total": 399,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            76,
            84,
            72,
            78,
            70
          ],
          "cli/claude:claude-opus-4-7": [
            72,
            80,
            78,
            62,
            74
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            95,
            95,
            75,
            90
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          91,
          91,
          90,
          89,
          89
        ],
        "total": 450,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            84,
            88,
            86,
            82,
            78
          ],
          "cli/claude:claude-opus-4-7": [
            91,
            87,
            89,
            90,
            91
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            98,
            97,
            96,
            95,
            98
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "butterfly_curve": {
      "claude-opus-4-7": {
        "scores": [
          57,
          56,
          76,
          42,
          58
        ],
        "total": 289,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            52,
            88,
            24,
            61
          ],
          "cli/claude:claude-opus-4-7": [
            15,
            22,
            40,
            10,
            15
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            98,
            95,
            100,
            92,
            98
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          28,
          31,
          69,
          15,
          29
        ],
        "total": 172,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            45,
            42,
            88,
            25,
            50
          ],
          "cli/claude:claude-opus-4-7": [
            20,
            22,
            78,
            10,
            18
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            20,
            30,
            40,
            10,
            20
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          35,
          52,
          79,
          16,
          31
        ],
        "total": 213,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            55,
            70,
            88,
            28,
            52
          ],
          "cli/claude:claude-opus-4-7": [
            15,
            22,
            55,
            10,
            15
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            35,
            65,
            95,
            10,
            25
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "calabi_yau_manifold": {
      "claude-opus-4-7": {
        "scores": [
          6,
          12,
          4,
          6,
          5
        ],
        "total": 33,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            6,
            12,
            1,
            3,
            2
          ],
          "cli/claude:claude-opus-4-7": [
            3,
            15,
            2,
            4,
            3
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          64,
          78,
          39,
          72,
          38
        ],
        "total": 291,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            38,
            76,
            24,
            55,
            23
          ],
          "cli/claude:claude-opus-4-7": [
            70,
            78,
            62,
            72,
            52
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            80,
            30,
            90,
            40
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      }
    },
    "capsule_shape": {
      "claude-opus-4-7": {
        "scores": [
          52,
          66,
          46,
          67,
          42
        ],
        "total": 273,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            66,
            52,
            60,
            50
          ],
          "cli/claude:claude-opus-4-7": [
            48,
            52,
            50,
            50,
            45
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            50,
            80,
            35,
            90,
            30
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          65,
          78,
          47,
          69,
          73
        ],
        "total": 332,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            78,
            42,
            63,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            58,
            62,
            50,
            58,
            62
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            80,
            95,
            50,
            85,
            85
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          72,
          85,
          59,
          82,
          78
        ],
        "total": 376,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            68,
            86,
            52,
            82,
            74
          ],
          "cli/claude:claude-opus-4-7": [
            62,
            74,
            55,
            70,
            72
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            95,
            70,
            95,
            88
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "cardioid_limacon_collection": {
      "claude-opus-4-7": {
        "scores": [
          85,
          87,
          91,
          81,
          81
        ],
        "total": 425,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            82,
            88,
            90,
            76,
            74
          ],
          "cli/claude:claude-opus-4-7": [
            78,
            74,
            82,
            68,
            72
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            98,
            100,
            98,
            96
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          80,
          81,
          84,
          77,
          78
        ],
        "total": 400,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            76,
            88,
            80,
            82,
            68
          ],
          "cli/claude:claude-opus-4-7": [
            72,
            68,
            78,
            70,
            72
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            92,
            88,
            95,
            80,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          84,
          83,
          91,
          79,
          81
        ],
        "total": 418,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            82,
            88,
            90,
            78,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            72,
            68,
            82,
            65,
            70
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            98,
            92,
            100,
            95,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "catenoid_helicoid_minimal": {
      "claude-opus-4-7": {
        "scores": [
          82,
          68,
          86,
          63,
          77
        ],
        "total": 376,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            78,
            66,
            82,
            62,
            74
          ],
          "cli/claude:claude-opus-4-7": [
            72,
            62,
            78,
            58,
            68
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            75,
            98,
            70,
            90
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          13,
          16,
          26,
          9,
          9
        ],
        "total": 73,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            18,
            22,
            35,
            8,
            10
          ],
          "cli/claude:claude-opus-4-7": [
            10,
            15,
            22,
            8,
            8
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            20,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "chinese_remainder_sunzi": {
      "claude-opus-4-7": {
        "scores": [
          49,
          71,
          44,
          49,
          25
        ],
        "total": 238,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            39,
            74,
            36,
            47,
            15
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            55,
            46,
            40,
            30
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            55,
            85,
            50,
            60,
            30
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          21,
          46,
          13,
          29,
          10
        ],
        "total": 119,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            22,
            68,
            10,
            36,
            8
          ],
          "cli/claude:claude-opus-4-7": [
            22,
            40,
            14,
            30,
            12
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            20,
            30,
            15,
            20,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          35,
          30,
          30,
          33,
          34
        ],
        "total": 162,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            38,
            42,
            31,
            45,
            28
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            38,
            50,
            45,
            55
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            15,
            10,
            10,
            10,
            20
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "chinese_remainder_theorem": {
      "claude-opus-4-7": {
        "scores": [
          68,
          59,
          72,
          66,
          63
        ],
        "total": 328,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            70,
            50,
            72,
            52
          ],
          "cli/claude:claude-opus-4-7": [
            62,
            52,
            70,
            55,
            58
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            55,
            95,
            70,
            80
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          2,
          3,
          2,
          2,
          2
        ],
        "total": 11,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            2,
            5,
            3,
            2,
            2
          ],
          "cli/claude:claude-opus-4-7": [
            2,
            3,
            2,
            2,
            2
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            1,
            1,
            1,
            1,
            1
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      }
    },
    "chladni_patterns": {
      "claude-opus-4-7": {
        "scores": [
          74,
          82,
          67,
          70,
          68
        ],
        "total": 361,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            62,
            78,
            45,
            67,
            58
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            72,
            72,
            48,
            55
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            92,
            96,
            85,
            95,
            92
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          83,
          82,
          89,
          67,
          77
        ],
        "total": 398,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            78,
            82,
            88,
            58,
            70
          ],
          "cli/claude:claude-opus-4-7": [
            74,
            70,
            80,
            58,
            66
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            96,
            95,
            98,
            85,
            94
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "complex_analysis_stained_glass": {
      "claude-opus-4-7": {
        "scores": [
          48,
          48,
          51,
          35,
          34
        ],
        "total": 216,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            46,
            67,
            38,
            44,
            42
          ],
          "cli/claude:claude-opus-4-7": [
            42,
            38,
            40,
            32,
            35
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            55,
            40,
            75,
            30,
            25
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          25,
          22,
          28,
          14,
          11
        ],
        "total": 100,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            34,
            36,
            38,
            24,
            16
          ],
          "cli/claude:claude-opus-4-7": [
            12,
            15,
            10,
            8,
            7
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            30,
            15,
            35,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          66,
          63,
          65,
          57,
          61
        ],
        "total": 312,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            62,
            78,
            55,
            70,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            45,
            55,
            42,
            40
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            65,
            85,
            60,
            70
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "compound_polyhedra_stella_octangula": {
      "claude-opus-4-7": {
        "scores": [
          72,
          60,
          76,
          49,
          62
        ],
        "total": 319,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            63,
            58,
            66,
            32,
            55
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            62,
            78,
            50,
            62
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            60,
            85,
            65,
            70
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          63,
          48,
          68,
          39,
          64
        ],
        "total": 282,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            48,
            38,
            46,
            18,
            42
          ],
          "cli/claude:claude-opus-4-7": [
            62,
            55,
            74,
            38,
            60
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            80,
            50,
            85,
            60,
            90
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          82,
          81,
          81,
          67,
          79
        ],
        "total": 390,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            78,
            84,
            72,
            61,
            76
          ],
          "cli/claude:claude-opus-4-7": [
            72,
            68,
            74,
            54,
            66
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            90,
            98,
            85,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "conformal_spiral_mapping": {
      "claude-opus-4-7": {
        "scores": [
          63,
          63,
          62,
          58,
          60
        ],
        "total": 306,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            74,
            45,
            62,
            52
          ],
          "cli/claude:claude-opus-4-7": [
            42,
            33,
            52,
            28,
            38
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            90,
            82,
            88,
            85,
            90
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          62,
          67,
          56,
          60,
          53
        ],
        "total": 298,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            78,
            46,
            62,
            43
          ],
          "cli/claude:claude-opus-4-7": [
            32,
            28,
            35,
            25,
            22
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            96,
            88,
            94,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          64,
          63,
          61,
          59,
          57
        ],
        "total": 304,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            67,
            52,
            55,
            45
          ],
          "cli/claude:claude-opus-4-7": [
            40,
            38,
            42,
            30,
            32
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            85,
            90,
            92,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "costa_minimal_surface": {
      "claude-opus-4-7": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          5,
          4,
          4,
          4,
          4
        ],
        "total": 21,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            3,
            1,
            1,
            1,
            1
          ],
          "cli/claude:claude-opus-4-7": [
            2,
            2,
            2,
            2,
            2
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          23,
          37,
          13,
          26,
          13
        ],
        "total": 112,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            28,
            45,
            12,
            33,
            8
          ],
          "cli/claude:claude-opus-4-7": [
            26,
            42,
            18,
            30,
            22
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            15,
            25,
            10,
            15,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "crystal_lattice_diffraction": {
      "claude-opus-4-7": {
        "scores": [
          85,
          92,
          81,
          92,
          80
        ],
        "total": 430,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            68,
            86,
            62,
            84,
            60
          ],
          "cli/claude:claude-opus-4-7": [
            86,
            90,
            82,
            91,
            80
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          82,
          75,
          82,
          70,
          78
        ],
        "total": 387,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            78,
            66,
            76,
            61
          ],
          "cli/claude:claude-opus-4-7": [
            78,
            62,
            80,
            58,
            72
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            85,
            100,
            75,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          60,
          76,
          51,
          65,
          60
        ],
        "total": 312,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            70,
            82,
            62,
            74,
            67
          ],
          "cli/claude:claude-opus-4-7": [
            55,
            70,
            52,
            55,
            52
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            55,
            75,
            40,
            65,
            60
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "cycloid_wave_patterns": {
      "claude-opus-4-7": {
        "scores": [
          81,
          83,
          87,
          83,
          84
        ],
        "total": 418,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            84,
            78,
            90,
            82,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            62,
            74,
            72,
            70,
            80
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            98,
            96,
            100,
            98,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          88,
          86,
          90,
          88,
          83
        ],
        "total": 435,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            82,
            80,
            88,
            86,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            82,
            78,
            83,
            80,
            76
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            98,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          81,
          87,
          79,
          89,
          81
        ],
        "total": 417,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            74,
            86,
            75,
            88,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            76,
            62,
            78,
            72
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "cylindrical_bend_deformation": {
      "claude-opus-4-7": {
        "scores": [
          17,
          18,
          22,
          11,
          14
        ],
        "total": 82,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            18,
            24,
            30,
            10,
            14
          ],
          "cli/claude:claude-opus-4-7": [
            22,
            20,
            32,
            18,
            18
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            5,
            5,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          74,
          72,
          81,
          63,
          63
        ],
        "total": 353,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            74,
            76,
            51,
            45
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            45,
            68,
            42,
            45
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            98,
            97,
            98,
            95,
            98
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          85,
          75,
          88,
          70,
          77
        ],
        "total": 395,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            83,
            74,
            88,
            63,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            74,
            56,
            78,
            52,
            62
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            98,
            96,
            98,
            95,
            98
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "differential_equations_water": {
      "claude-opus-4-7": {
        "scores": [
          13,
          17,
          11,
          12,
          12
        ],
        "total": 65,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            24,
            31,
            18,
            20,
            22
          ],
          "cli/claude:claude-opus-4-7": [
            6,
            10,
            5,
            7,
            5
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          22,
          25,
          19,
          17,
          17
        ],
        "total": 100,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            18,
            42,
            12,
            16,
            14
          ],
          "cli/claude:claude-opus-4-7": [
            22,
            18,
            25,
            20,
            22
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            25,
            15,
            20,
            15,
            15
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          28,
          29,
          26,
          28,
          26
        ],
        "total": 137,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            34,
            41,
            27,
            31,
            26
          ],
          "cli/claude:claude-opus-4-7": [
            20,
            22,
            17,
            18,
            18
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            30,
            25,
            35,
            35,
            35
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "dna_double_helix": {
      "claude-opus-4-7": {
        "scores": [
          53,
          82,
          48,
          63,
          38
        ],
        "total": 284,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            55,
            78,
            52,
            63,
            38
          ],
          "cli/claude:claude-opus-4-7": [
            55,
            78,
            38,
            62,
            35
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            50,
            90,
            55,
            65,
            40
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          48,
          77,
          44,
          69,
          31
        ],
        "total": 269,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            42,
            76,
            38,
            58,
            30
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            60,
            65,
            55,
            32
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            50,
            95,
            30,
            95,
            30
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "epicycloids": {
      "claude-opus-4-7": {
        "scores": [
          95,
          96,
          94,
          97,
          94
        ],
        "total": 476,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            91,
            94,
            92,
            96,
            88
          ],
          "cli/claude:claude-opus-4-7": [
            95,
            93,
            90,
            94,
            93
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          95,
          95,
          94,
          96,
          93
        ],
        "total": 473,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            90,
            91,
            88,
            93,
            86
          ],
          "cli/claude:claude-opus-4-7": [
            96,
            93,
            95,
            94,
            94
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          45,
          56,
          53,
          57,
          38
        ],
        "total": 249,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            68,
            76,
            70,
            73,
            54
          ],
          "cli/claude:claude-opus-4-7": [
            28,
            38,
            40,
            32,
            25
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            40,
            55,
            50,
            65,
            35
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "euler_polyhedron_formula": {
      "claude-opus-4-7": {
        "scores": [
          64,
          79,
          53,
          59,
          54
        ],
        "total": 309,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            78,
            52,
            50,
            43
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            72,
            58,
            62,
            55
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            65,
            88,
            50,
            65,
            65
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          8,
          10,
          6,
          6,
          7
        ],
        "total": 37,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            8,
            12,
            5,
            4,
            6
          ],
          "cli/claude:claude-opus-4-7": [
            5,
            8,
            3,
            4,
            4
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          21,
          31,
          15,
          18,
          18
        ],
        "total": 103,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            38,
            45,
            28,
            32,
            35
          ],
          "cli/claude:claude-opus-4-7": [
            10,
            22,
            8,
            12,
            10
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            15,
            25,
            10,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "euler_polyhedron_platonic": {
      "claude-opus-4-7": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          8,
          23,
          4,
          13,
          3
        ],
        "total": 51,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            8,
            34,
            3,
            16,
            2
          ],
          "cli/claude:claude-opus-4-7": [
            5,
            20,
            4,
            8,
            3
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            15,
            5,
            15,
            5
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      }
    },
    "fermat_parabolic_spiral": {
      "claude-opus-4-7": {
        "scores": [
          76,
          92,
          64,
          81,
          69
        ],
        "total": 382,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            82,
            93,
            76,
            84,
            75
          ],
          "cli/claude:claude-opus-4-7": [
            86,
            89,
            76,
            89,
            83
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            60,
            95,
            40,
            70,
            50
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          69,
          90,
          54,
          80,
          63
        ],
        "total": 356,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            76,
            93,
            68,
            86,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            62,
            82,
            55,
            80,
            58
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            70,
            95,
            40,
            75,
            60
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          77,
          93,
          64,
          78,
          69
        ],
        "total": 381,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            78,
            93,
            70,
            84,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            87,
            92,
            78,
            89,
            80
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            65,
            95,
            45,
            60,
            55
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "five_pointed_star_polygon": {
      "claude-opus-4-7": {
        "scores": [
          85,
          88,
          95,
          76,
          81
        ],
        "total": 425,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            86,
            92,
            91,
            88,
            84
          ],
          "cli/claude:claude-opus-4-7": [
            90,
            92,
            93,
            91,
            89
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            80,
            80,
            100,
            50,
            70
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          93,
          91,
          96,
          92,
          93
        ],
        "total": 465,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            88,
            84,
            92,
            86,
            87
          ],
          "cli/claude:claude-opus-4-7": [
            92,
            88,
            96,
            90,
            93
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          92,
          94,
          95,
          93,
          92
        ],
        "total": 466,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            88,
            90,
            91,
            89,
            88
          ],
          "cli/claude:claude-opus-4-7": [
            92,
            93,
            94,
            91,
            93
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            100,
            100,
            100,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "fourier_architectural_blueprint": {
      "claude-opus-4-7": {
        "scores": [
          39,
          60,
          47,
          38,
          34
        ],
        "total": 218,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            28,
            58,
            30,
            24,
            20
          ],
          "cli/claude:claude-opus-4-7": [
            38,
            52,
            50,
            40,
            32
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            50,
            70,
            60,
            50,
            50
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          58,
          62,
          58,
          59,
          54
        ],
        "total": 291,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            45,
            62,
            35,
            58,
            38
          ],
          "cli/claude:claude-opus-4-7": [
            30,
            28,
            38,
            25,
            25
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            96,
            100,
            95,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          25,
          72,
          14,
          64,
          24
        ],
        "total": 199,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            32,
            78,
            18,
            62,
            24
          ],
          "cli/claude:claude-opus-4-7": [
            28,
            52,
            15,
            50,
            22
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            15,
            85,
            10,
            80,
            25
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "fourier_epicycles_drawing": {
      "claude-opus-4-7": {
        "scores": [
          77,
          88,
          75,
          81,
          70
        ],
        "total": 391,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            68,
            88,
            56,
            78,
            58
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            78,
            74,
            68,
            62
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            98,
            95,
            98,
            90
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          78,
          75,
          85,
          73,
          77
        ],
        "total": 388,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            68,
            78,
            65,
            60
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            65,
            78,
            60,
            72
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            92,
            98,
            95,
            98
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          81,
          78,
          85,
          77,
          81
        ],
        "total": 402,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            74,
            82,
            78,
            75,
            70
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            55,
            76,
            58,
            72
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            96,
            100,
            98,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "fractal_loxodromic_patterns": {
      "claude-opus-4-7": {
        "scores": [
          11,
          24,
          8,
          14,
          10
        ],
        "total": 67,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            18,
            42,
            10,
            20,
            14
          ],
          "cli/claude:claude-opus-4-7": [
            6,
            10,
            4,
            8,
            5
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            20,
            10,
            15,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          57,
          60,
          55,
          52,
          51
        ],
        "total": 275,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            68,
            82,
            61,
            63,
            58
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            48,
            55,
            42,
            45
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            50,
            50,
            50,
            50,
            50
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          31,
          23,
          27,
          27,
          25
        ],
        "total": 133,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            42,
            35,
            24,
            37,
            27
          ],
          "cli/claude:claude-opus-4-7": [
            22,
            20,
            22,
            24,
            22
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            30,
            15,
            35,
            20,
            25
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "fractal_tree_2d": {
      "claude-opus-4-7": {
        "scores": [
          76,
          84,
          70,
          86,
          72
        ],
        "total": 388,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            70,
            78,
            62,
            82,
            58
          ],
          "cli/claude:claude-opus-4-7": [
            78,
            76,
            72,
            80,
            72
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            80,
            98,
            75,
            96,
            85
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          75,
          91,
          67,
          92,
          64
        ],
        "total": 389,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            74,
            82,
            69,
            84,
            63
          ],
          "cli/claude:claude-opus-4-7": [
            70,
            92,
            62,
            93,
            60
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            80,
            98,
            70,
            98,
            70
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          79,
          86,
          71,
          85,
          68
        ],
        "total": 389,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            78,
            86,
            72,
            84,
            68
          ],
          "cli/claude:claude-opus-4-7": [
            74,
            78,
            62,
            76,
            66
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            95,
            80,
            95,
            70
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "gauss_complex_plane": {
      "claude-opus-4-7": {
        "scores": [
          74,
          83,
          92,
          82,
          58
        ],
        "total": 389,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            74,
            82,
            91,
            80,
            61
          ],
          "cli/claude:claude-opus-4-7": [
            78,
            74,
            88,
            76,
            58
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            70,
            92,
            98,
            90,
            55
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          59,
          73,
          79,
          67,
          51
        ],
        "total": 329,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            68,
            83,
            74,
            78,
            58
          ],
          "cli/claude:claude-opus-4-7": [
            55,
            62,
            68,
            52,
            45
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            55,
            75,
            95,
            70,
            50
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "geometric_cube": {
      "claude-opus-4-7": {
        "scores": [
          7,
          18,
          5,
          10,
          5
        ],
        "total": 45,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            8,
            22,
            6,
            9,
            5
          ],
          "cli/claude:claude-opus-4-7": [
            8,
            22,
            7,
            15,
            8
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            5,
            10,
            1,
            5,
            1
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          89,
          92,
          86,
          89,
          88
        ],
        "total": 444,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            78,
            88,
            70,
            84,
            76
          ],
          "cli/claude:claude-opus-4-7": [
            88,
            89,
            89,
            83,
            88
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          42,
          46,
          54,
          56,
          35
        ],
        "total": 233,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            63,
            54,
            66,
            45
          ],
          "cli/claude:claude-opus-4-7": [
            38,
            40,
            62,
            52,
            30
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            30,
            35,
            45,
            50,
            30
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "glass_sphere_red_core": {
      "claude-opus-4-7": {
        "scores": [
          46,
          39,
          45,
          34,
          39
        ],
        "total": 203,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            45,
            42,
            36,
            34,
            38
          ],
          "cli/claude:claude-opus-4-7": [
            42,
            40,
            48,
            38,
            40
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            50,
            35,
            50,
            30,
            40
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          48,
          40,
          57,
          37,
          43
        ],
        "total": 225,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            55,
            48,
            58,
            42,
            45
          ],
          "cli/claude:claude-opus-4-7": [
            45,
            38,
            52,
            35,
            40
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            45,
            35,
            60,
            35,
            45
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          39,
          39,
          37,
          31,
          35
        ],
        "total": 181,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            50,
            58,
            45,
            42,
            44
          ],
          "cli/claude:claude-opus-4-7": [
            28,
            25,
            32,
            22,
            26
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            40,
            35,
            35,
            30,
            35
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "group_theory_kaleidoscope": {
      "claude-opus-4-7": {
        "scores": [
          58,
          71,
          47,
          75,
          53
        ],
        "total": 304,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            76,
            42,
            70,
            39
          ],
          "cli/claude:claude-opus-4-7": [
            76,
            82,
            70,
            80,
            74
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            40,
            55,
            30,
            75,
            45
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          56,
          70,
          46,
          68,
          48
        ],
        "total": 288,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            62,
            78,
            48,
            72,
            50
          ],
          "cli/claude:claude-opus-4-7": [
            80,
            82,
            76,
            78,
            74
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            25,
            50,
            15,
            55,
            20
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          30,
          65,
          21,
          47,
          25
        ],
        "total": 188,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            45,
            76,
            28,
            66,
            34
          ],
          "cli/claude:claude-opus-4-7": [
            30,
            45,
            25,
            30,
            22
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            15,
            75,
            10,
            45,
            20
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "gyroscopic_nested_rings": {
      "claude-opus-4-7": {
        "scores": [
          75,
          91,
          72,
          91,
          87
        ],
        "total": 416,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            80,
            91,
            74,
            88,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            86,
            87,
            82,
            85,
            88
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            60,
            95,
            60,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          85,
          83,
          90,
          78,
          78
        ],
        "total": 414,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            76,
            84,
            82,
            72,
            55
          ],
          "cli/claude:claude-opus-4-7": [
            84,
            74,
            88,
            68,
            78
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            92,
            100,
            95,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          75,
          81,
          78,
          72,
          77
        ],
        "total": 383,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            74,
            82,
            78,
            58,
            62
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            70,
            55,
            62,
            68
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            98,
            92,
            100,
            96,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "helical_twist_deformation": {
      "claude-opus-4-7": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          37,
          36,
          49,
          47,
          52
        ],
        "total": 221,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            32,
            48,
            38,
            22,
            35
          ],
          "cli/claude:claude-opus-4-7": [
            15,
            25,
            30,
            18,
            20
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            65,
            35,
            80,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          28,
          23,
          22,
          19,
          32
        ],
        "total": 124,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            45,
            38,
            30,
            28,
            42
          ],
          "cli/claude:claude-opus-4-7": [
            30,
            20,
            35,
            20,
            40
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            1,
            10,
            15
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "helical_twisted_cube_advanced": {
      "claude-opus-4-7": {
        "scores": [
          8,
          17,
          9,
          6,
          16
        ],
        "total": 56,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            8,
            22,
            5,
            8,
            20
          ],
          "cli/claude:claude-opus-4-7": [
            15,
            20,
            22,
            10,
            18
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            1,
            10,
            1,
            1,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          46,
          51,
          52,
          20,
          57
        ],
        "total": 226,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            52,
            68,
            55,
            22,
            42
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            55,
            58,
            22,
            45
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            35,
            30,
            42,
            15,
            85
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          53,
          67,
          65,
          30,
          50
        ],
        "total": 265,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            45,
            72,
            42,
            28,
            45
          ],
          "cli/claude:claude-opus-4-7": [
            48,
            55,
            68,
            32,
            55
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            65,
            75,
            85,
            30,
            50
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "holographic_interference": {
      "claude-opus-4-7": {
        "scores": [
          44,
          74,
          35,
          54,
          57
        ],
        "total": 264,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            42,
            68,
            38,
            45,
            40
          ],
          "cli/claude:claude-opus-4-7": [
            40,
            70,
            28,
            38,
            50
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            50,
            85,
            40,
            80,
            80
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          58,
          78,
          37,
          59,
          66
        ],
        "total": 298,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            55,
            76,
            40,
            62,
            58
          ],
          "cli/claude:claude-opus-4-7": [
            48,
            62,
            32,
            35,
            50
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            70,
            95,
            40,
            80,
            90
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          66,
          85,
          40,
          55,
          76
        ],
        "total": 322,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            54,
            82,
            45,
            50,
            58
          ],
          "cli/claude:claude-opus-4-7": [
            55,
            72,
            35,
            45,
            70
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            90,
            100,
            40,
            70,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "hopf_fibration_base_loops": {
      "claude-opus-4-7": {
        "scores": [
          26,
          70,
          26,
          38,
          50
        ],
        "total": 210,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            46,
            74,
            41,
            48,
            38
          ],
          "cli/claude:claude-opus-4-7": [
            12,
            50,
            8,
            22,
            42
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            20,
            85,
            30,
            45,
            70
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          1,
          8,
          1,
          2,
          2
        ],
        "total": 14,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            2,
            15,
            1,
            3,
            2
          ],
          "cli/claude:claude-opus-4-7": [
            1,
            3,
            1,
            2,
            2
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            1,
            5,
            1,
            1,
            1
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          66,
          76,
          72,
          52,
          61
        ],
        "total": 327,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            74,
            76,
            58,
            57
          ],
          "cli/claude:claude-opus-4-7": [
            42,
            60,
            40,
            32,
            40
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            95,
            100,
            65,
            85
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "hyper_menger_cube_3sphere": {
      "claude-opus-4-7": {
        "scores": [
          30,
          21,
          34,
          24,
          32
        ],
        "total": 141,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            42,
            28,
            36,
            24,
            45
          ],
          "cli/claude:claude-opus-4-7": [
            18,
            15,
            22,
            14,
            20
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            30,
            20,
            45,
            35,
            30
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          11,
          10,
          16,
          14,
          23
        ],
        "total": 74,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            8,
            12,
            5,
            8,
            10
          ],
          "cli/claude:claude-opus-4-7": [
            5,
            8,
            3,
            5,
            10
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            20,
            10,
            40,
            30,
            50
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          15,
          20,
          17,
          17,
          16
        ],
        "total": 85,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            12,
            35,
            10,
            18,
            15
          ],
          "cli/claude:claude-opus-4-7": [
            4,
            6,
            2,
            3,
            3
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            30,
            20,
            40,
            30,
            30
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "hyperbolic_heat_kernel": {
      "claude-opus-4-7": {
        "scores": [
          63,
          64,
          67,
          45,
          57
        ],
        "total": 296,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            63,
            70,
            54,
            58,
            61
          ],
          "cli/claude:claude-opus-4-7": [
            55,
            58,
            62,
            42,
            55
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            70,
            65,
            85,
            35,
            55
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          75,
          83,
          73,
          70,
          70
        ],
        "total": 371,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            66,
            82,
            58,
            70,
            62
          ],
          "cli/claude:claude-opus-4-7": [
            65,
            68,
            62,
            55,
            58
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            98,
            98,
            85,
            90
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          79,
          84,
          63,
          80,
          76
        ],
        "total": 382,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            70,
            84,
            55,
            78,
            67
          ],
          "cli/claude:claude-opus-4-7": [
            78,
            74,
            80,
            68,
            72
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            90,
            95,
            55,
            95,
            90
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "icosahedron_wireframe": {
      "claude-opus-4-7": {
        "scores": [
          8,
          16,
          8,
          8,
          6
        ],
        "total": 46,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            10,
            18,
            8,
            8,
            7
          ],
          "cli/claude:claude-opus-4-7": [
            5,
            15,
            5,
            12,
            5
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            15,
            10,
            5,
            5
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          6,
          16,
          5,
          4,
          4
        ],
        "total": 35,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            1,
            4,
            3,
            1,
            1
          ],
          "cli/claude:claude-opus-4-7": [
            2,
            5,
            3,
            1,
            1
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            15,
            40,
            10,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "klein_bottle": {
      "claude-opus-4-7": {
        "scores": [
          7,
          15,
          7,
          11,
          7
        ],
        "total": 47,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            4,
            18,
            1,
            3,
            1
          ],
          "cli/claude:claude-opus-4-7": [
            8,
            18,
            10,
            15,
            10
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            15,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          57,
          65,
          51,
          52,
          52
        ],
        "total": 277,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            55,
            72,
            48,
            45,
            42
          ],
          "cli/claude:claude-opus-4-7": [
            22,
            30,
            15,
            25,
            18
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            92,
            90,
            85,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          34,
          36,
          39,
          19,
          26
        ],
        "total": 154,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            46,
            55,
            28,
            40
          ],
          "cli/claude:claude-opus-4-7": [
            20,
            32,
            18,
            14,
            18
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            25,
            30,
            45,
            15,
            20
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "lissajous_curve_garden": {
      "claude-opus-4-7": {
        "scores": [
          63,
          59,
          14,
          9,
          15
        ],
        "total": 160,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            70,
            22,
            12,
            25
          ],
          "cli/claude:claude-opus-4-7": [
            45,
            38,
            15,
            10,
            15
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            70,
            5,
            5,
            5
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          78,
          75,
          19,
          12,
          20
        ],
        "total": 204,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            78,
            82,
            35,
            20,
            42
          ],
          "cli/claude:claude-opus-4-7": [
            72,
            68,
            20,
            15,
            18
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            75,
            1,
            1,
            1
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          75,
          76,
          16,
          10,
          18
        ],
        "total": 195,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            78,
            84,
            24,
            14,
            30
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            48,
            15,
            10,
            15
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            95,
            10,
            5,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "logarithmic_spiral_motion": {
      "claude-opus-4-7": {
        "scores": [
          33,
          33,
          34,
          29,
          34
        ],
        "total": 163,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            2,
            1,
            3,
            1,
            2
          ],
          "cli/claude:claude-opus-4-7": [
            3,
            2,
            3,
            2,
            2
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            95,
            96,
            85,
            98
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          13,
          11,
          14,
          8,
          11
        ],
        "total": 57,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            18,
            20,
            22,
            8,
            15
          ],
          "cli/claude:claude-opus-4-7": [
            12,
            4,
            10,
            5,
            8
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          71,
          68,
          74,
          68,
          72
        ],
        "total": 353,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            74,
            63,
            78,
            68,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            45,
            50,
            48,
            45,
            48
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            90,
            95,
            92,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "lorenz_attractor_poincare": {
      "claude-opus-4-7": {
        "scores": [
          7,
          11,
          6,
          6,
          8
        ],
        "total": 38,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            8,
            12,
            5,
            4,
            6
          ],
          "cli/claude:claude-opus-4-7": [
            4,
            5,
            3,
            3,
            4
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            15,
            10,
            10,
            15
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          68,
          49,
          65,
          50,
          59
        ],
        "total": 291,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            66,
            48,
            70,
            43,
            58
          ],
          "cli/claude:claude-opus-4-7": [
            48,
            40,
            45,
            42,
            38
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            90,
            60,
            80,
            65,
            80
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          69,
          59,
          70,
          52,
          62
        ],
        "total": 312,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            66,
            58,
            61,
            55,
            57
          ],
          "cli/claude:claude-opus-4-7": [
            55,
            50,
            58,
            45,
            50
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            70,
            90,
            55,
            80
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "loxodromic_sphere_spirals": {
      "claude-opus-4-7": {
        "scores": [
          6,
          11,
          5,
          7,
          5
        ],
        "total": 34,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            4,
            18,
            2,
            6,
            2
          ],
          "cli/claude:claude-opus-4-7": [
            4,
            5,
            3,
            5,
            3
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          59,
          48,
          76,
          48,
          57
        ],
        "total": 288,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            70,
            73,
            78,
            62,
            67
          ],
          "cli/claude:claude-opus-4-7": [
            48,
            25,
            55,
            32,
            38
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            60,
            45,
            95,
            50,
            65
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          52,
          55,
          61,
          57,
          46
        ],
        "total": 271,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            63,
            72,
            61,
            58,
            50
          ],
          "cli/claude:claude-opus-4-7": [
            28,
            34,
            26,
            32,
            22
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            65,
            60,
            95,
            80,
            65
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "mandala_circles": {
      "claude-opus-4-7": {
        "scores": [
          81,
          90,
          81,
          94,
          80
        ],
        "total": 426,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            82,
            91,
            74,
            94,
            78
          ],
          "cli/claude:claude-opus-4-7": [
            78,
            90,
            88,
            90,
            80
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            82,
            88,
            80,
            98,
            82
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          88,
          91,
          88,
          93,
          89
        ],
        "total": 449,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            74,
            88,
            72,
            91,
            75
          ],
          "cli/claude:claude-opus-4-7": [
            90,
            88,
            93,
            89,
            91
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            98,
            100,
            98,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          85,
          93,
          87,
          95,
          84
        ],
        "total": 444,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            81,
            90,
            78,
            95,
            80
          ],
          "cli/claude:claude-opus-4-7": [
            78,
            88,
            82,
            90,
            76
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            100,
            100,
            100,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "mandelbulb_fractal": {
      "claude-opus-4-7": {
        "scores": [
          5,
          8,
          7,
          6,
          5
        ],
        "total": 31,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            2,
            3,
            1,
            2,
            1
          ],
          "cli/claude:claude-opus-4-7": [
            4,
            10,
            10,
            6,
            4
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          1,
          4,
          1,
          2,
          1
        ],
        "total": 9,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            2,
            8,
            1,
            4,
            1
          ],
          "cli/claude:claude-opus-4-7": [
            1,
            3,
            1,
            1,
            1
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            1,
            1,
            1,
            1,
            1
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          6,
          8,
          5,
          7,
          5
        ],
        "total": 31,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            6,
            12,
            2,
            8,
            3
          ],
          "cli/claude:claude-opus-4-7": [
            2,
            3,
            2,
            3,
            2
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "menger_cube_fractal": {
      "claude-opus-4-7": {
        "scores": [
          3,
          6,
          2,
          6,
          2
        ],
        "total": 19,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            5,
            8,
            3,
            4,
            2
          ],
          "cli/claude:claude-opus-4-7": [
            3,
            5,
            2,
            5,
            3
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            1,
            5,
            1,
            10,
            1
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          49,
          38,
          42,
          48,
          36
        ],
        "total": 213,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            41,
            45,
            50,
            39
          ],
          "cli/claude:claude-opus-4-7": [
            70,
            52,
            72,
            58,
            60
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            20,
            20,
            10,
            35,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          43,
          31,
          56,
          29,
          36
        ],
        "total": 195,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            48,
            34,
            56,
            25,
            36
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            40,
            68,
            38,
            48
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            30,
            20,
            45,
            25,
            25
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "menger_sponge_fractal": {
      "claude-opus-4-7": {
        "scores": [
          9,
          9,
          6,
          6,
          5
        ],
        "total": 35,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            8,
            12,
            1,
            2,
            1
          ],
          "cli/claude:claude-opus-4-7": [
            8,
            5,
            8,
            5,
            4
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          8,
          8,
          3,
          5,
          5
        ],
        "total": 29,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            8,
            6,
            1,
            2,
            1
          ],
          "cli/claude:claude-opus-4-7": [
            5,
            8,
            3,
            3,
            3
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            5,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          15,
          11,
          9,
          10,
          9
        ],
        "total": 54,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            35,
            22,
            18,
            20,
            18
          ],
          "cli/claude:claude-opus-4-7": [
            4,
            5,
            3,
            4,
            3
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            5,
            5,
            5,
            5,
            5
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "mobius_strip_half_twist": {
      "claude-opus-4-7": {
        "scores": [
          79,
          69,
          82,
          62,
          69
        ],
        "total": 361,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            76,
            63,
            70,
            58,
            60
          ],
          "cli/claude:claude-opus-4-7": [
            75,
            68,
            80,
            62,
            72
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            75,
            95,
            65,
            75
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          72,
          75,
          71,
          72,
          68
        ],
        "total": 358,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            66,
            70,
            61,
            63,
            56
          ],
          "cli/claude:claude-opus-4-7": [
            55,
            60,
            55,
            58,
            52
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            96,
            98,
            96,
            97
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          8,
          4,
          10,
          3,
          6
        ],
        "total": 31,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            12,
            4,
            15,
            3,
            5
          ],
          "cli/claude:claude-opus-4-7": [
            2,
            3,
            5,
            2,
            2
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            5,
            10,
            5,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "mobius_strip_triple_twist": {
      "claude-opus-4-7": {
        "scores": [
          85,
          88,
          86,
          73,
          79
        ],
        "total": 411,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            78,
            82,
            79,
            63,
            66
          ],
          "cli/claude:claude-opus-4-7": [
            78,
            82,
            80,
            62,
            72
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            95,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          83,
          82,
          83,
          76,
          79
        ],
        "total": 403,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            76,
            84,
            72,
            66,
            68
          ],
          "cli/claude:claude-opus-4-7": [
            72,
            62,
            78,
            62,
            70
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          72,
          43,
          81,
          43,
          51
        ],
        "total": 290,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            74,
            68,
            82,
            54,
            61
          ],
          "cli/claude:claude-opus-4-7": [
            58,
            30,
            72,
            40,
            48
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            30,
            90,
            35,
            45
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "mobius_transformation_3d": {
      "claude-opus-4-7": {
        "scores": [
          6,
          1,
          17,
          1,
          2
        ],
        "total": 27,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            12,
            1,
            45,
            1,
            3
          ],
          "cli/claude:claude-opus-4-7": [
            4,
            2,
            5,
            2,
            2
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            1,
            1,
            1,
            1,
            1
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          49,
          46,
          52,
          51,
          46
        ],
        "total": 244,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            68,
            72,
            60,
            64,
            55
          ],
          "cli/claude:claude-opus-4-7": [
            35,
            22,
            55,
            25,
            28
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            45,
            45,
            40,
            65,
            55
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          7,
          9,
          13,
          6,
          7
        ],
        "total": 42,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            5,
            12,
            8,
            3,
            2
          ],
          "cli/claude:claude-opus-4-7": [
            5,
            6,
            22,
            6,
            10
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "number_theory_music": {
      "claude-opus-4-7": {
        "scores": [
          9,
          11,
          9,
          9,
          8
        ],
        "total": 46,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            10,
            12,
            8,
            7,
            6
          ],
          "cli/claude:claude-opus-4-7": [
            8,
            10,
            10,
            9,
            8
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          28,
          17,
          35,
          21,
          23
        ],
        "total": 124,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            24,
            18,
            19,
            23,
            17
          ],
          "cli/claude:claude-opus-4-7": [
            10,
            12,
            10,
            11,
            8
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            50,
            20,
            75,
            30,
            45
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      }
    },
    "octagram_star_polygon": {
      "claude-opus-4-7": {
        "scores": [
          77,
          89,
          79,
          63,
          69
        ],
        "total": 377,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            90,
            70,
            64,
            66
          ],
          "cli/claude:claude-opus-4-7": [
            74,
            82,
            72,
            66,
            70
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            95,
            95,
            60,
            70
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          79,
          86,
          81,
          72,
          75
        ],
        "total": 393,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            64,
            88,
            58,
            55,
            60
          ],
          "cli/claude:claude-opus-4-7": [
            72,
            70,
            85,
            62,
            65
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          36,
          61,
          61,
          31,
          29
        ],
        "total": 218,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            38,
            72,
            46,
            42,
            36
          ],
          "cli/claude:claude-opus-4-7": [
            30,
            30,
            38,
            22,
            22
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            40,
            80,
            100,
            30,
            30
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "parametric_gear_train": {
      "claude-opus-4-7": {
        "scores": [
          68,
          81,
          77,
          79,
          70
        ],
        "total": 375,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            76,
            84,
            75,
            84,
            76
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            74,
            62,
            65,
            55
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            60,
            85,
            95,
            88,
            80
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          69,
          80,
          56,
          80,
          73
        ],
        "total": 358,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            70,
            86,
            49,
            82,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            70,
            58,
            67,
            72
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            68,
            85,
            60,
            90,
            76
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "parametric_seashell": {
      "claude-opus-4-7": {
        "scores": [
          63,
          77,
          55,
          66,
          79
        ],
        "total": 340,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            82,
            76,
            84,
            75,
            79
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            70,
            62,
            60,
            66
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            40,
            85,
            20,
            64,
            92
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          26,
          29,
          25,
          27,
          33
        ],
        "total": 140,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            42,
            48,
            36,
            48,
            52
          ],
          "cli/claude:claude-opus-4-7": [
            22,
            30,
            20,
            18,
            22
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            15,
            10,
            20,
            15,
            25
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          49,
          56,
          70,
          41,
          45
        ],
        "total": 261,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            73,
            70,
            82,
            58,
            61
          ],
          "cli/claude:claude-opus-4-7": [
            30,
            48,
            62,
            25,
            30
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            45,
            50,
            65,
            40,
            45
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "penrose_tiling_p3": {
      "claude-opus-4-7": {
        "scores": [
          61,
          79,
          63,
          63,
          54
        ],
        "total": 320,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            80,
            67,
            65,
            48
          ],
          "cli/claude:claude-opus-4-7": [
            45,
            62,
            38,
            40,
            38
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            80,
            95,
            85,
            85,
            75
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          22,
          34,
          17,
          35,
          20
        ],
        "total": 128,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            42,
            55,
            34,
            52,
            31
          ],
          "cli/claude:claude-opus-4-7": [
            10,
            22,
            8,
            18,
            8
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            15,
            25,
            10,
            35,
            20
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          13,
          33,
          11,
          25,
          16
        ],
        "total": 98,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            22,
            63,
            18,
            45,
            20
          ],
          "cli/claude:claude-opus-4-7": [
            8,
            22,
            5,
            10,
            8
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            15,
            10,
            20,
            20
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "phyllotaxis_spiral": {
      "claude-opus-4-7": {
        "scores": [
          7,
          19,
          15,
          6,
          7
        ],
        "total": 54,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            10,
            35,
            18,
            8,
            10
          ],
          "cli/claude:claude-opus-4-7": [
            7,
            12,
            22,
            6,
            6
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            5,
            10,
            5,
            5,
            5
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          80,
          82,
          82,
          75,
          80
        ],
        "total": 399,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            78,
            88,
            73,
            74,
            76
          ],
          "cli/claude:claude-opus-4-7": [
            62,
            58,
            72,
            50,
            65
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          4,
          17,
          17,
          6,
          5
        ],
        "total": 49,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            8,
            35,
            42,
            12,
            10
          ],
          "cli/claude:claude-opus-4-7": [
            4,
            15,
            8,
            6,
            4
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            1,
            1,
            1,
            1,
            1
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "poincare_disc": {
      "claude-opus-4-7": {
        "scores": [
          94,
          95,
          94,
          96,
          93
        ],
        "total": 472,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            90,
            92,
            87,
            93,
            84
          ],
          "cli/claude:claude-opus-4-7": [
            93,
            92,
            95,
            94,
            95
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          75,
          89,
          81,
          91,
          83
        ],
        "total": 419,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            89,
            86,
            97,
            93,
            88
          ],
          "cli/claude:claude-opus-4-7": [
            35,
            80,
            45,
            80,
            60
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          67,
          89,
          76,
          90,
          83
        ],
        "total": 405,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            83,
            87,
            93,
            87,
            84
          ],
          "cli/claude:claude-opus-4-7": [
            88,
            86,
            90,
            89,
            90
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            30,
            95,
            45,
            95,
            75
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "prime_crystal_lattice": {
      "claude-opus-4-7": {
        "scores": [
          57,
          76,
          61,
          74,
          56
        ],
        "total": 324,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            63,
            82,
            59,
            81,
            50
          ],
          "cli/claude:claude-opus-4-7": [
            42,
            58,
            38,
            52,
            48
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            65,
            88,
            85,
            90,
            70
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          32,
          71,
          35,
          73,
          55
        ],
        "total": 266,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            45,
            78,
            41,
            76,
            55
          ],
          "cli/claude:claude-opus-4-7": [
            32,
            45,
            30,
            48,
            42
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            20,
            90,
            35,
            95,
            68
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "probability_weather_patterns": {
      "claude-opus-4-7": {
        "scores": [
          30,
          33,
          27,
          25,
          22
        ],
        "total": 137,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            32,
            46,
            28,
            26,
            22
          ],
          "cli/claude:claude-opus-4-7": [
            22,
            28,
            18,
            25,
            20
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            35,
            25,
            35,
            25,
            25
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          32,
          33,
          27,
          30,
          28
        ],
        "total": 150,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            31,
            27,
            18,
            24,
            22
          ],
          "cli/claude:claude-opus-4-7": [
            15,
            22,
            14,
            15,
            12
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            50,
            50,
            50,
            50,
            50
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          38,
          39,
          39,
          30,
          27
        ],
        "total": 173,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            46,
            57,
            38,
            43,
            34
          ],
          "cli/claude:claude-opus-4-7": [
            32,
            30,
            28,
            26,
            22
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            35,
            30,
            50,
            20,
            25
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "quantum_probability_waves": {
      "claude-opus-4-7": {
        "scores": [
          81,
          86,
          65,
          78,
          74
        ],
        "total": 384,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            76,
            28,
            50,
            36
          ],
          "cli/claude:claude-opus-4-7": [
            86,
            82,
            78,
            83,
            87
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            90,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          63,
          62,
          31,
          45,
          67
        ],
        "total": 268,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            68,
            82,
            42,
            66,
            48
          ],
          "cli/claude:claude-opus-4-7": [
            42,
            48,
            35,
            45,
            52
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            80,
            55,
            15,
            25,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          41,
          55,
          46,
          37,
          52
        ],
        "total": 231,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            78,
            55,
            61,
            64
          ],
          "cli/claude:claude-opus-4-7": [
            40,
            38,
            32,
            30,
            42
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            50,
            50,
            19,
            50
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "ramanujan_mock_theta": {
      "claude-opus-4-7": {
        "scores": [
          57,
          78,
          59,
          70,
          48
        ],
        "total": 312,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            80,
            38,
            68,
            43
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            70,
            58,
            72,
            62
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            45,
            85,
            80,
            70,
            40
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          69,
          73,
          58,
          75,
          64
        ],
        "total": 339,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            82,
            48,
            76,
            55
          ],
          "cli/claude:claude-opus-4-7": [
            35,
            38,
            28,
            52,
            40
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            99,
            98,
            98
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          52,
          74,
          30,
          61,
          46
        ],
        "total": 263,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            48,
            78,
            35,
            55,
            42
          ],
          "cli/claude:claude-opus-4-7": [
            32,
            48,
            25,
            52,
            32
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            75,
            95,
            30,
            75,
            65
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "reaction_diffusion_patterns": {
      "claude-opus-4-7": {
        "scores": [
          12,
          36,
          6,
          20,
          9
        ],
        "total": 83,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            18,
            55,
            8,
            25,
            12
          ],
          "cli/claude:claude-opus-4-7": [
            8,
            22,
            5,
            10,
            5
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            30,
            5,
            25,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          20,
          47,
          16,
          35,
          19
        ],
        "total": 137,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            35,
            72,
            28,
            45,
            32
          ],
          "cli/claude:claude-opus-4-7": [
            15,
            38,
            10,
            25,
            14
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            30,
            10,
            35,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          17,
          44,
          12,
          35,
          16
        ],
        "total": 124,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            28,
            63,
            18,
            48,
            24
          ],
          "cli/claude:claude-opus-4-7": [
            14,
            48,
            12,
            28,
            15
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            20,
            5,
            30,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "regular_dodecahedron": {
      "claude-opus-4-7": {
        "scores": [
          87,
          80,
          92,
          76,
          86
        ],
        "total": 421,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            82,
            72,
            88,
            68,
            78
          ],
          "cli/claude:claude-opus-4-7": [
            80,
            72,
            88,
            62,
            80
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            95,
            100,
            98,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          88,
          80,
          91,
          79,
          85
        ],
        "total": 423,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            78,
            63,
            82,
            65,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            86,
            76,
            91,
            72,
            84
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          92,
          84,
          95,
          85,
          90
        ],
        "total": 446,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            88,
            73,
            92,
            76,
            84
          ],
          "cli/claude:claude-opus-4-7": [
            88,
            80,
            92,
            78,
            86
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "regular_icosahedron": {
      "claude-opus-4-7": {
        "scores": [
          93,
          90,
          96,
          90,
          90
        ],
        "total": 459,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            91,
            84,
            96,
            88,
            82
          ],
          "cli/claude:claude-opus-4-7": [
            88,
            87,
            92,
            83,
            87
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          78,
          79,
          89,
          85,
          75
        ],
        "total": 406,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            76,
            73,
            84,
            79,
            67
          ],
          "cli/claude:claude-opus-4-7": [
            58,
            65,
            82,
            76,
            58
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          93,
          93,
          95,
          91,
          90
        ],
        "total": 462,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            88,
            90,
            92,
            84,
            82
          ],
          "cli/claude:claude-opus-4-7": [
            91,
            89,
            92,
            88,
            89
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "regular_octahedron": {
      "claude-opus-4-7": {
        "scores": [
          91,
          91,
          95,
          90,
          89
        ],
        "total": 456,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            82,
            84,
            91,
            83,
            78
          ],
          "cli/claude:claude-opus-4-7": [
            90,
            88,
            93,
            86,
            89
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          89,
          91,
          92,
          90,
          89
        ],
        "total": 451,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            84,
            88,
            82,
            87,
            80
          ],
          "cli/claude:claude-opus-4-7": [
            82,
            86,
            94,
            83,
            86
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          92,
          91,
          92,
          91,
          92
        ],
        "total": 458,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            88,
            90,
            84,
            91,
            86
          ],
          "cli/claude:claude-opus-4-7": [
            89,
            87,
            92,
            86,
            89
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            95,
            100,
            96,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "regular_tetrahedron": {
      "claude-opus-4-7": {
        "scores": [
          12,
          13,
          16,
          9,
          9
        ],
        "total": 59,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            22,
            18,
            32,
            10,
            12
          ],
          "cli/claude:claude-opus-4-7": [
            5,
            10,
            5,
            6,
            4
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          62,
          39,
          67,
          37,
          64
        ],
        "total": 269,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            80,
            58,
            88,
            55,
            81
          ],
          "cli/claude:claude-opus-4-7": [
            15,
            18,
            15,
            15,
            15
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            90,
            40,
            98,
            42,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          11,
          19,
          27,
          9,
          9
        ],
        "total": 75,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            12,
            28,
            25,
            8,
            10
          ],
          "cli/claude:claude-opus-4-7": [
            10,
            20,
            15,
            10,
            8
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            40,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "riemann_surface_branch_cuts": {
      "claude-opus-4-7": {
        "scores": [
          73,
          75,
          76,
          72,
          68
        ],
        "total": 364,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            70,
            78,
            73,
            60
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            58,
            55,
            50,
            50
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            98,
            96,
            92,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          53,
          57,
          53,
          49,
          49
        ],
        "total": 261,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            52,
            63,
            45,
            58,
            43
          ],
          "cli/claude:claude-opus-4-7": [
            22,
            18,
            20,
            28,
            20
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            90,
            95,
            60,
            85
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          22,
          16,
          21,
          18,
          17
        ],
        "total": 94,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            42,
            28,
            38,
            35,
            30
          ],
          "cli/claude:claude-opus-4-7": [
            8,
            10,
            6,
            10,
            5
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            15,
            10,
            20,
            10,
            15
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "riemann_zeta_zeros": {
      "claude-opus-4-7": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "gemini-3.1-pro-preview": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          29,
          47,
          17,
          47,
          30
        ],
        "total": 170,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            28,
            62,
            10,
            55,
            22
          ],
          "cli/claude:claude-opus-4-7": [
            45,
            58,
            32,
            55,
            48
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            15,
            20,
            10,
            30,
            20
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "rose_curves": {
      "claude-opus-4-7": {
        "scores": [
          75,
          91,
          88,
          87,
          73
        ],
        "total": 414,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            84,
            90,
            89,
            86,
            78
          ],
          "cli/claude:claude-opus-4-7": [
            92,
            88,
            91,
            86,
            90
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            50,
            95,
            85,
            90,
            50
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          81,
          87,
          79,
          87,
          82
        ],
        "total": 416,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            88,
            91,
            87,
            89,
            86
          ],
          "cli/claude:claude-opus-4-7": [
            55,
            70,
            50,
            72,
            60
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          94,
          92,
          95,
          92,
          93
        ],
        "total": 466,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            94,
            93,
            96,
            92,
            93
          ],
          "cli/claude:claude-opus-4-7": [
            88,
            82,
            89,
            85,
            87
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "rotating_hypercube_projection": {
      "claude-opus-4-7": {
        "scores": [
          69,
          73,
          50,
          62,
          54
        ],
        "total": 308,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            68,
            78,
            55,
            60
          ],
          "cli/claude:claude-opus-4-7": [
            40,
            55,
            32,
            50,
            42
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            95,
            40,
            80,
            60
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          49,
          65,
          61,
          58,
          57
        ],
        "total": 290,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            68,
            52,
            50,
            45
          ],
          "cli/claude:claude-opus-4-7": [
            78,
            76,
            82,
            74,
            75
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            50,
            50,
            50,
            50
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          43,
          46,
          75,
          35,
          37
        ],
        "total": 236,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            48,
            58,
            62,
            38,
            35
          ],
          "cli/claude:claude-opus-4-7": [
            45,
            50,
            72,
            42,
            40
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            35,
            30,
            90,
            25,
            35
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "rounded_box": {
      "claude-opus-4-7": {
        "scores": [
          20,
          35,
          19,
          50,
          23
        ],
        "total": 147,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            22,
            38,
            18,
            42,
            15
          ],
          "cli/claude:claude-opus-4-7": [
            22,
            48,
            28,
            52,
            30
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            15,
            20,
            10,
            55,
            25
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          91,
          84,
          93,
          83,
          84
        ],
        "total": 435,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            88,
            86,
            90,
            82,
            84
          ],
          "cli/claude:claude-opus-4-7": [
            85,
            70,
            88,
            72,
            74
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            95,
            100,
            95,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          88,
          85,
          92,
          84,
          86
        ],
        "total": 435,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            88,
            84,
            90,
            80,
            82
          ],
          "cli/claude:claude-opus-4-7": [
            78,
            76,
            85,
            76,
            78
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            98,
            95,
            100,
            95,
            98
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "schwarzschild_black_hole": {
      "claude-opus-4-7": {
        "scores": [
          67,
          58,
          69,
          65,
          65
        ],
        "total": 324,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            45,
            53,
            40,
            56,
            39
          ],
          "cli/claude:claude-opus-4-7": [
            72,
            62,
            68,
            65,
            70
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            60,
            98,
            75,
            85
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          36,
          35,
          37,
          34,
          35
        ],
        "total": 177,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            5,
            3,
            8,
            1,
            2
          ],
          "cli/claude:claude-opus-4-7": [
            2,
            2,
            2,
            2,
            2
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          81,
          77,
          78,
          80,
          75
        ],
        "total": 391,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            70,
            76,
            55,
            72,
            58
          ],
          "cli/claude:claude-opus-4-7": [
            82,
            70,
            83,
            78,
            76
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            92,
            85,
            95,
            90,
            92
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "sierpinski_tetrahedron": {
      "claude-opus-4-7": {
        "scores": [
          37,
          51,
          29,
          38,
          31
        ],
        "total": 186,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            38,
            62,
            30,
            45,
            25
          ],
          "cli/claude:claude-opus-4-7": [
            42,
            40,
            38,
            38,
            48
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            30,
            50,
            20,
            30,
            20
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          64,
          58,
          66,
          48,
          56
        ],
        "total": 292,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            48,
            55,
            42,
            30
          ],
          "cli/claude:claude-opus-4-7": [
            80,
            76,
            78,
            72,
            78
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            55,
            50,
            65,
            30,
            60
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          54,
          59,
          52,
          43,
          50
        ],
        "total": 258,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            63,
            72,
            55,
            58,
            45
          ],
          "cli/claude:claude-opus-4-7": [
            48,
            40,
            55,
            32,
            50
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            50,
            65,
            45,
            40,
            55
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "sierpinski_triangle_6_iterations": {
      "claude-opus-4-7": {
        "scores": [
          94,
          91,
          95,
          92,
          90
        ],
        "total": 462,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            88,
            82,
            91,
            84,
            78
          ],
          "cli/claude:claude-opus-4-7": [
            93,
            91,
            93,
            91,
            92
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          68,
          71,
          69,
          79,
          71
        ],
        "total": 358,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            52,
            68,
            45,
            66,
            50
          ],
          "cli/claude:claude-opus-4-7": [
            88,
            84,
            88,
            87,
            82
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            65,
            60,
            75,
            85,
            80
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          8,
          44,
          6,
          23,
          14
        ],
        "total": 95,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            8,
            62,
            4,
            28,
            12
          ],
          "cli/claude:claude-opus-4-7": [
            5,
            30,
            3,
            20,
            10
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            40,
            10,
            20,
            20
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "spherical_inversion_mapping": {
      "claude-opus-4-7": {
        "scores": [
          4,
          15,
          2,
          3,
          6
        ],
        "total": 30,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            5,
            35,
            2,
            4,
            12
          ],
          "cli/claude:claude-opus-4-7": [
            5,
            4,
            3,
            5,
            4
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            1,
            5,
            1,
            1,
            1
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          29,
          14,
          40,
          15,
          56
        ],
        "total": 154,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            38,
            18,
            35,
            20,
            45
          ],
          "cli/claude:claude-opus-4-7": [
            20,
            15,
            25,
            15,
            22
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            30,
            10,
            60,
            10,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          47,
          65,
          41,
          58,
          76
        ],
        "total": 287,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            63,
            74,
            48,
            58,
            82
          ],
          "cli/claude:claude-opus-4-7": [
            48,
            42,
            55,
            32,
            45
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            30,
            80,
            20,
            85,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "spinning_gear_assembly": {
      "claude-opus-4-7": {
        "scores": [
          83,
          87,
          77,
          84,
          84
        ],
        "total": 415,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            78,
            86,
            68,
            82,
            76
          ],
          "cli/claude:claude-opus-4-7": [
            74,
            78,
            68,
            72,
            78
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            98,
            98,
            95,
            98,
            98
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          78,
          80,
          74,
          74,
          78
        ],
        "total": 384,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            68,
            74,
            55,
            66,
            62
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            70,
            68,
            60,
            74
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            98,
            95,
            98,
            96,
            98
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          68,
          81,
          54,
          62,
          71
        ],
        "total": 336,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            73,
            86,
            62,
            78,
            70
          ],
          "cli/claude:claude-opus-4-7": [
            62,
            68,
            65,
            62,
            58
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            70,
            88,
            35,
            45,
            85
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "spinning_vortex_funnel": {
      "claude-opus-4-7": {
        "scores": [
          12,
          15,
          8,
          9,
          12
        ],
        "total": 56,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            22,
            28,
            12,
            14,
            20
          ],
          "cli/claude:claude-opus-4-7": [
            5,
            8,
            3,
            4,
            5
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          48,
          58,
          37,
          59,
          57
        ],
        "total": 259,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            78,
            35,
            68,
            51
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            50,
            55,
            48,
            50
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            35,
            45,
            20,
            60,
            70
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          25,
          8,
          24,
          11,
          23
        ],
        "total": 91,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            50,
            10,
            50,
            18,
            20
          ],
          "cli/claude:claude-opus-4-7": [
            10,
            5,
            8,
            6,
            8
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            15,
            10,
            15,
            10,
            40
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "spiral_staircase_tower": {
      "claude-opus-4-7": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          37,
          38,
          39,
          29,
          39
        ],
        "total": 182,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            45,
            55,
            42,
            43,
            48
          ],
          "cli/claude:claude-opus-4-7": [
            50,
            35,
            55,
            35,
            55
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            15,
            25,
            20,
            10,
            15
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      }
    },
    "stella_octangula": {
      "claude-opus-4-7": {
        "scores": [
          95,
          90,
          95,
          93,
          93
        ],
        "total": 466,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            91,
            86,
            94,
            88,
            90
          ],
          "cli/claude:claude-opus-4-7": [
            93,
            87,
            92,
            90,
            89
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            98,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          89,
          83,
          89,
          80,
          86
        ],
        "total": 427,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            84,
            78,
            82,
            76,
            80
          ],
          "cli/claude:claude-opus-4-7": [
            83,
            80,
            86,
            78,
            82
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            90,
            100,
            85,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "superformula_explorer": {
      "claude-opus-4-7": {
        "scores": [
          79,
          76,
          82,
          77,
          71
        ],
        "total": 385,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            76,
            70,
            78,
            57
          ],
          "cli/claude:claude-opus-4-7": [
            70,
            68,
            78,
            68,
            65
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            85,
            98,
            85,
            90
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          78,
          83,
          82,
          80,
          73
        ],
        "total": 396,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            84,
            70,
            76,
            58
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            70,
            78,
            68,
            65
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            95,
            98,
            95,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          9,
          18,
          21,
          9,
          9
        ],
        "total": 66,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            8,
            28,
            18,
            10,
            6
          ],
          "cli/claude:claude-opus-4-7": [
            8,
            12,
            30,
            8,
            10
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            15,
            15,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "taper_shear_transformation": {
      "claude-opus-4-7": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "gemini-3.1-pro-preview": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          29,
          42,
          29,
          30,
          33
        ],
        "total": 163,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            54,
            66,
            43,
            50
          ],
          "cli/claude:claude-opus-4-7": [
            14,
            26,
            12,
            22,
            18
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            15,
            45,
            10,
            25,
            30
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "topology_fabric_texture": {
      "claude-opus-4-7": {
        "scores": [
          7,
          15,
          6,
          6,
          6
        ],
        "total": 40,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            6,
            24,
            3,
            4,
            3
          ],
          "cli/claude:claude-opus-4-7": [
            6,
            10,
            4,
            4,
            4
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          56,
          70,
          50,
          61,
          57
        ],
        "total": 294,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            46,
            72,
            34,
            58,
            43
          ],
          "cli/claude:claude-opus-4-7": [
            38,
            55,
            32,
            48,
            40
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            82,
            85,
            78,
            88
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          32,
          35,
          30,
          26,
          26
        ],
        "total": 149,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            34,
            57,
            22,
            42,
            31
          ],
          "cli/claude:claude-opus-4-7": [
            28,
            34,
            24,
            22,
            22
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            35,
            15,
            45,
            15,
            25
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "torus_donut_parametric": {
      "claude-opus-4-7": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          5,
          11,
          13,
          8,
          7
        ],
        "total": 44,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            5,
            18,
            8,
            6,
            4
          ],
          "cli/claude:claude-opus-4-7": [
            8,
            12,
            30,
            18,
            15
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            1,
            2,
            1,
            1,
            2
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          83,
          81,
          86,
          78,
          79
        ],
        "total": 407,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            82,
            84,
            86,
            76,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            58,
            78,
            60,
            65
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            98,
            100,
            95,
            98,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "trefoil_alexander_polynomial": {
      "claude-opus-4-7": {
        "scores": [
          39,
          83,
          33,
          80,
          41
        ],
        "total": 276,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            38,
            84,
            42,
            78,
            36
          ],
          "cli/claude:claude-opus-4-7": [
            28,
            68,
            22,
            62,
            28
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            50,
            98,
            35,
            100,
            60
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          53,
          73,
          40,
          82,
          56
        ],
        "total": 304,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            88,
            38,
            84,
            62
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            82,
            32,
            82,
            55
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            50,
            50,
            50,
            80,
            50
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      }
    },
    "trigonometric_mandalas": {
      "claude-opus-4-7": {
        "scores": [
          83,
          87,
          87,
          82,
          78
        ],
        "total": 417,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            88,
            92,
            84,
            86,
            85
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            72,
            78,
            62,
            58
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            92,
            96,
            98,
            98,
            90
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          78,
          76,
          79,
          75,
          73
        ],
        "total": 381,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            78,
            86,
            74,
            76,
            75
          ],
          "cli/claude:claude-opus-4-7": [
            55,
            42,
            62,
            48,
            45
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          78,
          75,
          88,
          79,
          76
        ],
        "total": 396,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            72,
            74,
            82,
            68,
            66
          ],
          "cli/claude:claude-opus-4-7": [
            78,
            72,
            82,
            74,
            76
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            85,
            80,
            100,
            95,
            85
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "truncated_icosahedron": {
      "claude-opus-4-7": {
        "scores": [
          47,
          59,
          42,
          52,
          50
        ],
        "total": 250,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            67,
            58,
            64,
            52,
            63
          ],
          "cli/claude:claude-opus-4-7": [
            55,
            58,
            52,
            55,
            62
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            20,
            60,
            10,
            50,
            25
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          41,
          74,
          30,
          65,
          47
        ],
        "total": 257,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            74,
            38,
            61,
            55
          ],
          "cli/claude:claude-opus-4-7": [
            45,
            58,
            42,
            38,
            45
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            20,
            90,
            10,
            95,
            40
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          88,
          82,
          90,
          82,
          88
        ],
        "total": 430,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            86,
            82,
            84,
            78,
            86
          ],
          "cli/claude:claude-opus-4-7": [
            82,
            74,
            87,
            76,
            83
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            90,
            98,
            92,
            95
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "twisted_stellated_polyhedron": {
      "claude-opus-4-7": {
        "scores": [
          53,
          65,
          41,
          55,
          50
        ],
        "total": 264,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            45,
            58,
            34,
            36,
            42
          ],
          "cli/claude:claude-opus-4-7": [
            55,
            62,
            50,
            58,
            54
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            60,
            75,
            40,
            70,
            55
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          41,
          38,
          34,
          31,
          36
        ],
        "total": 180,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            52,
            48,
            38,
            32,
            42
          ],
          "cli/claude:claude-opus-4-7": [
            52,
            50,
            48,
            45,
            50
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            20,
            15,
            15,
            15,
            15
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "voronoi_diagram": {
      "claude-opus-4-7": {
        "scores": [
          88,
          91,
          91,
          85,
          87
        ],
        "total": 442,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            82,
            86,
            87,
            84,
            78
          ],
          "cli/claude:claude-opus-4-7": [
            82,
            86,
            86,
            72,
            82
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": null,
        "total": null,
        "scores_by_judge": null,
        "has_image": false,
        "status": "render_fail"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          91,
          91,
          95,
          91,
          90
        ],
        "total": 458,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            88,
            86,
            94,
            91,
            84
          ],
          "cli/claude:claude-opus-4-7": [
            86,
            88,
            90,
            83,
            85
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            100,
            100,
            100,
            100,
            100
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "wave_deformation_field": {
      "claude-opus-4-7": {
        "scores": [
          21,
          22,
          23,
          20,
          18
        ],
        "total": 104,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            34,
            42,
            48,
            30,
            28
          ],
          "cli/claude:claude-opus-4-7": [
            18,
            15,
            15,
            14,
            15
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            5,
            15,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          78,
          81,
          78,
          77,
          77
        ],
        "total": 391,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            74,
            82,
            68,
            78,
            72
          ],
          "cli/claude:claude-opus-4-7": [
            62,
            65,
            68,
            58,
            62
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            98,
            95,
            98,
            95,
            98
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          18,
          13,
          25,
          12,
          18
        ],
        "total": 86,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            34,
            22,
            42,
            18,
            31
          ],
          "cli/claude:claude-opus-4-7": [
            10,
            8,
            22,
            9,
            12
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            10,
            10,
            10,
            10
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    },
    "weierstrass_function": {
      "claude-opus-4-7": {
        "scores": [
          74,
          72,
          74,
          64,
          64
        ],
        "total": 348,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            58,
            62,
            41,
            57,
            39
          ],
          "cli/claude:claude-opus-4-7": [
            68,
            65,
            82,
            55,
            62
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            90,
            100,
            80,
            90
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "gemini-3.1-pro-preview": {
        "scores": [
          49,
          67,
          50,
          60,
          58
        ],
        "total": 284,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            74,
            78,
            61,
            70,
            63
          ],
          "cli/claude:claude-opus-4-7": [
            62,
            72,
            78,
            60,
            62
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            10,
            50,
            10,
            50,
            50
          ]
        },
        "has_image": true,
        "status": "ok"
      },
      "codex-gpt-5.5-high": {
        "scores": [
          81,
          81,
          68,
          78,
          70
        ],
        "total": 378,
        "scores_by_judge": {
          "cli/codex:gpt-5.5:high": [
            66,
            78,
            35,
            72,
            42
          ],
          "cli/claude:claude-opus-4-7": [
            82,
            80,
            74,
            78,
            78
          ],
          "cli/gemini:gemini-3.1-pro-preview": [
            95,
            85,
            95,
            85,
            90
          ]
        },
        "has_image": true,
        "status": "ok"
      }
    }
  },
  "summary": {
    "claude-opus-4-7": {
      "ok": 117,
      "permanent_fail": 13,
      "total": 130,
      "avg_total_filtered": 261.28205128205127,
      "avg_total_with_zeros": 235.15384615384616,
      "avg_total_by_judge_filtered": {
        "cli/codex:gpt-5.5:high": 252.8803418803419,
        "cli/claude:claude-opus-4-7": 236.25641025641025,
        "cli/gemini:gemini-3.1-pro-preview": 294.79487179487177
      },
      "judge_score_counts": {
        "cli/codex:gpt-5.5:high": 117,
        "cli/claude:claude-opus-4-7": 117,
        "cli/gemini:gemini-3.1-pro-preview": 117
      },
      "best_problem": {
        "name": "epicycloids",
        "total": 476
      },
      "worst_problem": {
        "name": "menger_cube_fractal",
        "total": 19
      }
    },
    "gemini-3.1-pro-preview": {
      "ok": 111,
      "permanent_fail": 19,
      "total": 130,
      "avg_total_filtered": 262.39639639639637,
      "avg_total_with_zeros": 224.04615384615386,
      "avg_total_by_judge_filtered": {
        "cli/codex:gpt-5.5:high": 259.47747747747746,
        "cli/claude:claude-opus-4-7": 221.02702702702703,
        "cli/gemini:gemini-3.1-pro-preview": 306.55855855855856
      },
      "judge_score_counts": {
        "cli/codex:gpt-5.5:high": 111,
        "cli/claude:claude-opus-4-7": 111,
        "cli/gemini:gemini-3.1-pro-preview": 111
      },
      "best_problem": {
        "name": "epicycloids",
        "total": 473
      },
      "worst_problem": {
        "name": "mandelbulb_fractal",
        "total": 9
      }
    },
    "codex-gpt-5.5-high": {
      "ok": 122,
      "permanent_fail": 8,
      "total": 130,
      "avg_total_filtered": 258.07377049180326,
      "avg_total_with_zeros": 242.19230769230768,
      "avg_total_by_judge_filtered": {
        "cli/codex:gpt-5.5:high": 277.4590163934426,
        "cli/claude:claude-opus-4-7": 219.5,
        "cli/gemini:gemini-3.1-pro-preview": 277.60655737704917
      },
      "judge_score_counts": {
        "cli/codex:gpt-5.5:high": 122,
        "cli/claude:claude-opus-4-7": 122,
        "cli/gemini:gemini-3.1-pro-preview": 122
      },
      "best_problem": {
        "name": "five_pointed_star_polygon",
        "total": 466
      },
      "worst_problem": {
        "name": "archimedean_spiral_galaxy",
        "total": 14
      }
    }
  }
}