20241029_OpenHands-CodeAct-2.1-sonnet-20241022
20241028_solver
20241022_tools_claude-3-5-sonnet-updated
20241025_composio_swekit
20241023_emergent
20240924_solver
20240824_gru
20240920_solver
20241022_tools_claude-3-5-haiku
20241016_composio_swekit
20240820_honeycomb
20241029_epam-ai-run-claude-3-5-sonnet
20241028_agentless-1.5_gpt4o
20240721_amazon-q-developer-agent-20240719-dev
20240628_autocoderover-v20240620
20240617_factory_code_droid
20240620_sweagent_claude3.5sonnet
20241007_nfactorial
20241002_lingma-agent_lingma-swe-gpt-72b
20241016_epam-ai-run-gpt-4o
20240615_appmap-navie_gpt4o
20241001_nfactorial
20240509_amazon-q-developer-agent-20240430-dev
20240918_lingma-agent_lingma-swe-gpt-72b
20240820_epam-ai-run-gpt-4o
20240728_sweagent_gpt4o
20240402_sweagent_gpt4
20241002_lingma-agent_lingma-swe-gpt-7b
20240402_sweagent_claude3opus
20240918_lingma-agent_lingma-swe-gpt-7b
20240402_rag_claude3opus
20231010_rag_claude2
20240402_rag_gpt4
20231010_rag_swellama7b
20231010_rag_swellama13b
20231010_rag_gpt35
astropy__astropy-13033
django__django-11477
django__django-13512
django__django-15098
django__django-16263
matplotlib__matplotlib-25960
pytest-dev__pytest-10356
sphinx-doc__sphinx-11510
sphinx-doc__sphinx-9461
sympy__sympy-18199
astropy__astropy-13236
django__django-15916
sphinx-doc__sphinx-10323
django__django-11239
django__django-14351
sympy__sympy-13031
matplotlib__matplotlib-20826
astropy__astropy-8872
django__django-15161
sympy__sympy-15345
scikit-learn__scikit-learn-25102
scikit-learn__scikit-learn-10908
django__django-15128
django__django-14017
astropy__astropy-14539
django__django-16136
pydata__xarray-3151
django__django-15561
django__django-15863
django__django-16642
django__django-12741
django__django-10880
pydata__xarray-4966
psf__requests-1921
django__django-12713
django__django-13516
django__django-15741
astropy__astropy-14995
django__django-15315
sympy__sympy-16886
django__django-13820
django__django-11603
sympy__sympy-13480
astropy__astropy-14309
django__django-15467
pylint-dev__pylint-6903
0
0.2
0.4
0.6
0.8
1
pass1_ex
model
example_id
plotly-logomark