<?xml version="1.0"?>
<News hasArchived="false" page="1" pageCount="1" pageSize="10" timestamp="Mon, 27 Apr 2026 12:25:44 -0400" url="https://beta.my.umbc.edu/groups/umbc-ai/posts.xml?tag=benchmark">
<NewsItem contentIssues="true" id="146462" important="false" status="posted" url="https://beta.my.umbc.edu/groups/umbc-ai/posts/146462">
<Title>Benchmarks that have been killed by LLM based systems</Title>
<Body>
<![CDATA[
    <div class="html-content"><img src="https://ai.umbc.edu/wp-content/uploads/sites/734/2025/01/killed_by_llm.png" style="max-width: 100%; height: auto;"><div><br></div><div><span><p><a href="https://r0bk.github.io/killedbyllm/" rel="nofollow external" class="bo"><span><strong>Killed by LLM</strong></span></a><span> is a project that documents public AI benchmarks that LLM-based AI systems have largely solved since 2018.  Getting killed means that a benchmark no longer measures the frontier of AI technology as a challenge asking "Can AI do X?", but might still be a useful tool. Links to papers documenting fallen benchmarks are provided.</span></p><span>The project is on </span><a href="https://github.com/R0bk/killedbyllm" rel="nofollow external" class="bo"><span><strong>GitHub</strong></span></a><span>, and other people are invited to contribute new benchmarks that have been overcome.</span></span></div><div><span><span><br></span></span></div>
    <hr><a href="https://ai.umbc.edu/" rel="nofollow external" class="bo"><strong>UMBC Center for AI</strong></a></div>
]]>
</Body>
<Summary>Killed by LLM is a project that documents public AI benchmarks that LLM-based AI systems have largely solved since 2018.  Getting killed means that a benchmark no longer measures the frontier of...</Summary>
<Website>https://r0bk.github.io/killedbyllm/</Website>
<TrackingUrl>https://beta.my.umbc.edu/api/v0/pixel/news/146462/guest@my.umbc.edu/ca6832dc7212f2aa8d1e3e650c26f51c/api/pixel</TrackingUrl>
<Tag>ai</Tag>
<Tag>benchmark</Tag>
<Tag>llm</Tag>
<Group token="umbc-ai">UMBC AI</Group>
<GroupUrl>https://beta.my.umbc.edu/groups/umbc-ai</GroupUrl>
<AvatarUrl>https://assets4-beta.my.umbc.edu/system/shared/avatars/groups/000/002/081/cfb27ebe008c2636486089a759ea5c36/xsmall.png?1691095779</AvatarUrl>
<AvatarUrl size="original">https://assets2-beta.my.umbc.edu/system/shared/avatars/groups/000/002/081/cfb27ebe008c2636486089a759ea5c36/original.png?1691095779</AvatarUrl>
<AvatarUrl size="xxlarge">https://assets1-beta.my.umbc.edu/system/shared/avatars/groups/000/002/081/cfb27ebe008c2636486089a759ea5c36/xxlarge.png?1691095779</AvatarUrl>
<AvatarUrl size="xlarge">https://assets1-beta.my.umbc.edu/system/shared/avatars/groups/000/002/081/cfb27ebe008c2636486089a759ea5c36/xlarge.png?1691095779</AvatarUrl>
<AvatarUrl size="large">https://assets1-beta.my.umbc.edu/system/shared/avatars/groups/000/002/081/cfb27ebe008c2636486089a759ea5c36/large.png?1691095779</AvatarUrl>
<AvatarUrl size="medium">https://assets3-beta.my.umbc.edu/system/shared/avatars/groups/000/002/081/cfb27ebe008c2636486089a759ea5c36/medium.png?1691095779</AvatarUrl>
<AvatarUrl size="small">https://assets3-beta.my.umbc.edu/system/shared/avatars/groups/000/002/081/cfb27ebe008c2636486089a759ea5c36/small.png?1691095779</AvatarUrl>
<AvatarUrl size="xsmall">https://assets4-beta.my.umbc.edu/system/shared/avatars/groups/000/002/081/cfb27ebe008c2636486089a759ea5c36/xsmall.png?1691095779</AvatarUrl>
<AvatarUrl size="xxsmall">https://assets1-beta.my.umbc.edu/system/shared/avatars/groups/000/002/081/cfb27ebe008c2636486089a759ea5c36/xxsmall.png?1691095779</AvatarUrl>
<Sponsor>UMBC AI</Sponsor>
<PawCount>0</PawCount>
<CommentCount>0</CommentCount>
<CommentsAllowed>true</CommentsAllowed>
<PostedAt>Tue, 07 Jan 2025 09:18:50 -0500</PostedAt>
<EditAt>Tue, 07 Jan 2025 09:20:46 -0500</EditAt>
</NewsItem>

</News>
