<?xml version="1.0" encoding="UTF-8"?><rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	>

<channel>
	<!-- Channel-level metadata for this author feed. -->
	<title>Christian Bock &#8211; Noise</title>
	<!-- Self-reference: the URL this feed document is served from. -->
	<atom:link
		href="https://noise.getoto.net/author/christian-bock/feed/"
		rel="self"
		type="application/rss+xml"/>
	<link>https://noise.getoto.net</link>
	<description>The collective thoughts of the interwebz</description>
	<!-- RSS 2.0 dates use the RFC 822 format; do not convert to ISO 8601. -->
	<lastBuildDate>Wed, 23 Apr 2025 18:36:20 +0000</lastBuildDate>
	<language>en-US</language>
	<!--
	  Syndication-module refresh hint: updateFrequency is the number of updates
	  per updatePeriod, so these two values together mean "once per hour".
	  Each value is kept on a single line so that no indentation whitespace
	  becomes part of the element text.
	-->
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
	<!-- URI identifying the software that produced this feed. -->
	<generator>https://wordpress.org/?v=6.8.2</generator>
	<!--
	  One feed entry. No enclosure element is emitted because this entry
	  carries no attached media: RSS 2.0 requires an enclosure to have a real
	  URL, a byte length and a MIME type, so an empty placeholder is invalid.
	-->
	<item>
		<title>Amazon introduces SWE-PolyBench, a multilingual benchmark for AI Coding Agents</title>
		<link>https://noise.getoto.net/2025/04/23/amazon-introduces-swe-polybench-a-multilingual-benchmark-for-ai-coding-agents/</link>
		<dc:creator><![CDATA[Christian Bock]]></dc:creator>
		<pubDate>Wed, 23 Apr 2025 18:36:20 +0000</pubDate>
		<category><![CDATA[announcements]]></category>
		<category><![CDATA[artificial intelligence]]></category>
		<category><![CDATA[Thought Leadership]]></category>
		<category><![CDATA[Uncategorized]]></category>
		<!-- isPermaLink="false": treat the guid as an opaque identifier, not as a link to open. -->
		<guid isPermaLink="false">http://noise.getoto.net/?guid=0be65389dd60ae99f7ccdf808f2e131d</guid>
		<description><![CDATA[Coding agents powered by large language models have shown impressive capabilities in software engineering tasks, but evaluating their performance across diverse programming languages and real-world scenarios remains challenging. This led to a recent explosion in benchmark creation to assess the coding effectiveness of said systems in controlled environments. In particular, SWE-Bench which measures the performance […]]]></description>
	</item>
	</channel>
</rss>

<!--
Performance optimized by W3 Total Cache. Learn more: https://www.boldgrid.com/w3-total-cache/

Object Caching 27/52 objects using Memcached
Page Caching using Disk: Enhanced 
Lazy Loading (feed)
Database Caching using Memcached

Served from: noise.getoto.net @ 2026-02-09 01:53:31 by W3 Total Cache
-->