{"id":16242,"date":"2026-04-27T03:02:00","date_gmt":"2026-04-26T18:02:00","guid":{"rendered":"https:\/\/jore2.com\/ai-6459-why-swe-bench-verified-no-longer-measures-frontier-coding-capabilities\/"},"modified":"2026-04-27T03:02:00","modified_gmt":"2026-04-26T18:02:00","slug":"ai-6459-why-swe-bench-verified-no-longer-measures-frontier-coding-capabilities","status":"publish","type":"post","link":"https:\/\/jore2.com\/?p=16242","title":{"rendered":"SWE-bench Verified, \ub354 \uc774\uc0c1 \ucd5c\uc0c1\uc704 \ucf54\ub529 \ub2a5\ub825\uc744 \uac00\ub2a0\ud560 \uc218 \uc5c6\ub294 \uc774\uc720"},"content":{"rendered":"<div class=\"jore2-editor-byline\">\n<p><strong>\ubc30\uc18c\ub77c<\/strong><\/p>\n<\/div>\n<p>\ucd5c\uadfc AI \uac1c\ubc1c \ucee4\ubba4\ub2c8\ud2f0\uc640 \uae30\uc220 \uc804\ubb38\uac00\ub4e4 \uc0ac\uc774\uc5d0\uc11c SWE-bench Verified\uc758 \uc2e0\ub8b0\uc131\uc5d0 \ub300\ud55c \uc758\ubb38\uc774 \ub728\uac81\uac8c \ub2ec\uc544\uc624\ub974\uace0 \uc788\uc2b5\ub2c8\ub2e4. \uc624\ub7ab\ub3d9\uc548 \ucd5c\ucca8\ub2e8 AI \ubaa8\ub378\uc758 \ucf54\ub529 \ub2a5\ub825\uc744 \uce21\uc815\ud558\ub294 \ub370 \uc788\uc5b4 \uac00\uc7a5 \uacf5\uc2e0\ub825 \uc788\ub294 \uc9c0\ud45c\ub85c \uc5ec\uaca8\uc84c\ub358 \uc774 \ubca4\uce58\ub9c8\ud06c\uac00, \uc774\uc81c\ub294 \uadf8 \ubcf8\ub798\uc758 \uc5ed\ud560\uc744 \uc81c\ub300\ub85c \uc218\ud589\ud558\uc9c0 \ubabb\ud55c\ub2e4\ub294 \uc9c0\uc801\uc774 \uc787\ub530\ub974\uace0 \uc788\uae30 \ub54c\ubb38\uc785\ub2c8\ub2e4. \ud2b9\ud788 \uc624\ud508AI\ub97c \ube44\ub86f\ud55c \uc8fc\uc694 \uae30\uc5c5\ub4e4\uc774 \uc774 \ubca4\uce58\ub9c8\ud06c\ub97c \ub354 \uc774\uc0c1 \ucd5c\uc0c1\uc704 \ubaa8\ub378\uc758 \ucf54\ub529 \ub2a5\ub825\uc744 \ud310\ub2e8\ud558\ub294 \uae30\uc900\uc73c\ub85c \uc0bc\uc9c0 \uc54a\uae30\ub85c \uacf5\uc2dd\uc801\uc73c\ub85c \uc785\uc7a5\uc744 \ubc1d\ud788\uba74\uc11c, \uae30\uc220\uacc4\uc758 \uc2dc\uc120\uc774 \uc9d1\uc911\ub418\uace0 \uc788\uc2b5\ub2c8\ub2e4.<\/p>\n<p>\uc774 \ubcc0\ud654\uc758 \ubc30\uacbd\uc5d0\ub294 \ub450 \uac00\uc9c0 \uacb0\uc815\uc801\uc778 \ubb38\uc81c\uac00 \uc790\ub9ac \uc7a1\uace0 \uc788\uc2b5\ub2c8\ub2e4. \uba3c\uc800, \ubca4\uce58\ub9c8\ud06c \uc790\uccb4\uc758 \ud14c\uc2a4\ud2b8 \ucf00\uc774\uc2a4\uac00 \uac00\uc9c4 \uad6c\uc870\uc801 \uacb0\ud568\uc785\ub2c8\ub2e4. \uc218\ubc31 \uac1c\uc758 \ubb38\uc81c \uc911 \uc0c1\ub2f9\uc218\uac00 \uc9c0\ub098\uce58\uac8c \uad6c\uccb4\uc801\uc778 \uad6c\ud604 \uc138\ubd80\uc0ac\ud56d\uc744 \uc694\uad6c\ud558\uac70\ub098, \ubb38\uc81c \ubb38\uc7a5\uc5d0 \uba85\uc2dc\ub418\uc9c0 \uc54a\uc740 \uae30\ub2a5\uc744 \ud14c\uc2a4\ud2b8\ud558\ub294 \ub4f1 \ub108\ubb34 \uad11\ubc94\uc704\ud55c \uc870\uac74\uc744 \ub2f4\uace0 \uc788\uc5b4, \uc2e4\uc81c\ub85c\ub294 \uc815\uc0c1\uc801\uc73c\ub85c \uc791\ub3d9\ud558\ub294 \uc194\ub8e8\uc158\uae4c\uc9c0\ub3c4 \ud2c0\ub9b0 \uac83\uc73c\ub85c \ud310\uc815\ud558\ub294 \uc624\ub958\uac00 \ubc1c\uc0dd\ud588\uc2b5\ub2c8\ub2e4. \uc774\ub294 \ubaa8\ub378\uc758 \uc9c4\uc815\ud55c \ucf54\ub529 \ub2a5\ub825\uc744 \uc65c\uace1\ud558\uc5ec \ubcf4\uc5ec\uc904 \uc218\ubc16\uc5d0 \uc5c6\ub294 \uce58\uba85\uc801\uc778 \uc57d\uc810\uc774\uc5c8\uc2b5\ub2c8\ub2e4.<\/p>\n<p>\ub354 \ud070 \ubb38\uc81c\ub294 \ud559\uc2b5 \ub370\uc774\ud130 \uc624\uc5fc \ud604\uc0c1\uc785\ub2c8\ub2e4. \ud604\uc7ac \uc2dc\ud310 \uc911\uc778 \ucd5c\ucca8\ub2e8 \ubaa8\ub378\ub4e4\uc774 SWE-bench Verified\uc5d0 \ud3ec\ud568\ub41c \ubb38\uc81c\uc640 \uc815\ub2f5 \ucf54\ub4dc\ub97c \uc774\ubbf8 \ud559\uc2b5 \ub370\uc774\ud130\ub85c \uc811\ud588\uc744 \uac00\ub2a5\uc131\uc774 \ub9e4\uc6b0 \ub192\ub2e4\ub294 \uc0ac\uc2e4\uc774 \ub4dc\ub7ec\ub0ac\uc2b5\ub2c8\ub2e4. \ubaa8\ub378\uc774 \ubb38\uc81c\ub97c \ud478\ub294 \ub2a5\ub825\uc774 \uc544\ub2c8\ub77c, \ub2e8\uc21c\ud788 \uc774\uc804\uc5d0 \ubcf8 \ub370\uc774\ud130\ub97c \uae30\uc5b5\ud574 \ub0b4\ub294 \uc131\ub2a5\uc744 \ubcf4\uc5ec\uc8fc\ub294 \uacbd\uc6b0\uac00 \ub9ce\uc544\uc9c4 \uac83\uc785\ub2c8\ub2e4. \uc774\ub85c \uc778\ud574 \ubca4\uce58\ub9c8\ud06c \uc810\uc218\uc758 \uc0c1\uc2b9\uc774 \uc2e4\uc81c \ucf54\ub529 \ub2a5\ub825\uc758 \ud5a5\uc0c1\ubcf4\ub2e4\ub294 \ud559\uc2b5 \ub370\uc774\ud130 \ub178\ucd9c\uc5d0 \uc758\ud55c \uacb0\uacfc\uc77c \uac00\ub2a5\uc131\uc774 \ud06c\ub2e4\ub294 \ube44\ud310\uc774 \uc81c\uae30\ub418\uc5c8\uc2b5\ub2c8\ub2e4.<\/p>\n<p>\uc774\ub7ec\ud55c \uc0c1\ud669\uc740 \uc5c5\uacc4 \uc804\ubc18\uc5d0 \uc0c8\ub85c\uc6b4 \ud3c9\uac00 \uae30\uc900\uc744 \uc694\uad6c\ud558\ub294 \ud750\ub984\uc744 \ub9cc\ub4e4\uc5c8\uc2b5\ub2c8\ub2e4. \ub2e8\uc21c\ud788 \uacf5\uac1c\ub41c \ub370\uc774\ud130\uc14b\uc744 \uae30\ubc18\uc73c\ub85c \ud55c \ubca4\uce58\ub9c8\ud06c\uac00 \uc544\ub2cc, \ubaa8\ub378 \ucd9c\uc2dc \uc2dc\uc810\uc5d0 \ub9de\ucdb0 \uc0c8\ub85c \uc791\uc131\ub418\uac70\ub098 \ube44\uacf5\uac1c\ub85c \uc720\uc9c0\ub418\ub294 \ubca4\uce58\ub9c8\ud06c\uc758 \ud544\uc694\uc131\uc774 \uac15\uc870\ub418\uace0 \uc788\uc2b5\ub2c8\ub2e4. \ud2b9\ud788 \uc2e4\uc81c \uc5c5\ubb34 \ud658\uacbd\uacfc \uc720\uc0ac\ud55c \ubcf5\uc7a1\ud55c \uacfc\uc81c\ub97c \uc218\ud589\ud558\ub294 \ub2a5\ub825\uc744 \uce21\uc815\ud558\uae30 \uc704\ud574, \ub370\uc774\ud130 \uc624\uc5fc\uc758 \uc6b0\ub824\uac00 \uc801\uc740 SWE-bench Pro\uc640 \uac19\uc740 \ucc28\uc138\ub300 \uc9c0\ud45c\ub85c \ub208\uc744 \ub3cc\ub9ac\ub294 \uc6c0\uc9c1\uc784\uc774 \ud65c\ubc1c\ud574\uc9c0\uace0 \uc788\uc2b5\ub2c8\ub2e4. \uae30\uc220\uc758 \ubc1c\uc804 \uc18d\ub3c4\uac00 \ube68\ub77c\uc9c8\uc218\ub85d \ubca4\uce58\ub9c8\ud06c \uc5ed\uc2dc \ube60\ub974\uac8c \uad6c\uc2dd\uc774 \ub420 \uc218\ubc16\uc5d0 \uc5c6\ub2e4\ub294 \ud604\uc2e4\uc744 \uc9c1\uc2dc\ud558\uba70, \uc5c5\uacc4\ub294 \ub354 \ud22c\uba85\ud558\uace0 \uacf5\uc815\ud55c \ud3c9\uac00 \ubc29\uc2dd\uc744 \ucc3e\uae30 \uc704\ud55c \uace0\ubbfc\uc744 \uc774\uc5b4\uac00\uace0 \uc788\uc2b5\ub2c8\ub2e4.<\/p>\n","protected":false},"excerpt":{"rendered":"<p>\uacfc\uac70 AI \ubaa8\ub378\uc758 \ucf54\ub529 \uc2e4\ub825\uc744 \ud310\ub2e8\ud558\ub358 \uae08\ud45c\uc900 SWE-bench Verified\uac00 \uc774\uc81c \uc2e0\ub8b0\ub97c \uc783\uace0 \uc788\uc2b5\ub2c8\ub2e4. \ud559\uc2b5 \ub370\uc774\ud130 \uc624\uc5fc\uacfc \ud14c\uc2a4\ud2b8 \ucf00\uc774\uc2a4\uc758 \uacb0\ud568\uc774\ub77c\ub294 \ub450 \uac00\uc9c0 \ud575\uc2ec \ubb38\uc81c\uac00 \ub4dc\ub7ec\ub098\uba74\uc11c, \uc5c5\uacc4\ub294 \uc0c8\ub85c\uc6b4 \ud3c9\uac00 \uae30\uc900\uc744 \ubaa8\uc0c9\ud558\uace0 \uc788\uc2b5\ub2c8\ub2e4.<\/p>\n","protected":false},"author":11,"featured_media":16241,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[8858],"tags":[7,11327,8382,11329,11328],"class_list":["post-16242","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-ai","tag-ai","tag-swe-bench","tag-8382","tag-11329","tag-11328"],"featured_image_urls":{"full":["https:\/\/jore2.com\/wp-content\/uploads\/2026\/04\/0000107159-002-20250927200015554.png",1280,510,false],"thumbnail":["https:\/\/jore2.com\/wp-content\/uploads\/2026\/04\/0000107159-002-20250927200015554-150x150.png",150,150,true],"medium":["https:\/\/jore2.com\/wp-content\/uploads\/2026\/04\/0000107159-002-20250927200015554-300x120.png",300,120,true],"medium_large":["https:\/\/jore2.com\/wp-content\/uploads\/2026\/04\/0000107159-002-20250927200015554-768x306.png",640,255,true],"large":["https:\/\/jore2.com\/wp-content\/uploads\/2026\/04\/0000107159-002-20250927200015554-1024x408.png",640,255,true],"1536x1536":["https:\/\/jore2.com\/wp-content\/uploads\/2026\/04\/0000107159-002-20250927200015554.png",1280,510,false],"2048x2048":["https:\/\/jore2.com\/wp-content\/uploads\/2026\/04\/0000107159-002-20250927200015554.png",1280,510,false],"morenews-large":["https:\/\/jore2.com\/wp-content\/uploads\/2026\/04\/0000107159-002-20250927200015554-825x510.png",825,510,true],"morenews-medium":["https:\/\/jore2.com\/wp-content\/uploads\/2026\/04\/0000107159-002-20250927200015554-590x410.png",590,410,true]},"author_info":{"info":["\ubc30\uc18c\ub77c"]},"category_info":"<a href=\"https:\/\/jore2.com\/?cat=8858\" rel=\"category\">AI<\/a>","tag_info":"AI","comment_count":"0","_links":{"self":[{"href":"https:\/\/jore2.com\/index.php?rest_route=\/wp\/v2\/posts\/16242","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/jore2.com\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/jore2.com\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/jore2.com\/index.php?rest_route=\/wp\/v2\/users\/11"}],"replies":[{"embeddable":true,"href":"https:\/\/jore2.com\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=16242"}],"version-history":[{"count":0,"href":"https:\/\/jore2.com\/index.php?rest_route=\/wp\/v2\/posts\/16242\/revisions"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/jore2.com\/index.php?rest_route=\/wp\/v2\/media\/16241"}],"wp:attachment":[{"href":"https:\/\/jore2.com\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=16242"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/jore2.com\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=16242"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/jore2.com\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=16242"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}