<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd" xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
<url>
<loc>https://metr.org/blog/2023-03-18-update-on-recent-evals/</loc>
<lastmod>2023-03-17T08:22:42-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2023-08-01-new-report/</loc>
<lastmod>2023-07-31T13:00:17-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2023-09-19-spin-out-announcement/</loc>
<lastmod>2023-09-19T08:22:42-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2023-09-26-rsp/</loc>
<lastmod>2023-09-26T03:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2023-12-04-metr-announcement/</loc>
<lastmod>2023-12-04T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2023-12-16-bounty-diverse-hard-tasks-for-llm-agents/</loc>
<lastmod>2023-12-16T12:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2024-02-07-2023-year-in-review/</loc>
<lastmod>2024-02-07T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2024-02-29-METR-task-standard/</loc>
<lastmod>2024-02-29T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2024-03-13-autonomy-evaluation-resources/</loc>
<lastmod>2024-03-15T05:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2024-04-26-emma-abele-executive-director/</loc>
<lastmod>2024-04-26T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2024-05-16-ml-engineers-needed/</loc>
<lastmod>2024-05-16T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2024-08-06-update-on-evaluations/</loc>
<lastmod>2024-08-06T10:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2024-10-09-new-support-through-the-audacious-project/</loc>
<lastmod>2024-10-09T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2024-11-12-rogue-replication-threat-model/</loc>
<lastmod>2024-11-12T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2024-11-22-evaluating-r-d-capabilities-of-llms/</loc>
<lastmod>2024-11-22T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2025-01-17-ai-models-dangerous-before-public-deployment/</loc>
<lastmod>2025-01-17T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2025-01-31-update-sonnet-o1-evals/</loc>
<lastmod>2025-01-31T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2025-02-14-measuring-automated-kernel-engineering/</loc>
<lastmod>2025-02-14T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2025-02-27-gpt-4-5-evals/</loc>
<lastmod>2025-02-27T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2025-03-11-good-for-ai-to-reason-legibly-and-faithfully/</loc>
<lastmod>2025-03-11T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2025-03-19-measuring-ai-ability-to-complete-long-tasks/</loc>
<lastmod>2025-03-19T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2025-06-05-recent-reward-hacking/</loc>
<lastmod>2025-06-05T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2025-06-27-risk-transparency/</loc>
<lastmod>2025-06-27T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2025-07-10-early-2025-ai-experienced-os-dev-study/</loc>
<lastmod>2025-07-10T05:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2025-07-14-how-does-time-horizon-vary-across-domains/</loc>
<lastmod>2025-07-14T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2025-08-08-cot-may-be-highly-informative-despite-unfaithfulness/</loc>
<lastmod>2025-08-08T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2025-08-11-science-comms-at-metr/</loc>
<lastmod>2025-08-12T05:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2025-08-12-research-update-towards-reconciling-slowdown-with-time-horizons/</loc>
<lastmod>2025-08-13T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2025-08-20-forecasting-impacts-of-ai-acceleration/</loc>
<lastmod>2025-08-20T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/notes/2025-08-22-claude-gpt-gemini-struggle-evade-monitors/</loc>
<lastmod>2025-08-22T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/notes/2025-10-06-early-results-on-monitorability-in-qa-settings/</loc>
<lastmod>2025-10-06T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2025-10-14-malt-dataset-of-natural-and-prompted-behaviors/</loc>
<lastmod>2025-10-14T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2025-10-23-gpt-oss-methodology-review/</loc>
<lastmod>2025-10-23T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2025-10-28-sabotage-report-review/</loc>
<lastmod>2025-10-28T02:47:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2025-12-09-common-elements-of-frontier-ai-safety-policies/</loc>
<lastmod>2025-12-09T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2026-01-19-early-work-on-monitorability-evaluations/</loc>
<lastmod>2026-01-22T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/notes/2026-01-22-time-horizon-limitations/</loc>
<lastmod>2026-01-22T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2026-1-29-time-horizon-1-1/</loc>
<lastmod>2026-01-29T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/notes/2026-01-29-frontier-ai-safety-regulations/</loc>
<lastmod>2026-01-29T14:12:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/notes/2026-02-10-simpler-ai-timelines-model/</loc>
<lastmod>2026-02-10T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/notes/2026-02-13-measuring-time-horizon-using-claude-code-and-codex/</loc>
<lastmod>2026-02-13T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/notes/2026-02-17-exploratory-transcript-analysis-for-estimating-time-savings-from-coding-agents/</loc>
<lastmod>2026-02-17T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2026-02-17-how-we-protect-confidential-information/</loc>
<lastmod>2026-02-17T16:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2026-02-19-five-lessons-from-ai-biology-rct/</loc>
<lastmod>2026-02-19T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2026-02-24-uplift-update/</loc>
<lastmod>2026-02-24T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/notes/2026-03-03-balatro-sts-cli/</loc>
<lastmod>2026-03-03T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/notes/2026-03-10-many-swe-bench-passing-prs-would-not-be-merged-into-main/</loc>
<lastmod>2026-03-10T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2026-03-12-sabotage-risk-report-opus-4-6-review/</loc>
<lastmod>2026-03-12T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/notes/2026-03-19-org-uplift-game/</loc>
<lastmod>2026-03-19T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/notes/2026-03-20-impact-of-modelling-assumptions-on-time-horizon-results/</loc>
<lastmod>2026-03-20T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/blog/2026-03-25-red-teaming-anthropic-agent-monitoring/</loc>
<lastmod>2026-03-26T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/beth-barnes/</loc>
<lastmod>2018-12-19T19:44:30-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/hjalmar-wijk/</loc>
<lastmod>2018-12-19T19:44:30-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/lawrence-chan/</loc>
<lastmod>2018-12-19T19:44:30-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/megan-kinniment/</loc>
<lastmod>2018-12-19T19:44:30-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/rae-she/</loc>
<lastmod>2018-12-19T19:44:30-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/chris-painter/</loc>
<lastmod>2023-07-23T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/kris-chari/</loc>
<lastmod>2023-07-23T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/lucas-sato/</loc>
<lastmod>2023-07-23T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/thomas-broadley/</loc>
<lastmod>2023-07-23T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/adam-gleave/</loc>
<lastmod>2023-09-24T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/yoshua-bengio/</loc>
<lastmod>2023-09-24T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/kit-harris/</loc>
<lastmod>2024-07-04T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/michael-chen/</loc>
<lastmod>2024-07-30T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/david-rein/</loc>
<lastmod>2024-08-11T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/nikola-jurkovic/</loc>
<lastmod>2024-08-11T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/neev-parikh/</loc>
<lastmod>2024-09-15T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/sydney-von-arx/</loc>
<lastmod>2024-10-06T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/rajiv-dattani/</loc>
<lastmod>2024-10-30T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/nate-rush/</loc>
<lastmod>2024-12-02T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/charles-foster/</loc>
<lastmod>2025-04-10T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/luca-righetti/</loc>
<lastmod>2025-04-22T20:00:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/marco-mascorro/</loc>
<lastmod>2025-05-07T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/alec-radford/</loc>
<lastmod>2025-05-11T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/joel-becker/</loc>
<lastmod>2025-05-15T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/bhaskar-chaturvedi/</loc>
<lastmod>2025-06-02T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/jasmine-dhaliwal/</loc>
<lastmod>2025-06-02T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/jingyi-wang/</loc>
<lastmod>2025-07-22T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/thomas-kwa/</loc>
<lastmod>2025-07-22T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/mischa-spiegelmock/</loc>
<lastmod>2025-08-24T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/khalid-mahamud/</loc>
<lastmod>2025-10-08T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/paarth-shah/</loc>
<lastmod>2025-10-08T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/rasmus-faber-espensen/</loc>
<lastmod>2025-10-26T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/vincent-cheng/</loc>
<lastmod>2025-10-31T20:44:30-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/daniel-filan/</loc>
<lastmod>2025-12-15T19:44:30-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/ajeya-cotra/</loc>
<lastmod>2026-01-15T19:00:30-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/wilder-seitz/</loc>
<lastmod>2026-02-18T19:44:30-08:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/parker-whitfill/</loc>
<lastmod>2026-03-10T14:48:39-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/alexander-barry/</loc>
<lastmod>2026-03-13T17:00:00-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/tom-cunningham/</loc>
<lastmod>2026-03-19T16:24:24-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/team/manish-shetty/</loc>
<lastmod>2026-03-20T11:23:44-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/CoT_chart_embed.html</loc>
</url>
<url>
<loc>https://metr.org/about</loc>
</url>
<url>
<loc>https://metr.org/bounty</loc>
</url>
<url>
<loc>https://metr.org/careers</loc>
</url>
<url>
<loc>https://metr.org/contact</loc>
</url>
<url>
<loc>https://metr.org/donate</loc>
</url>
<url>
<loc>https://metr.org/fsp</loc>
</url>
<url>
<loc>https://metr.org/hiring</loc>
</url>
<url>
<loc>https://metr.org/</loc>
</url>
<url>
<loc>https://metr.org/horizon-chart-embed</loc>
</url>
<url>
<loc>https://metr.org/blog/</loc>
</url>
<url>
<loc>https://metr.org/language-model-pilot-report/</loc>
</url>
<url>
<loc>https://metr.org/measuring-autonomous-ai-capabilities/</loc>
</url>
<url>
<loc>https://metr.org/notes/</loc>
</url>
<url>
<loc>https://metr.org/research/</loc>
</url>
<url>
<loc>https://metr.org/rsp-key-components/</loc>
</url>
<url>
<loc>https://metr.org/search</loc>
</url>
<url>
<loc>https://metr.org/subscribe</loc>
</url>
<url>
<loc>https://metr.org/tasks</loc>
</url>
<url>
<loc>https://metr.org/taskstandard</loc>
</url>
<url>
<loc>https://metr.org/time-horizons/</loc>
</url>
<url>
<loc>https://metr.org/2024-10-11-response-to-bureau-of-industry-and-security-proposed-reporting-requirements.pdf</loc>
<lastmod>2026-04-03T14:06:23-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/AI_R_D_Evaluation_Report.pdf</loc>
<lastmod>2026-04-03T14:06:23-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/ARC-NTIA-comment.pdf</loc>
<lastmod>2026-04-03T14:06:23-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/AR_report.pdf</loc>
<lastmod>2026-04-03T14:06:23-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/Early_2025_AI_Experienced_OS_Devs_Study-paper.pdf</loc>
<lastmod>2026-04-03T14:06:23-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/Evaluating_LMAs_Realistic_Tasks.pdf</loc>
<lastmod>2026-04-03T14:06:23-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/METR_ai_action_plan_comment.pdf</loc>
<lastmod>2026-04-03T14:06:23-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/agi.pdf</loc>
<lastmod>2026-04-03T14:06:23-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/assets/2025-SOC-2-Type-1-Report.pdf</loc>
<lastmod>2026-04-03T14:06:23-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/assets/2025_pilot_risk_report_metr_review.pdf</loc>
<lastmod>2026-04-03T14:06:23-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/assets/common-elements-mar-2025.pdf</loc>
<lastmod>2026-04-03T14:06:23-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/assets/common-elements-nov-2024.pdf</loc>
<lastmod>2026-04-03T14:06:23-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/assets/common_elements_of_frontier_ai_safety_policies.pdf</loc>
<lastmod>2026-04-03T14:06:23-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/assets/sabotage-risk-report-opus-4-6-review-feb-2026.pdf</loc>
<lastmod>2026-04-03T14:06:24-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/assets/sabotage-risk-report-opus-4-6-review-mar-2026.pdf</loc>
<lastmod>2026-04-03T14:06:24-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/common-elements.pdf</loc>
<lastmod>2026-04-03T14:06:24-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/february-2026-progress-report.pdf</loc>
<lastmod>2026-04-03T14:06:24-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/frontier-ai-regulations.pdf</loc>
<lastmod>2026-04-03T14:06:24-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/hcast.pdf</loc>
<lastmod>2026-04-03T14:06:24-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/pre-frontier-safety-framework.pdf</loc>
<lastmod>2026-04-03T14:06:24-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/risk-transparency-paper.pdf</loc>
<lastmod>2026-04-03T14:06:24-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/safety-security-framework-april-2025.pdf</loc>
<lastmod>2026-04-03T14:06:24-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/safety-security-framework-aug-2025.pdf</loc>
<lastmod>2026-04-03T14:06:24-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/safety-security-framework-diff-nov-2025.pdf</loc>
<lastmod>2026-04-03T14:06:24-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/safety-security-framework-fr.pdf</loc>
<lastmod>2026-04-03T14:06:24-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/safety-security-framework-zh.pdf</loc>
<lastmod>2026-04-03T14:06:24-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/safety-security-framework.pdf</loc>
<lastmod>2026-04-03T14:06:24-07:00</lastmod>
</url>
<url>
<loc>https://metr.org/taskrabbit.pdf</loc>
<lastmod>2026-04-03T14:06:24-07:00</lastmod>
</url>
</urlset>
