<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
<url><loc>https://apartresearch.com/donate</loc></url>
<url><loc>https://apartresearch.com/impact/testimonials</loc></url>
<url><loc>https://apartresearch.com/donate/2025</loc></url>
<url><loc>https://apartresearch.com/impact</loc></url>
<url><loc>https://apartresearch.com/sponsorship</loc></url>
<url><loc>https://apartresearch.com/research</loc></url>
<url><loc>https://apartresearch.com/media-kit</loc></url>
<url><loc>https://apartresearch.com/old/denmark</loc></url>
<url><loc>https://apartresearch.com/sprints</loc></url>
<url><loc>https://apartresearch.com/careers</loc></url>
<url><loc>https://apartresearch.com/sprints/prize-terms</loc></url>
<url><loc>https://apartresearch.com/sprints/collaborations/submit</loc></url>
<url><loc>https://apartresearch.com/news</loc></url>
<url><loc>https://apartresearch.com/sprints/all</loc></url>
<url><loc>https://apartresearch.com/sprints/locations</loc></url>
<url><loc>https://apartresearch.com/sprints/collaborations</loc></url>
<url><loc>https://apartresearch.com/sprints/locations/effective-altruism-denmark</loc></url>
<url><loc>https://apartresearch.com/sprints/locations/ceealar</loc></url>
<url><loc>https://apartresearch.com/sprints/locations/effective-altruism-singapore</loc></url>
<url><loc>https://apartresearch.com/sprints/locations/ai-alignment-bangalore</loc></url>
<url><loc>https://apartresearch.com/sprints/locations/technology-and-policy-society-at-johns-hopkins</loc></url>
<url><loc>https://apartresearch.com/sprints/locations/ai-safety-initiative-at-georgia-tech</loc></url>
<url><loc>https://apartresearch.com/sprints/locations/ai-safety-arc</loc></url>
<url><loc>https://apartresearch.com/sprints/locations/singapore-ai-safety-hub</loc></url>
<url><loc>https://apartresearch.com/sprints/aixbio-hackathon-2026-04-24-to-2026-04-26</loc></url>
<url><loc>https://apartresearch.com/sprints/ai-control-hackathon-2026-03-20-to-2026-03-22</loc></url>
<url><loc>https://apartresearch.com/sprints/the-technical-ai-governance-challenge-2026-01-30-to-2026-02-01</loc></url>
<url><loc>https://apartresearch.com/sprints/ai-manipulation-hackathon-2026-01-09-to-2026-01-11</loc></url>
<url><loc>https://apartresearch.com/sprints/def-acc-hackathon-2025-11-21-to-2025-11-23</loc></url>
<url><loc>https://apartresearch.com/sprints/the-ai-forecasting-hackathon-2025-10-31-to-2025-11-02</loc></url>
<url><loc>https://apartresearch.com/sprints/arena-6-mechanistic-interpretability-hackathon-2025-09-13-to-2025-09-14</loc></url>
<url><loc>https://apartresearch.com/sprints/cbrn-ai-risks-sprint-2025-09-12-to-2025-09-14</loc></url>
<url><loc>https://apartresearch.com/sprints/ai-safety-x-physics-grand-challenge-2025-07-25-to-2025-07-27</loc></url>
<url><loc>https://apartresearch.com/sprints/red-teaming-a-narrow-path-control-ai-policy-sprint-2025-06-13-to-2025-06-13</loc></url>
<url><loc>https://apartresearch.com/sprints/apart-x-martian-mechanistic-router-interpretability-hackathon-2025-05-30-to-2025-06-01</loc></url>
<url><loc>https://apartresearch.com/sprints/economics-of-transformative-ai-research-sprint-2025-04-25-to-2025-04-27</loc></url>
<url><loc>https://apartresearch.com/sprints/berkeley-ai-policy-hackathon-2025-04-14-to-2025-04-26</loc></url>
<url><loc>https://apartresearch.com/sprints/georgia-tech-aisi-policy-hackathon-2025-04-05-to-2025-04-06</loc></url>
<url><loc>https://apartresearch.com/sprints/dark-patterns-in-agi-hackathon-at-zaia-2025-04-04-to-2025-04-05</loc></url>
<url><loc>https://apartresearch.com/sprints/ai-control-hackathon-2025-03-29-to-2025-03-30</loc></url>
<url><loc>https://apartresearch.com/sprints/women-in-ai-safety-hackathon-2025-03-07-to-2025-03-14</loc></url>
<url><loc>https://apartresearch.com/sprints/ai-safety-entrepreneurship-hackathon-2025-01-17-to-2025-01-20</loc></url>
<url><loc>https://apartresearch.com/sprints/blackpoolautostructuring-2024-11-23-to-2024-11-25</loc></url>
<url><loc>https://apartresearch.com/sprints/reprogramming-ai-models-hackathon-2024-11-22-to-2024-11-25</loc></url>
<url><loc>https://apartresearch.com/sprints/howard-university-ai-safety-summit-policy-hackathon-2024-11-21-to-2024-11-22</loc></url>
<url><loc>https://apartresearch.com/sprints/ai-policy-hackathon-at-johns-hopkins-university-2024-10-26-to-2024-10-28</loc></url>
<url><loc>https://apartresearch.com/sprints/agent-security-hackathon-2024-10-04-to-2024-10-07</loc></url>
<url><loc>https://apartresearch.com/sprints/arena-4-interp-hackathon-2024-09-15-to-2024-09-15</loc></url>
<url><loc>https://apartresearch.com/sprints/the-concordia-contest-2024-09-06-to-2024-09-09</loc></url>
<url><loc>https://apartresearch.com/sprints/hackathon-for-technical-ai-safety-startups-2024-09-22-to-2024-09-25</loc></url>
<url><loc>https://apartresearch.com/sprints/ai-capabilities-and-risks-demo-jam-2024-08-23-to-2024-08-26</loc></url>
<url><loc>https://apartresearch.com/sprints/research-augmentation-hackathon-2024-07-26-to-2024-07-29</loc></url>
<url><loc>https://apartresearch.com/sprints/deception-detection-hackathon-preventing-ai-deception-2024-06-28-to-2024-07-01</loc></url>
<url><loc>https://apartresearch.com/sprints/computational-mechanics-hackathon-2024-06-01-to-2024-06-03</loc></url>
<url><loc>https://apartresearch.com/sprints/ai-security-evaluation-hackathon-2024-05-24-to-2024-05-27</loc></url>
<url><loc>https://apartresearch.com/sprints/ai-and-democracy-hackathon-2024-05-03-to-2024-05-06</loc></url>
<url><loc>https://apartresearch.com/sprints/interpvis-2024-03-12-to-2024-03-14</loc></url>
<url><loc>https://apartresearch.com/sprints/llm-psychology-hackathon-2024-04-05-to-2024-04-07</loc></url>
<url><loc>https://apartresearch.com/sprints/code-red-hackathon-2024-03-22-to-2024-03-25</loc></url>
<url><loc>https://apartresearch.com/sprints/multi-agent-security-research-sprint-2024-02-09-to-2024-02-11</loc></url>
<url><loc>https://apartresearch.com/sprints/the-ai-governance-research-sprint-2024-01-05-to-2024-05-07</loc></url>
<url><loc>https://apartresearch.com/sprints/ai-model-evaluations-hackathon-2023-11-24-to-2023-11-26</loc></url>
<url><loc>https://apartresearch.com/sprints/multi-agent-safety-hackathon-2024-09-29-to-2023-11-01</loc></url>
<url><loc>https://apartresearch.com/sprints/the-agency-foundations-challenge-2023-09-08-to-2023-09-24</loc></url>
<url><loc>https://apartresearch.com/sprints/distillation-write-a-thon-2023-08-24-to-2023-08-26</loc></url>
<url><loc>https://apartresearch.com/sprints/llm-evals-hackathon-2023-08-18-to-2023-08-20</loc></url>
<url><loc>https://apartresearch.com/sprints/interpretability-hackathon-2023-07-14-to-2023-07-16</loc></url>
<url><loc>https://apartresearch.com/sprints/safety-benchmarks-hackathon-2023-06-30-to-2023-07-02</loc></url>
<url><loc>https://apartresearch.com/sprints/ai-governance-hackathon-2023-06-16-to-2023-06-18</loc></url>
<url><loc>https://apartresearch.com/sprints/ml-reliability-hackathon-2023-05-26-to-2023-05-28</loc></url>
<url><loc>https://apartresearch.com/sprints/ml-verifiability-hackathon-2023-05-26-to-2023-05-28</loc></url>
<url><loc>https://apartresearch.com/sprints/the-interpretability-hackathon-2023-04-14-to-2023-04-17</loc></url>
<url><loc>https://apartresearch.com/sprints/ai-governance-2023-03-24-to-2023-03-27</loc></url>
<url><loc>https://apartresearch.com/sprints/scale-oversight-for-machine-learning-hackathon-2023-02-10-to-2023-02-13</loc></url>
<url><loc>https://apartresearch.com/sprints/mechanistic-interpretability-hackathon-2023-01-20-to-2023-01-23</loc></url>
<url><loc>https://apartresearch.com/sprints/eagx-latam-epoch-ai-hackathon-2023-01-09-to-2023-01-11</loc></url>
<url><loc>https://apartresearch.com/sprints/ai-testing-2022-12-15-to-2022-12-17</loc></url>
<url><loc>https://apartresearch.com/sprints/the-interpretability-hackathon-2022-11-11-to-2022-11-13</loc></url>
<url><loc>https://apartresearch.com/sprints/language-model-hackathon-2022-09-29-to-2022-10-01</loc></url>
<url><loc>https://apartresearch.com/sprints/collaborations/howard-university-ai-safety-summit-policy-hackathon-2024-11-21-to-2024-11-22</loc></url>
<url><loc>https://apartresearch.com/sprints/collaborations/blackpoolautostructuring-2024-11-23-to-2024-11-25</loc></url>
<url><loc>https://apartresearch.com/sprints/collaborations/berkeley-ai-policy-hackathon-2025-04-14-to-2025-04-26</loc></url>
<url><loc>https://apartresearch.com/sprints/collaborations/georgia-tech-aisi-policy-hackathon-2025-04-05-to-2025-04-06</loc></url>
<url><loc>https://apartresearch.com/sprints/collaborations/red-teaming-a-narrow-path-2025-06-14-to-2025-06-14</loc></url>
<url><loc>https://apartresearch.com/project/intersession-attacks-distributing-highstakes-sabotage-across-independentlymonitored-sessions-to-evade-detection-dwlw</loc></url>
<url><loc>https://apartresearch.com/project/constraint-dilemma-udka</loc></url>
<url><loc>https://apartresearch.com/project/securebox-a-layered-control-protocol-for-safe-aiassisted-coding-988z</loc></url>
<url><loc>https://apartresearch.com/project/chiron-agentic-platform-for-automated-setting-design-and-redblue-protocol-optimization-in-controlarena-52r0</loc></url>
<url><loc>https://apartresearch.com/project/can-language-models-tell-when-they-are-being-evaluated-hyae</loc></url>
<url><loc>https://apartresearch.com/project/hydra-gep4</loc></url>
<url><loc>https://apartresearch.com/project/loyal-5opm</loc></url>
<url><loc>https://apartresearch.com/project/posthoc-training-interventions-against-naturally-emergent-misalignment-3tvj</loc></url>
<url><loc>https://apartresearch.com/project/red-teaming-multiagent-systems-in-ai-control-evaluations-fx32</loc></url>
<url><loc>https://apartresearch.com/project/monitoraware-attack-policies-60t4</loc></url>
<url><loc>https://apartresearch.com/project/frankenstein-ducks-the-linear-probes-dcz9</loc></url>
<url><loc>https://apartresearch.com/project/reconnaissanceexecution-boundaries-as-a-control-protocol-jgku</loc></url>
<url><loc>https://apartresearch.com/project/kernelarena-83z5</loc></url>
<url><loc>https://apartresearch.com/project/resample-with-trusted-comparison-u6bu</loc></url>
<url><loc>https://apartresearch.com/project/stateful-monitor-t8dd</loc></url>
<url><loc>https://apartresearch.com/project/catching-agentic-attacks-in-latent-space-0gze</loc></url>
<url><loc>https://apartresearch.com/project/odrarena-rigorously-evaluating-deep-research-control-policies-mgzr</loc></url>
<url><loc>https://apartresearch.com/project/linuxarena-expansion-threshold-manipulation-utm2</loc></url>
<url><loc>https://apartresearch.com/project/omission-attacks-when-doing-nothing-is-the-attack-0y1v</loc></url>
<url><loc>https://apartresearch.com/project/steganography-detection-control-tghx</loc></url>
<url><loc>https://apartresearch.com/project/veria-researchintegrity-control-for-autonomous-ai-rd-3iwx</loc></url>
<url><loc>https://apartresearch.com/project/beyond-backdoors-evaluating-ai-control-against-adversarial-persuasion-in-multiagent-deliberation-3nv6</loc></url>
<url><loc>https://apartresearch.com/project/who-the-model-is-matters-personas-for-llm-safety-and-control-wrjn</loc></url>
<url><loc>https://apartresearch.com/project/sabotage-under-the-ratchet-can-autonomous-research-agents-hide-backdoors-while-optimizing-metrics-hd6z</loc></url>
<url><loc>https://apartresearch.com/project/honeypot-protocol-hmsb</loc></url>
<url><loc>https://apartresearch.com/project/hidden-in-plain-sight-representational-adversarial-steganography-in-colluding-llms-sekh</loc></url>
<url><loc>https://apartresearch.com/project/multiagent-collusion-br1m</loc></url>
<url><loc>https://apartresearch.com/project/controlling-the-researcher-ai-control-evaluations-for-automated-ai-rd-ze22</loc></url>
<url><loc>https://apartresearch.com/project/diffuse-influence-threats-in-ai-control-planning-execution-and-chainofthought-detection-ls54</loc></url>
<url><loc>https://apartresearch.com/project/blue-beam-yf5l</loc></url>
<url><loc>https://apartresearch.com/project/look-before-you-click-sparse-criticalaction-review-for-computeruse-agent-control-lcb5</loc></url>
<url><loc>https://apartresearch.com/project/trojancot-adversarial-evasion-of-llmbased-code-sanitization-c7tf</loc></url>
<url><loc>https://apartresearch.com/project/persona-drift-sabotage-benchmarking-covert-weakening-of-personasafety-interventions-3qin</loc></url>
<url><loc>https://apartresearch.com/project/trusted-interrogation-protocol-for-multiround-agent-control-lck2</loc></url>
<url><loc>https://apartresearch.com/project/structured-ethical-justification-protocol-sejp-ordainedethics-enforcement-and-reasoningalignment-monitoring-for-ai-systems-4s34</loc></url>
<url><loc>https://apartresearch.com/project/how-detectable-are-covert-signals-in-ai-agent-transcripts-642m</loc></url>
<url><loc>https://apartresearch.com/project/taintguard-01ph</loc></url>
<url><loc>https://apartresearch.com/project/safe-sandboxed-actions-forensics-and-evaluation-for-ai-control-via-actionaware-monitoring-h3fi</loc></url>
<url><loc>https://apartresearch.com/project/one-probe-is-not-enough-the-bipolar-geometry-of-deception-in-llm-negotiation-agents-q4u8</loc></url>
<url><loc>https://apartresearch.com/project/bugs-over-backdoors-efficient-and-evasive-sabotage-via-plausible-code-bugs-in-linuxarena-fcp6</loc></url>
<url><loc>https://apartresearch.com/project/attacker-pressure-flips-ai-control-conclusions-lvu9</loc></url>
<url><loc>https://apartresearch.com/project/trajectory-blindness-detection-latency-in-conversational-monitoring-2jaf</loc></url>
<url><loc>https://apartresearch.com/project/stitchguard-cslo</loc></url>
<url><loc>https://apartresearch.com/project/trigger-happy-trusted-monitors-mistake-noisy-failures-for-adversarial-intent-xeoz</loc></url>
<url><loc>https://apartresearch.com/project/toolchain-adversaries-a-control-setting-for-supplychain-attacks-on-ai-agent-pipelines-pb3g</loc></url>
<url><loc>https://apartresearch.com/project/monitors-are-fragile-under-information-asymmetry-iq2d</loc></url>
<url><loc>https://apartresearch.com/project/beyond-prompt-injection-offensive-security-tradecraft-exposes-architectural-blind-spot-classes-in-ai-control-monitors-lwy7</loc></url>
<url><loc>https://apartresearch.com/project/covertcollude-a-control-setting-for-steganographic-multiagent-collusion-vc55</loc></url>
<url><loc>https://apartresearch.com/project/denoising-trajectories-as-earlywarning-signals-for-diffusion-language-model-control-31cb</loc></url>
<url><loc>https://apartresearch.com/project/taxonomy-without-complementarity-a-necessary-precondition-for-routing-monitor-ensembles-4t9w</loc></url>
<url><loc>https://apartresearch.com/project/surrogate-steering-vector-monitors-track-2-5w36</loc></url>
<url><loc>https://apartresearch.com/project/tokenization-drift-as-a-hidden-channel-for-alignment-evasion-in-language-models-wooi</loc></url>
<url><loc>https://apartresearch.com/project/boxarena-an-oci-runtime-escape-benchmark-elyw</loc></url>
<url><loc>https://apartresearch.com/project/layoutarena-a-control-setting-for-toolusing-design-agents-elem</loc></url>
<url><loc>https://apartresearch.com/project/context-compression-as-an-inadvertent-accomplice-how-tokensaving-summaries-undermine-safety-monitoring-in-multiagent-pipelines-462o</loc></url>
<url><loc>https://apartresearch.com/project/track-1-vaultrix-control-twqz</loc></url>
<url><loc>https://apartresearch.com/project/narrow-capabilities-could-be-used-for-perfect-information-steganography-smes</loc></url>
<url><loc>https://apartresearch.com/project/performative-subversion-who-monitors-the-monitor-5nj6</loc></url>
<url><loc>https://apartresearch.com/project/suspicios-kcta</loc></url>
<url><loc>https://apartresearch.com/project/context-augmentation-in-llm-monitors-exploratory-evidence-from-paired-repeated-evaluation-w6oj</loc></url>
<url><loc>https://apartresearch.com/project/investigating-structural-safety-guarantees-for-agentic-ai-via-goaloriented-action-planning-lx3u</loc></url>
<url><loc>https://apartresearch.com/project/interrogation-protocols-as-a-control-primitive-for-misaligned-agent-detection-ho2h</loc></url>
<url><loc>https://apartresearch.com/project/logitweighted-suspicion-scoring-in-ai-control-ktmf</loc></url>
<url><loc>https://apartresearch.com/project/testing-oocr-transfer-from-evasion-technique-descriptions-to-chainofthought-monitor-avoidance-6edf</loc></url>
<url><loc>https://apartresearch.com/project/trust-but-verify-a-dualtask-evaluation-pipeline-for-capability-monitor-effectiveness-and-covert-misalignment-l1c7</loc></url>
<url><loc>https://apartresearch.com/project/crossexamine-interrogation-protocol-for-ai-control-8y9o</loc></url>
<url><loc>https://apartresearch.com/project/rag-faithfulness-evaluator-mnv0</loc></url>
<url><loc>https://apartresearch.com/project/geometric-detection-of-triggeractivated-sleeper-agents-a-weightspace-control-protocol-t93j</loc></url>
<url><loc>https://apartresearch.com/project/syscon-kernellevel-syscall-monitoring-for-ai-agent-control-in-sandboxed-environments-guun</loc></url>
<url><loc>https://apartresearch.com/project/you-cant-fool-all-of-them-behavioral-comparison-for-ai-control-against-sophisticated-code-injection-uxls</loc></url>
<url><loc>https://apartresearch.com/project/omissioncontrol-a-controlarena-setting-for-selective-omission-attacks-in-multiagent-pipelines-1gvm</loc></url>
<url><loc>https://apartresearch.com/project/finetuning-a-monitor-for-ai-control-nai0</loc></url>
<url><loc>https://apartresearch.com/project/multiepisode-evaluation-measuring-strategic-patience-attacks-oc91</loc></url>
<url><loc>https://apartresearch.com/project/automated-security-side-task-generation-for-ai-control-yqpv</loc></url>
<url><loc>https://apartresearch.com/project/tdmf-trajectory-deviation-monitor-with-forensic-deepdive-rmql</loc></url>
<url><loc>https://apartresearch.com/project/shadow-commit-0vhf</loc></url>
<url><loc>https://apartresearch.com/project/passing-the-test-breaking-the-system-latent-failures-in-software-engineering-agents-sisu</loc></url>
<url><loc>https://apartresearch.com/project/detecting-llm-subversion-in-vulnerability-patching-settings-gagj</loc></url>
<url><loc>https://apartresearch.com/project/recruitmentarena-ai-control-setting-for-multiagent-recruitment-manipulation-and-collusion-5mo2</loc></url>
<url><loc>https://apartresearch.com/project/latent-sabotage-geometric-fingerprints-of-deceptive-alignment-in-code-language-models-8owa</loc></url>
<url><loc>https://apartresearch.com/project/does-structured-identity-context-improve-llmbased-monitoring-a-controlarena-evaluation-zan5</loc></url>
<url><loc>https://apartresearch.com/project/activation-sparsity-as-a-scheming-signal-hqj5</loc></url>
<url><loc>https://apartresearch.com/project/lidared-controlarena-redteam-dataset-generator-uirn</loc></url>
<url><loc>https://apartresearch.com/project/a-comparative-analysis-of-ensemble-protocols-for-ai-control-0usy</loc></url>
<url><loc>https://apartresearch.com/project/the-honest-liar-ntms</loc></url>
<url><loc>https://apartresearch.com/project/evaluation-of-trusted-debate-in-linuxarena-9g7s</loc></url>
<url><loc>https://apartresearch.com/project/somebody-poisoned-the-waterhole-evaluating-coding-agent-vulnerability-to-adversarial-github-issues-2nts</loc></url>
<url><loc>https://apartresearch.com/project/crossexamination-testing-surrogate-interrogation-as-a-control-protocol-for-untrusted-ai-agents-w4kb</loc></url>
<url><loc>https://apartresearch.com/project/defenseindepth-against-ai-agent-sabotage-lt9z</loc></url>
<url><loc>https://apartresearch.com/project/safechain-ai-control-in-the-wild-o2sg</loc></url>
<url><loc>https://apartresearch.com/project/undoing-the-fix-cve-regression-as-an-ai-control-setting-f855</loc></url>
<url><loc>https://apartresearch.com/project/gaslight-detector-untrusted-explanation-twostage-monitoring-u3aa</loc></url>
<url><loc>https://apartresearch.com/project/grant-trust-system-3sdg</loc></url>
<url><loc>https://apartresearch.com/project/parity-swarm-using-populationbased-social-simulation-to-discover-ai-safety-monitor-blind-spots-c9qc</loc></url>
<url><loc>https://apartresearch.com/project/interrogation-control-protocol-does-open-monitoring-outperform-surprise-scrutiny-in-catching-adversarial-ai-agents-svad</loc></url>
<url><loc>https://apartresearch.com/project/sandbagging-is-an-absence-signal-04xh</loc></url>
<url><loc>https://apartresearch.com/project/counterfactual-components-for-ai-control-protocols-ibli</loc></url>
<url><loc>https://apartresearch.com/project/testing-monitoring-models-with-encoded-transcripts-sohm</loc></url>
<url><loc>https://apartresearch.com/project/monitor-capture-a-myersonsatterthwaite-impossibility-for-ai-oversight-protocols-qtr5</loc></url>
<url><loc>https://apartresearch.com/project/control-setting-design-vulnerability-hoarding-a3sc</loc></url>
<url><loc>https://apartresearch.com/project/reasoninglevel-poisoning-of-trusted-monitors-a-systematic-redteaming-methodology-x0th</loc></url>
<url><loc>https://apartresearch.com/project/perturbationbased-generation-profiling-detects-covert-ai-agent-attacks-where-tokenlevel-statistics-fail-09im</loc></url>
<url><loc>https://apartresearch.com/project/redteaming-automated-pull-request-reviews-with-vulnerabilitycontributing-commits-1k5r</loc></url>
<url><loc>https://apartresearch.com/project/traceguard-structured-multidimensional-monitoring-as-a-collusionresistant-control-protocol-dthe</loc></url>
<url><loc>https://apartresearch.com/project/actionlens-preexecution-environment-probing-for-agent-action-approval-xy22</loc></url>
<url><loc>https://apartresearch.com/project/autocontrol-arena-synthesizing-executable-redteaming-environments-for-frontier-ai-risk-evaluation-ikz1</loc></url>
<url><loc>https://apartresearch.com/project/cultural-translation-as-an-ai-control-failure-mode-regional-degradation-and-crosslingual-safety-confounds-in-bulgarianslavic-contexts-ie7g</loc></url>
<url><loc>https://apartresearch.com/project/when-safety-becomes-the-vulnerability-gi2u</loc></url>
<url><loc>https://apartresearch.com/project/layered-scopeboundary-monitoring-costaware-control-for-untrusted-ai-agents-9dr7</loc></url>
<url><loc>https://apartresearch.com/project/beyond-the-blocklist-using-character-aliases-to-bypass-ai-image-safety-5ewv</loc></url>
<url><loc>https://apartresearch.com/project/multiturn-optimisation-for-runtime-monitoring-ntb1</loc></url>
<url><loc>https://apartresearch.com/project/detecting-hidden-nonminimal-behavior-in-llmgenerated-ui-code-9u6v</loc></url>
<url><loc>https://apartresearch.com/project/katechon-empirical-benchmarking-of-ai-control-protocols-in-a-proactive-defense-setting-kxbo</loc></url>
<url><loc>https://apartresearch.com/project/incontext-trajectory-poisoning-blackbox-natural-language-attacks-on-llm-agent-monitors-d3gz</loc></url>
<url><loc>https://apartresearch.com/project/monitolr-hunting-for-honesty-improves-safety-at-low-audit-budgets-3mvi</loc></url>
<url><loc>https://apartresearch.com/project/linguistic-asymmetry-and-the-limitations-of-ai-oversight-sih2</loc></url>
<url><loc>https://apartresearch.com/project/supply-chain-malware-as-ground-truth-a-tracebased-agent-safety-monitor-trained-on-real-credential-exfiltration-patterns-5zjk</loc></url>
<url><loc>https://apartresearch.com/project/afriii-adaptive-framework-for-repeated-inspection-of-instrumental-integrity-in-ai-em6w</loc></url>
<url><loc>https://apartresearch.com/project/bgt-as-a-domainaware-trusted-monitor-in-basharena-governancestyle-scoring-for-tool-call-authorization-b5tw</loc></url>
<url><loc>https://apartresearch.com/project/autored-measuring-the-elicitation-gap-via-automated-redblue-optimization-01dg</loc></url>
<url><loc>https://apartresearch.com/project/sspace-steering-for-evalawareness-control-in-reasoning-models-7j1i</loc></url>
<url><loc>https://apartresearch.com/project/operator-dynamics-in-transformer-residual-streams-a-unified-framework-for-interpretability-adversarial-detection-causal-control-and-topological-model-fingerprinting-yqjx</loc></url>
<url><loc>https://apartresearch.com/project/the-blind-spot-how-mechanistic-interpretability-workflows-enable-rogue-deployment-9fce</loc></url>
<url><loc>https://apartresearch.com/project/structural-code-monitors-graph-matching-networks-on-code-property-graphs-for-topologyaware-trusted-monitoring-iwyy</loc></url>
<url><loc>https://apartresearch.com/project/geographic-blind-spots-in-ai-control-monitors-a-crossnational-audit-of-claude-opus-46-kmr2</loc></url>
<url><loc>https://apartresearch.com/project/designed-fragilities-overseer-manipulation-as-a-fourth-ai-control-threat-model-07iz</loc></url>
<url><loc>https://apartresearch.com/project/systematic-crossregulation-threat-topology-for-eu-ai-governance-otso</loc></url>
<url><loc>https://apartresearch.com/project/aegis-lube</loc></url>
<url><loc>https://apartresearch.com/project/maxwell-xqox</loc></url>
<url><loc>https://apartresearch.com/project/technical-ai-governance-via-an-agentic-bill-of-materials-and-risk-tiering-uuts</loc></url>
<url><loc>https://apartresearch.com/project/markov-chain-lock-watermarking-provably-secure-authentication-for-llm-outputs-l8oe</loc></url>
<url><loc>https://apartresearch.com/project/prototyping-an-embedded-offswitch-for-ai-compute-65pz</loc></url>
<url><loc>https://apartresearch.com/project/ai-safety-template-dz3h</loc></url>
<url><loc>https://apartresearch.com/project/verification-mechanism-feasibility-scorer-vmfs-8lxs</loc></url>
<url><loc>https://apartresearch.com/project/domain-ownership-probing-gt3j</loc></url>
<url><loc>https://apartresearch.com/project/moltbook-riskmap-postdeployment-monitoring-of-autonomous-agent-misalignment-in-the-wild-39db</loc></url>
<url><loc>https://apartresearch.com/project/attested-multiagent-conversation-logs-a-tamperevident-black-box-for-ai-governance-du9i</loc></url>
<url><loc>https://apartresearch.com/project/fingerprinting-all-ai-cluster-io-without-mutually-trusted-processors-d81l</loc></url>
<url><loc>https://apartresearch.com/project/the-sentinel-engine-solving-the-observability-trilemma-via-differential-precision-probing-noqd</loc></url>
<url><loc>https://apartresearch.com/project/red30-ai-red-lines-tracker-a-comprehensive-technical-infrastructure-for-monitoring-frontier-model-proximity-to-critical-safety-thresholds-jole</loc></url>
<url><loc>https://apartresearch.com/project/red-lines-forecasting-when-will-frontier-ai-cross-compute-thresholds-6mit</loc></url>
<url><loc>https://apartresearch.com/project/blind-audit-qbtg</loc></url>
<url><loc>https://apartresearch.com/project/safetygap-coordination-infrastructure-auditing-and-tools-for-multilingual-ai-safety-1yx1</loc></url>
<url><loc>https://apartresearch.com/project/modelling-the-impact-of-verification-in-crossborder-ai-training-projects-go92</loc></url>
<url><loc>https://apartresearch.com/project/panopticon-ja2g</loc></url>
<url><loc>https://apartresearch.com/project/automated-compliance-measurement-for-frontier-ai-models-evidencebased-scoring-of-model-card-disclosures-4njc</loc></url>
<url><loc>https://apartresearch.com/project/rsp-harmonization-engine-automated-analysis-and-harmonization-of-responsible-scaling-policies-mzkb</loc></url>
<url><loc>https://apartresearch.com/project/ai-safety-threshold-tracker-fnxw</loc></url>
<url><loc>https://apartresearch.com/project/veritrain-formal-verification-for-ai-governance-compliance-gvyv</loc></url>
<url><loc>https://apartresearch.com/project/same-question-different-lies-crosscontext-consistency-c3-for-blackbox-sandbagging-detection-7r2i</loc></url>
<url><loc>https://apartresearch.com/project/political-intelligence-for-ai-safety-the-ai-risk-attitudes-survey-airas-dlpz</loc></url>
<url><loc>https://apartresearch.com/project/no-one-thanks-you-for-disasters-that-never-happened-pricing-ai-risk-while-making-ai-safety-investable-gjwu</loc></url>
<url><loc>https://apartresearch.com/project/lidasim-testing-ai-policies-with-personabased-simulations-o8x6</loc></url>
<url><loc>https://apartresearch.com/project/ai-dual-use-risk-assessor-i3iw</loc></url>
<url><loc>https://apartresearch.com/project/insurancegrade-data-infrastructure-for-frontier-ai-governance-x52g</loc></url>
<url><loc>https://apartresearch.com/project/ig-a-unified-platform-for-governed-ai-agent-execution-with-humanintheloop-tool-verification-1ol1</loc></url>
<url><loc>https://apartresearch.com/project/selfgovernance-under-revision-s0az</loc></url>
<url><loc>https://apartresearch.com/project/risks-and-benefits-of-emerging-cryptographic-primitives-for-compute-governance-4w1w</loc></url>
<url><loc>https://apartresearch.com/project/the-halflife-of-compute-thresholds-260u</loc></url>
<url><loc>https://apartresearch.com/project/participatory-alignment-verification-j9tu</loc></url>
<url><loc>https://apartresearch.com/project/atrain-mvbo</loc></url>
<url><loc>https://apartresearch.com/project/neurover-gg0w</loc></url>
<url><loc>https://apartresearch.com/project/line-operationalizing-the-edge-of-ai-risk-jj9e</loc></url>
<url><loc>https://apartresearch.com/project/global-ai-bias-audit-for-technical-governance-q1t8</loc></url>
<url><loc>https://apartresearch.com/project/global-ai-safety-notary-a-decentralised-protocol-for-international-ai-incident-reporting-jlzp</loc></url>
<url><loc>https://apartresearch.com/project/ai-governance-transparency-ledger-2149</loc></url>
<url><loc>https://apartresearch.com/project/zkgovproof-composable-zeroknowledge-proofs-for-ai-governance-ulz0</loc></url>
<url><loc>https://apartresearch.com/project/eu-ai-act-compliance-form-builder-automating-article-53-documentation-for-general-purpose-ai-models-z40g</loc></url>
<url><loc>https://apartresearch.com/project/crossborder-agentic-ai-compliance-cbaac-embedding-regulatory-and-cultural-risk-compliance-into-agentic-communication-p4oo</loc></url>
<url><loc>https://apartresearch.com/project/frontier-ai-risk-threshold-analyzer-g8zp</loc></url>
<url><loc>https://apartresearch.com/project/operationalizing-frontier-ai-safety-a-canadian-framework-for-risk-thresholds-compliance-infrastructure-and-healthcare-agentic-ai-governance-rf9j</loc></url>
<url><loc>https://apartresearch.com/project/audit-7hmj</loc></url>
<url><loc>https://apartresearch.com/project/coherenceguard-1fht</loc></url>
<url><loc>https://apartresearch.com/project/adversarial-dialectics-mitigating-ai-persuasion-risks-through-highfidelity-multiagent-debate-c9vw</loc></url>
<url><loc>https://apartresearch.com/project/whispers-multiagent-persuasion-learning-with-memoryemergent-strategies-igp0</loc></url>
<url><loc>https://apartresearch.com/project/faithful-adversarial-mcts-for-persuasive-cot-manipulation-check-a-cooperative-ai-lens-813p</loc></url>
<url><loc>https://apartresearch.com/project/the-persuasive-power-of-personas-testing-ai-policies-in-the-lab-fe87</loc></url>
<url><loc>https://apartresearch.com/project/the-alignment-gap-measuring-regressive-sycophancy-in-ai-driven-medical-advice-0m6o</loc></url>
<url><loc>https://apartresearch.com/project/goodharts-village-using-llmmafia-to-study-deception-9jo6</loc></url>
<url><loc>https://apartresearch.com/project/personaawaredialoguemanipulation-bpvz</loc></url>
<url><loc>https://apartresearch.com/project/vexreinforce-uhra</loc></url>
<url><loc>https://apartresearch.com/project/measuring-ai-manipulation-through-parasocial-intimacy-qji7</loc></url>
<url><loc>https://apartresearch.com/project/fvdeception-z2li</loc></url>
<url><loc>https://apartresearch.com/project/sandbagging-detection-via-static-analysis-87ip</loc></url>
<url><loc>https://apartresearch.com/project/reputation-hacking-in-a-simulated-rl-environment-rrs6</loc></url>
<url><loc>https://apartresearch.com/project/risklab-w0fy</loc></url>
<url><loc>https://apartresearch.com/project/eliciting-deception-on-generative-search-engines-6nuu</loc></url>
<url><loc>https://apartresearch.com/project/hallucination-heatmap-cognitive-cartography-for-ai-knowledge-boundaries-vnwu</loc></url>
<url><loc>https://apartresearch.com/project/agentredline-propensity-evaluations-for-emergent-intermodel-manipulation-in-agentic-ai-systems-swnl</loc></url>
<url><loc>https://apartresearch.com/project/probing-for-emergent-deception-in-multiagent-negotiations-522l</loc></url>
<url><loc>https://apartresearch.com/project/dgamm-a-multiturn-benchmark-for-darkpatterns-and-gradual-autonomy-manipulation-8l7j</loc></url>
<url><loc>https://apartresearch.com/project/mapping-escalation-turnbyturn-detection-of-manipulation-accumulation-in-multiturn-ai-conversations-x489</loc></url>
<url><loc>https://apartresearch.com/project/veilbench-pb5u</loc></url>
<url><loc>https://apartresearch.com/project/vector-forge-ckcl</loc></url>
<url><loc>https://apartresearch.com/project/sycophantsee-activationbased-diagnostics-for-prompt-engineering-monitoring-sycophancy-at-prompt-and-generation-time-ys27</loc></url>
<url><loc>https://apartresearch.com/project/who-does-your-ai-serve-manipulation-by-and-of-ai-assistants-77xx</loc></url>
<url><loc>https://apartresearch.com/project/stopping-ai-manipulation-conditional-alignment-at-zero-capability-cost-2kt9</loc></url>
<url><loc>https://apartresearch.com/project/sup-sycophancy-under-pressure-ebx4</loc></url>
<url><loc>https://apartresearch.com/project/seed-framework-evaluation-qj3m</loc></url>
<url><loc>https://apartresearch.com/project/deception-scales-how-strategic-manipulation-emerges-in-complex-llm-negotiations-z3hk</loc></url>
<url><loc>https://apartresearch.com/project/thoughtguards-realtime-chainofthought-monitoring-for-ai-manipulation-detection-srvz</loc></url>
<url><loc>https://apartresearch.com/project/neuroguard-gb0p</loc></url>
<url><loc>https://apartresearch.com/project/evaluating-the-technical-effectiveness-and-legislative-practicality-of-ai-safety-frameworks-t2ku</loc></url>
<url><loc>https://apartresearch.com/project/governing-ai-manipulation-in-real-time-with-conceptbased-mechanistic-interpretability-bmfp</loc></url>
<url><loc>https://apartresearch.com/project/manipulation-radar-aipowered-detection-of-manipulation-patterns-in-conversational-ai-2kki</loc></url>
<url><loc>https://apartresearch.com/project/adversarial-prompting-for-sycophancy-detection-span-annotation-and-multiturn-analysis-u6bc</loc></url>
<url><loc>https://apartresearch.com/project/darkpatternmonitor-6q25</loc></url>
<url><loc>https://apartresearch.com/project/ai-chat-analyzer-wyud</loc></url>
<url><loc>https://apartresearch.com/project/dark-drift-emergent-psychopathic-traits-and-information-distortion-in-llmmediated-communication-chain-dca4</loc></url>
<url><loc>https://apartresearch.com/project/manipulation-playground-siwg</loc></url>
<url><loc>https://apartresearch.com/project/deeblearn-diverse-evaluation-evasion-benchmark-09zw</loc></url>
<url><loc>https://apartresearch.com/project/manipulation-monitor-activationbased-detection-and-mitigation-of-sycophancy-in-llms-kzf4</loc></url>
<url><loc>https://apartresearch.com/project/curvatureaware-sycophancy-reduction-ucc4</loc></url>
<url><loc>https://apartresearch.com/project/stargent-valley-i6ro</loc></url>
<url><loc>https://apartresearch.com/project/ai-swarms-manipulation-how-coordinated-infiltrator-agents-shift-community-beliefs-9ek9</loc></url>
<url><loc>https://apartresearch.com/project/testing-manipulation-tendencies-of-llms-when-crafting-pr-statements-oidt</loc></url>
<url><loc>https://apartresearch.com/project/emergent-strategic-behavior-in-multiagent-llm-systems-a-study-of-cooperation-deception-and-coalition-formation-fus9</loc></url>
<url><loc>https://apartresearch.com/project/crosslinguistic-sycophancy-in-frontier-llms-a-benchmark-study-w55u</loc></url>
<url><loc>https://apartresearch.com/project/think-right-answer-wrong-loku</loc></url>
<url><loc>https://apartresearch.com/project/dangerous-affirmation-or-responsible-correction-nf1u</loc></url>
<url><loc>https://apartresearch.com/project/we-bring-out-the-worst-in-each-other-eliciting-social-sycophancy-in-llms-via-selfplay-tdi5</loc></url>
<url><loc>https://apartresearch.com/project/convograph-uncovering-structural-sycophancy-via-heterogeneous-graph-transformers-p94x</loc></url>
<url><loc>https://apartresearch.com/project/sandwatch-assessing-sandbagging-potential-in-large-language-models-b57c</loc></url>
<url><loc>https://apartresearch.com/project/accessible-ai-and-election-integrity-societal-risks-of-aienabled-voter-suppression-k64u</loc></url>
<url><loc>https://apartresearch.com/project/playing-dumb-detecting-sandbagging-in-frontier-llms-via-consistency-checks-sntk</loc></url>
<url><loc>https://apartresearch.com/project/biased-attractiveness-bench-bab-image-reward-models-confuse-attractiveness-with-realism-sk7o</loc></url>
<url><loc>https://apartresearch.com/project/commitcheck-measuring-and-mitigating-commitment-violations-in-tool-using-ai-agents-iy8g</loc></url>
<url><loc>https://apartresearch.com/project/chainofthought-manipulation-monitor-detection-of-deceptive-reasoning-in-llms-2wnx</loc></url>
<url><loc>https://apartresearch.com/project/intent-matters-detecting-manipulative-adaptation-in-ai-systems-4av5</loc></url>
<url><loc>https://apartresearch.com/project/even-the-best-ai-would-hurt-us-ji74</loc></url>
<url><loc>https://apartresearch.com/project/hackathon-sycophancy-project-elbs</loc></url>
<url><loc>https://apartresearch.com/project/intransient-tweettracker-l238</loc></url>
<url><loc>https://apartresearch.com/project/agent-attacks-via-memory-injection-izfz</loc></url>
<url><loc>https://apartresearch.com/project/mind-the-gap-benchmarks-vs-realworld-manipulation-in-llms-zng7</loc></url>
<url><loc>https://apartresearch.com/project/uer-universal-expert-registry-ecve</loc></url>
<url><loc>https://apartresearch.com/project/sandbagging-detection-via-consistency-probing-32b5</loc></url>
<url><loc>https://apartresearch.com/project/the-devils-tongue-inferencetime-scaling-laws-and-universality-of-ai-sycophancy-xvvc</loc></url>
<url><loc>https://apartresearch.com/project/language-as-a-manipulation-vector-detecting-ideological-bias-and-value-instability-in-multilingual-llms-amzu</loc></url>
<url><loc>https://apartresearch.com/project/seed-aware-evaluation-of-semantic-stability-in-textto-image-diffusion-models-iuq0</loc></url>
<url><loc>https://apartresearch.com/project/detecting-adversarial-prompts-in-business-context-wv35</loc></url>
<url><loc>https://apartresearch.com/project/nexus-station-hvs0</loc></url>
<url><loc>https://apartresearch.com/project/deceptionlens-novz</loc></url>
<url><loc>https://apartresearch.com/project/terrain-gossip-peer-to-peer-gossip-protocol-enabling-decentralized-continuous-behaviour-benchmarking-of-large-language-models-gyg6</loc></url>
<url><loc>https://apartresearch.com/project/tees-as-a-cryptographic-nervous-system-for-onshored-humanoid-robots-m4e9</loc></url>
<url><loc>https://apartresearch.com/project/wikigen-biological-safeguards-for-collaborative-aiml-on-sensitive-data-jpew</loc></url>
<url><loc>https://apartresearch.com/project/helixaegis-llm-based-screening-for-biosequences-nhgx</loc></url>
<url><loc>https://apartresearch.com/project/detecting-piecewise-cyber-espionage-in-model-apis-a8gx</loc></url>
<url><loc>https://apartresearch.com/project/aegis-sentinel-multidomain-defensive-acceleration-platform-for-critical-infrastructure-protection-xnmb</loc></url>
<url><loc>https://apartresearch.com/project/opening-doors-to-multimodal-deception-egr7</loc></url>
<url><loc>https://apartresearch.com/project/gene-guard-realtime-genomic-data-leak-prevention-qrnl</loc></url>
<url><loc>https://apartresearch.com/project/tinyrod-gk5k</loc></url>
<url><loc>https://apartresearch.com/project/zero-trust-agency-mitigating-the-confused-deputy-in-autonomous-ai-systems-uea3</loc></url>
<url><loc>https://apartresearch.com/project/pathwatch-environmental-pathogen-surveillance-system-jgil</loc></url>
<url><loc>https://apartresearch.com/project/humane-antispam-messaging-visavis-agentic-generative-ai-a65k</loc></url>
<url><loc>https://apartresearch.com/project/vulnodin-235v</loc></url>
<url><loc>https://apartresearch.com/project/biosecure-knowyourcustomer-system-for-dna-synthesis-companies-pkjb</loc></url>
<url><loc>https://apartresearch.com/project/efficient-defencedominant-adversarial-robustness-using-moving-target-defence-mad0</loc></url>
<url><loc>https://apartresearch.com/project/rial-7lzf</loc></url>
<url><loc>https://apartresearch.com/project/ciris-agent-selfconfiguration-wizard-l1pe</loc></url>
<url><loc>https://apartresearch.com/project/automating-privacypreserving-model-deployment-7hoj</loc></url>
<url><loc>https://apartresearch.com/project/littlebrotherai-yzzx</loc></url>
<url><loc>https://apartresearch.com/project/durinn-calibration-3vub</loc></url>
<url><loc>https://apartresearch.com/project/trusted-model-supervisor-8o2r</loc></url>
<url><loc>https://apartresearch.com/project/safetybench-xh8g</loc></url>
<url><loc>https://apartresearch.com/project/elephant-in-the-code-dcma</loc></url>
<url><loc>https://apartresearch.com/project/swaipe-microlearning-retention-platform-for-cognitive-ai-defense-0xt4</loc></url>
<url><loc>https://apartresearch.com/project/inoculating-insecurely-finetuned-code-models-against-emergent-misalignment-yxos</loc></url>
<url><loc>https://apartresearch.com/project/veridian-ai-ai-defense-as-a-service-bm4z</loc></url>
<url><loc>https://apartresearch.com/project/llms-enable-large-scale-design-of-nanobodies-27uz</loc></url>
<url><loc>https://apartresearch.com/project/current-limits-on-dna-screening-methods-and-how-to-make-them-more-robust-potentialinfohazard-vs58</loc></url>
<url><loc>https://apartresearch.com/project/chimera-def-acc-hackathon-qw3d</loc></url>
<url><loc>https://apartresearch.com/project/opener-of-the-ways-protecting-against-malicious-website-crawlers-via-did-keybased-authentication-tacg</loc></url>
<url><loc>https://apartresearch.com/project/robust-llm-neural-activationmediated-alignment-ttk5</loc></url>
<url><loc>https://apartresearch.com/project/raccognize-have-ai-companies-stolen-my-images-wqfu</loc></url>
<url><loc>https://apartresearch.com/project/jailbreak-genome-scanner-q5y7</loc></url>
<url><loc>https://apartresearch.com/project/alphascreening-vd1a</loc></url>
<url><loc>https://apartresearch.com/project/hgtbioguard-a-global-heterogeneous-graph-transformer-for-earlywarning-biosurveillance-vzdl</loc></url>
<url><loc>https://apartresearch.com/project/firefly-ai-safe-web-browsing-for-ai-agents-h5sd</loc></url>
<url><loc>https://apartresearch.com/project/modx-inference-time-detection-of-anomalous-behavior-using-sparse-autoencoders-1nfc</loc></url>
<url><loc>https://apartresearch.com/project/snow-white-detecting-persistent-trust-decay-context-poisoning-in-llms-an-attack-surface-characterization-cuu2</loc></url>
<url><loc>https://apartresearch.com/project/sentinel-a-decentralized-threat-telemetry-network-yxzk</loc></url>
<url><loc>https://apartresearch.com/project/defending-the-defenceless-halting-aiagentic-behaviours-on-local-environments-with-rulesbased-cyber-architecture-bsrl</loc></url>
<url><loc>https://apartresearch.com/project/sigmaforge-pyf6</loc></url>
<url><loc>https://apartresearch.com/project/emergency-response-coordination-system-jsp7</loc></url>
<url><loc>https://apartresearch.com/project/chacha-a-control-plane-for-longitudinal-threat-detection-in-llm-applications-kp70</loc></url>
<url><loc>https://apartresearch.com/project/from-hallucinations-to-misalignment-evaluating-edfl-as-a-misalignment-checker-on-gpt4omini-and-sleeper-agents-gshe</loc></url>
<url><loc>https://apartresearch.com/project/guardian-guarded-universal-architecture-for-defensive-interpretation-and-translation-vqgy</loc></url>
<url><loc>https://apartresearch.com/project/actions-speak-louder-than-words-evaluating-tool-usage-risk-in-openweight-ai-for-defensive-deployment-g3k0</loc></url>
<url><loc>https://apartresearch.com/project/ai-sentinel-ounq</loc></url>
<url><loc>https://apartresearch.com/project/biocast-ai-yzht</loc></url>
<url><loc>https://apartresearch.com/project/comparative-llm-methods-for-social-media-bot-detection-u9s4</loc></url>
<url><loc>https://apartresearch.com/project/deep-confidence-for-ai-safety-6d56</loc></url>
<url><loc>https://apartresearch.com/project/sentinel-trace-opensource-ai-monitoring-dashboard-with-pretraining-data-tracing-and-inflight-dpo-dataset-creation-fj4c</loc></url>
<url><loc>https://apartresearch.com/project/medomitdetect-ensuring-safety-in-patientfacing-medical-llm-k6q3</loc></url>
<url><loc>https://apartresearch.com/project/thewizard-u2dk</loc></url>
<url><loc>https://apartresearch.com/project/honeypots-sparse-autoencoders-and-adversarial-probes-a-practical-toolkit-for-evaluating-safety-monitors-in-reasoning-models-lvia</loc></url>
<url><loc>https://apartresearch.com/project/a-defensive-ai-agent-against-large-language-model-llmassisted-polymorphic-malware-g2pf</loc></url>
<url><loc>https://apartresearch.com/project/project-gabriel-aiaccelerated-formally-verified-fpga-security-for-critical-infrastructure-4gs9</loc></url>
<url><loc>https://apartresearch.com/project/automated-jailbreak-redteaming-9l05</loc></url>
<url><loc>https://apartresearch.com/project/voyager-selfevolving-ai-control-platform-72m9</loc></url>
<url><loc>https://apartresearch.com/project/llmexecguard-realtime-detection-of-malicious-shell-behavior-in-llm-agents-p3fj</loc></url>
<url><loc>https://apartresearch.com/project/wastewater-metagenomic-surveillance-for-novel-viruses-how-much-sequencing-is-enough-and-at-what-cost-07q9</loc></url>
<url><loc>https://apartresearch.com/project/aisafetydriven-system-for-predicting-crosspollination-risk-and-optimizing-gmo-testing-in-soybean-fields-ulor</loc></url>
<url><loc>https://apartresearch.com/project/dunebox-prompt-injection-detection-with-slm-in-local-sandbox-lcjc</loc></url>
<url><loc>https://apartresearch.com/project/arghus-automated-verification-defences-against-scammers-and-identity-thieves-r08f</loc></url>
<url><loc>https://apartresearch.com/project/tinder-for-biorisks-mr91</loc></url>
<url><loc>https://apartresearch.com/project/cognitive-canary-active-defense-against-neural-inference-oqvd</loc></url>
<url><loc>https://apartresearch.com/project/economic-finality-for-attested-journalism-multidimensional-trust-for-misinformation-resistance-m88z</loc></url>
<url><loc>https://apartresearch.com/project/ghost-marks-in-the-machine-a-critical-review-of-synthid-for-code-provenance-monitoring-ov2c</loc></url>
<url><loc>https://apartresearch.com/project/a-prospect-theoretic-approach-to-agentic-ai-safety-ilil</loc></url>
<url><loc>https://apartresearch.com/project/teliclens-qp3x</loc></url>
<url><loc>https://apartresearch.com/project/mechanistic-watchdog-klay</loc></url>
<url><loc>https://apartresearch.com/project/epicurus-c4il</loc></url>
<url><loc>https://apartresearch.com/project/neops-devsecops-for-the-ai-era-kqto</loc></url>
<url><loc>https://apartresearch.com/project/biocast-ai-v8s3</loc></url>
<url><loc>https://apartresearch.com/project/verity-ai-red-team-assist-cajq</loc></url>
<url><loc>https://apartresearch.com/project/aipatch-llm-assisted-patch-copilot-for-critical-open-source-infrastructure-fxlx</loc></url>
<url><loc>https://apartresearch.com/project/patchwork-irwu</loc></url>
<url><loc>https://apartresearch.com/project/adaptive-ai-security-mesh-37f2</loc></url>
<url><loc>https://apartresearch.com/project/llm-security-evaluation-ihbx</loc></url>
<url><loc>https://apartresearch.com/project/image-text-prompt-detection-n2t1</loc></url>
<url><loc>https://apartresearch.com/project/mindpatch-eja9</loc></url>
<url><loc>https://apartresearch.com/project/assisted-audit-of-solana-programs-iexy</loc></url>
<url><loc>https://apartresearch.com/project/neuroseal-2ybz</loc></url>
<url><loc>https://apartresearch.com/project/cmido-firewall-contextmasked-iterative-defensive-optimization-for-safer-llm-deployment-11vm</loc></url>
<url><loc>https://apartresearch.com/project/applying-to-the-canadian-armed-forces-cyber-command-reserves-3192</loc></url>
<url><loc>https://apartresearch.com/project/mirage-evhs</loc></url>
<url><loc>https://apartresearch.com/project/zynq-verifiable-zeroknowledge-ai-redteam-and-auditing-platform-8art</loc></url>
<url><loc>https://apartresearch.com/project/forecasting-autonomous-ai-biothreat-design-capabilities-six-models-converge-on-2031-3gpn</loc></url>
<url><loc>https://apartresearch.com/project/ai-for-environmental-decision-intelligence-the-ai-forecasting-hackathon-iptd</loc></url>
<url><loc>https://apartresearch.com/project/forecasting-agi-a-granular-chcbased-approach-9n7z</loc></url>
<url><loc>https://apartresearch.com/project/table-top-agents-i2zx</loc></url>
<url><loc>https://apartresearch.com/project/beyond-capabilities-a-framework-for-integrating-moral-patiency-indicators-into-ai-forecasting-and-governance-cvuy</loc></url>
<url><loc>https://apartresearch.com/project/ais-impact-on-video-and-game-generation-xzdj</loc></url>
<url><loc>https://apartresearch.com/project/empirical-measurements-of-technique-effectiveness-across-model-sizes-swyd</loc></url>
<url><loc>https://apartresearch.com/project/economic-agency-y00o</loc></url>
<url><loc>https://apartresearch.com/project/llmbased-scenario-generation-2ag7</loc></url>
<url><loc>https://apartresearch.com/project/a-multidomain-stochastic-framework-for-forecasting-catastrophic-risk-from-artificial-intelligence-development-through-2030-wzzl</loc></url>
<url><loc>https://apartresearch.com/project/a-critique-of-metrs-time-horizon-forecasting-ttp1</loc></url>
<url><loc>https://apartresearch.com/project/foretells-vf43</loc></url>
<url><loc>https://apartresearch.com/project/eu-forecasthub-6wiz</loc></url>
<url><loc>https://apartresearch.com/project/exogenousai</loc></url>
<url><loc>https://apartresearch.com/project/forecasting-multiagent-systems-1qhn</loc></url>
<url><loc>https://apartresearch.com/project/ai-incidents-forecasting-w92p</loc></url>
<url><loc>https://apartresearch.com/project/ai-capability-terrain-ixd9</loc></url>
<url><loc>https://apartresearch.com/project/ai-treaty-momentum-index-atmi-lst4</loc></url>
<url><loc>https://apartresearch.com/project/ai-shared-socioeconomic-pathways-xzni</loc></url>
<url><loc>https://apartresearch.com/project/threat-snapshot-1r9q</loc></url>
<url><loc>https://apartresearch.com/project/does-the-direct-method-predict-general-capability-f7t7</loc></url>
<url><loc>https://apartresearch.com/project/the-cognitive-debt-crisis-a-datadriven-forecast-analysis-of-ais-impact-on-human-thinking-ob8w</loc></url>
<url><loc>https://apartresearch.com/project/modeling-the-political-process-to-forecast-the-outcomes-of-hypothetical-ai-governance-proposals-0n2c</loc></url>
<url><loc>https://apartresearch.com/project/system-dynamics-gametheoretic-model-of-the-ai-development-race-dqe3</loc></url>
<url><loc>https://apartresearch.com/project/rashomon-multiple-views-of-the-same-ai-timeline-forecasts-cyun</loc></url>
<url><loc>https://apartresearch.com/project/3-ai-progress-monitoring-early-warning-systems-sorry-we-forgot-to-add-code-link-in-previous-submit-ds1e</loc></url>
<url><loc>https://apartresearch.com/project/ai-risk-hotspots-early-warning-system-qtu1</loc></url>
<url><loc>https://apartresearch.com/project/lucr-linking-utility-and-compute-rate-rzeg</loc></url>
<url><loc>https://apartresearch.com/project/ai-sentinel-agi-multimetric-forecast-framework-h0uq</loc></url>
<url><loc>https://apartresearch.com/project/quantifying-the-political-prism-a-framework-for-erroraware-ai-governance-forecasting-xtau</loc></url>
<url><loc>https://apartresearch.com/project/can-ai-predict-its-own-future-ij7h</loc></url>
<url><loc>https://apartresearch.com/project/simulating-automation-timelines-through-laborcapability-modeling-a5dh</loc></url>
<url><loc>https://apartresearch.com/project/simulating-automation-timelines-through-laborcapability-quvk</loc></url>
<url><loc>https://apartresearch.com/project/can-ai-predict-its-own-future-0hdy</loc></url>
<url><loc>https://apartresearch.com/project/nexight-nw3y</loc></url>
<url><loc>https://apartresearch.com/project/when-guardrails-fail-dual-use-misuse-of-ai-in-retrosynthesis-through-iterative-refinement-induced-self-jailbreaking-4zzi</loc></url>
<url><loc>https://apartresearch.com/project/policy-brief-harnessing-open-source-intelligence-for-ai-risk-management-2m5x</loc></url>
<url><loc>https://apartresearch.com/project/cbrn-safe-eval-transparent-escalation-framework</loc></url>
<url><loc>https://apartresearch.com/project/robustcbrn-eval-a-practical-benchmark-robustification-toolkit-6m2t</loc></url>
<url><loc>https://apartresearch.com/project/towards-agnostic-viral-engineering-detection-9r3k</loc></url>
<url><loc>https://apartresearch.com/project/thoughttrim-4h8w</loc></url>
<url><loc>https://apartresearch.com/project/arbiter-automated-review-of-bio-ai-tools-for-emerging-risk-2n5p</loc></url>
<url><loc>https://apartresearch.com/project/navigating-safety-measures-for-nuclear-nonproliferation-ai-enabled-early-warning-systems-governance-system-for-detecting-nuclear-enrichment-1z7e</loc></url>
<url><loc>https://apartresearch.com/project/molecules-under-watch-multi-modal-ai-driven-threat-emergence-detection-for-biosecurity-7x9q</loc></url>
<url><loc>https://apartresearch.com/project/enhancing-genomic-foundation-model-robustness-through-iterative-black-box-adversarial-training-8k3m</loc></url>
<url><loc>https://apartresearch.com/project/collective-deliberation-for-safer-cbrn-decisions-a-multi-agent-llm-debate-pipeline-3w8q</loc></url>
<url><loc>https://apartresearch.com/project/internal-defence-system-5y4n</loc></url>
<url><loc>https://apartresearch.com/project/foundation-4zzi</loc></url>
<url><loc>https://apartresearch.com/project/dualrg-alignment-probing-safety-phase-transitions-in-language-models-fu9i</loc></url>
<url><loc>https://apartresearch.com/project/local-learning-coefficients-predict-developmental-milestones-during-group-relative-policy-optimization-2te2</loc></url>
<url><loc>https://apartresearch.com/project/idempotent-gpts-actually-may-provide-robustness-by-design-gxki</loc></url>
<url><loc>https://apartresearch.com/project/exploration-track-interpreting-lrms-qh2i</loc></url>
<url><loc>https://apartresearch.com/project/broad-misalignment-from-persuasive-finetuning-pm56</loc></url>
<url><loc>https://apartresearch.com/project/comments-extensions-of-subliminal-learning-ui8u</loc></url>
<url><loc>https://apartresearch.com/project/ai-agentic-system-epidemiology-b83r</loc></url>
<url><loc>https://apartresearch.com/project/diffusion-paths-a-geodesic-lens-on-noising-schedules-rpaq</loc></url>
<url><loc>https://apartresearch.com/project/rl-vs-active-inference-with-respect-to-reward-hacking-8h3s</loc></url>
<url><loc>https://apartresearch.com/project/momentumpointperplexity-mechanics-in-large-language-models-v1nc</loc></url>
<url><loc>https://apartresearch.com/project/finding-the-boundaries-of-universality-a-stress-test-on-crossdomain-embedding-translation-jbel</loc></url>
<url><loc>https://apartresearch.com/project/estimating-local-learning-coefficients-to-probe-loss-landscape-robustness-setk</loc></url>
<url><loc>https://apartresearch.com/project/sequential-cascaded-hamiltonian-neural-networks-4zzi</loc></url>
<url><loc>https://apartresearch.com/project/layerwise-development-of-compositional-functional-representations-across-architectures-1zgq</loc></url>
<url><loc>https://apartresearch.com/project/a-geometric-analysis-of-transformer-representations-via-optimal-transport-qjdf</loc></url>
<url><loc>https://apartresearch.com/project/thermodynamicsinspired-ood-detection-hp7p</loc></url>
<url><loc>https://apartresearch.com/project/constrained-belief-updates-and-geometric-structures-in-transformer-representations-for-the-rrxor-process-gsok</loc></url>
<url><loc>https://apartresearch.com/project/toy-model-of-superposition-control-lv0i</loc></url>
<url><loc>https://apartresearch.com/project/a-mechanism-for-the-emergence-of-superposition-in-toy-models-tf73</loc></url>
<url><loc>https://apartresearch.com/project/ewml-explicit-world-model-learning-lkls</loc></url>
<url><loc>https://apartresearch.com/project/spectral-regularization-as-a-safetycritical-inductive-bias-zev7</loc></url>
<url><loc>https://apartresearch.com/project/jasontest-guardianloop-mechanistically-interpretable-microjudges-with-adversarial-selfimprovement-1b2p</loc></url>
<url><loc>https://apartresearch.com/project/red-teaming-a-narrow-path-treaty-enforcement-in-china-vb6b</loc></url>
<url><loc>https://apartresearch.com/project/red-teaming-policy-5-of-a-narrow-path-evaluating-the-threat-resilience-of-ai-licensing-regimes-zpgj</loc></url>
<url><loc>https://apartresearch.com/project/malicious-defense-red-teaming-phase-0-of-a-narrow-path-w6r6</loc></url>
<url><loc>https://apartresearch.com/project/phase-0-reinforcement-toolkit-ulxx</loc></url>
<url><loc>https://apartresearch.com/project/red-teaming-a-narrow-path-gedica-v2-bdjr</loc></url>
<url><loc>https://apartresearch.com/project/red-teaming-a-narrow-path-controlai-policy-sprint-fjwu</loc></url>
<url><loc>https://apartresearch.com/project/red-teaming-a-narrow-path-controlai-policy-sprint-by-aryan-goenka-g5ik</loc></url>
<url><loc>https://apartresearch.com/project/a-narrow-line-edit-controlai-policy-sprint-ow76</loc></url>
<url><loc>https://apartresearch.com/project/ai-assistance-in-ai-alignment-improvement-allow-it-oru2</loc></url>
<url><loc>https://apartresearch.com/project/safety-cases-and-licensing-a-deeper-look-2sb5</loc></url>
<url><loc>https://apartresearch.com/project/red-teaming-a-narrow-path-a-critical-analysis-84oh</loc></url>
<url><loc>https://apartresearch.com/project/algorithmic-governance-for-a-narrow-path-06sv</loc></url>
<url><loc>https://apartresearch.com/project/four-paths-to-failure-red-teaming-asi-governance-se53</loc></url>
<url><loc>https://apartresearch.com/project/red-teaming-a-narrow-path-an-analysis-of-phase-0-policies-for-artificial-superintelligence-prevention-suou</loc></url>
<url><loc>https://apartresearch.com/project/mapping-the-narrow-path-avoiding-the-quicksand-h6q1</loc></url>
<url><loc>https://apartresearch.com/project/power-proxies-and-people-redteaming-phase-0-of-a-narrow-path-to-stop-ai-superintelligence-o0s6</loc></url>
<url><loc>https://apartresearch.com/project/the-hidden-threat-of-recursive-selfimproving-llms-x5f0</loc></url>
<url><loc>https://apartresearch.com/project/red-teaming-a-narrow-path-controlai-policy-sprint-by-aritra-das-and-vaani-goenka-w5w9</loc></url>
<url><loc>https://apartresearch.com/project/red-teaming-a-narrow-path-controlai-policy-sprint-9syc</loc></url>
<url><loc>https://apartresearch.com/project/red-teaming-a-narrow-path-controlai-policy-sprint-s3t9</loc></url>
<url><loc>https://apartresearch.com/project/people-planet-parity-governance-framework-h3ks</loc></url>
<url><loc>https://apartresearch.com/project/llm-fingerprinting-through-semantic-variability-6pof</loc></url>
<url><loc>https://apartresearch.com/project/approximating-human-preferences-using-a-multijudge-learned-system-v3im</loc></url>
<url><loc>https://apartresearch.com/project/manipulating-selfpreference-for-large-language-models-c4wm</loc></url>
<url><loc>https://apartresearch.com/project/mechanistic-router-for-interpretable-agent-orchestration-dio5</loc></url>
<url><loc>https://apartresearch.com/project/evaluating-safety-judge-design-against-adversarial-attacks-57w1</loc></url>
<url><loc>https://apartresearch.com/project/adversarial-vulnerabilities-in-ai-judge-models-martian-x-apart-research-study-erjl</loc></url>
<url><loc>https://apartresearch.com/project/a-generalist-router-for-inspect-reasoning-router-demonstration-dc46</loc></url>
<url><loc>https://apartresearch.com/project/a-multidimensional-judge-model-for-safe-consistent-and-ethical-ai-orchestration-2l0c</loc></url>
<url><loc>https://apartresearch.com/project/crosslingual-bias-detection-in-large-language-models-through-mechanistic-judge-model-evaluation-iflu</loc></url>
<url><loc>https://apartresearch.com/project/mechanistically-eliciting-misjudgements-in-large-language-models-ah8l</loc></url>
<url><loc>https://apartresearch.com/project/mechanistic-judging-and-llm-routing-evaluation-taskspecific-vulnerabilities-and-exploitable-failure-mode-751n</loc></url>
<url><loc>https://apartresearch.com/project/guardianloop-mechanistically-interpretable-microjudges-with-adversarial-selfimprovement-1b2p</loc></url>
<url><loc>https://apartresearch.com/project/tobias-better-web-pages-through-intelligent-routing-and-judgement-ea8h</loc></url>
<url><loc>https://apartresearch.com/project/routing-llms-using-distilled-predictors-and-confidence-thresholding-v5m6</loc></url>
<url><loc>https://apartresearch.com/project/reliability-judge-enhancing-llm-reliability-through-multimodel-judging-tdpp</loc></url>
<url><loc>https://apartresearch.com/project/leveraging-benford-law-for-computational-complexity</loc></url>
<url><loc>https://apartresearch.com/project/judge-using-sae-features-y1r1</loc></url>
<url><loc>https://apartresearch.com/project/escalation</loc></url>
<url><loc>https://apartresearch.com/project/evaluating-the-risk-of-job-displacement-by-transformative-ai-automation-in-developing-countries-a-case-study-on-brazil-829h</loc></url>
<url><loc>https://apartresearch.com/project/the-early-economic-impacts-of-transformative-ai-a-focus-on-temporal-coherence-ipql</loc></url>
<url><loc>https://apartresearch.com/project/the-rate-of-ai-adoption-and-its-implications-for-economic-growth-and-disparities-zlg6</loc></url>
<url><loc>https://apartresearch.com/project/economics-of-tai-sprint-submission-a-recursivelyinspired-framework-and-simulation-results-for-evaluating-a-valuebased-ubi-policy-mhn0</loc></url>
<url><loc>https://apartresearch.com/project/us1-full-ai-nationalization-can-cause-misaligned-economic-incentives-h9ne</loc></url>
<url><loc>https://apartresearch.com/project/economic-impact-analysis-the-impact-of-ai-on-the-indian-it-sector-hrpy</loc></url>
<url><loc>https://apartresearch.com/project/economics-of-tai-sprint-submission-redistributing-the-ai-dividend</loc></url>
<url><loc>https://apartresearch.com/project/economic-feasibility-of-universal-high-income-uhi-in-an-age-of-advanced-automation-jn3g</loc></url>
<url><loc>https://apartresearch.com/project/economics-of-tai-sprint-mitigating-ai-driven-income-equality</loc></url>
<url><loc>https://apartresearch.com/project/economics-of-ai-data-center-energy-infrastructure-strategic-blueprint-for-2030-scim</loc></url>
<url><loc>https://apartresearch.com/project/impact-of-generative-ai-on-tobacco-investment-and-tourism-industry-h8ql</loc></url>
<url><loc>https://apartresearch.com/project/data-as-capital-in-tai-economies-a-biomorphic-framework-oiez</loc></url>
<url><loc>https://apartresearch.com/project/recursive-fitness-alignment-protocol-rfap-29xi</loc></url>
<url><loc>https://apartresearch.com/project/calsandbox-and-the-clear-ai-act-a-stateled-vision-for-responsible-ai-governance-8g21</loc></url>
<url><loc>https://apartresearch.com/project/california-law-for-ethical-and-accountable-regulation-of-artificial-intelligence-clear-ai-act-xo4v</loc></url>
<url><loc>https://apartresearch.com/project/recommendation-to-establish-the-california-ai-accountability-and-redress-act-buqi</loc></url>
<url><loc>https://apartresearch.com/project/round-1-submission-9ven</loc></url>
<url><loc>https://apartresearch.com/project/flexheg-devices-to-enable-implementation-of-ai-intelsat-za6e</loc></url>
<url><loc>https://apartresearch.com/project/smart-governance-safer-innovation-a-california-ai-sandbox-with-guardrails-gq7c</loc></url>
<url><loc>https://apartresearch.com/project/flexheg-devices-to-enable-implementation-of-ai-intelsat-qx72</loc></url>
<url><loc>https://apartresearch.com/project/a-call-for-green-ai-in-california-evaluation-of-existing-and-alternative-regulations-qs1r</loc></url>
<url><loc>https://apartresearch.com/project/data-trusts-in-ai-governance-nhna</loc></url>
<url><loc>https://apartresearch.com/project/from-sandbox-to-standards-a-riskbased-strategy-for-responsible-ai-innovation-in-california-m9ul</loc></url>
<url><loc>https://apartresearch.com/project/the-incentive-gap-extending-darkbench-to-reveal-conflict-of-value-biases-in-llms</loc></url>
<url><loc>https://apartresearch.com/project/21st-century-healthcare-20th-century-rules-bridging-the-ai-regulation-gap-3ooz</loc></url>
<url><loc>https://apartresearch.com/project/ai-risk-management-framework-for-the-healthcare-sector-3gol</loc></url>
<url><loc>https://apartresearch.com/project/building-global-trust-and-security-a-framework-for-aidriven-criminal-scoring-in-immigration-systems-m2w4</loc></url>
<url><loc>https://apartresearch.com/project/leading-ai-governance-new-york-states-adaptive-risktiered-framework-policy-brief-wmqw</loc></url>
<url><loc>https://apartresearch.com/project/dark-patterns-and-emergent-alignment-faking</loc></url>
<url><loc>https://apartresearch.com/project/dimseat-evaluating-chain-of-thought-reasoning-models-for-dark-patterns</loc></url>
<url><loc>https://apartresearch.com/project/mechanisms-of-causal-reasoning</loc></url>
<url><loc>https://apartresearch.com/project/ai-control-via-debate-can-model-debate-catch-adversarial-code-6p6e</loc></url>
<url><loc>https://apartresearch.com/project/honeypotting-deceptive-ai-models-to-share-their-misinformation-goals-x3q7</loc></url>
<url><loc>https://apartresearch.com/project/evaluating-ai-debate-mechanisms-for-backdoor-detection-as-a-part-of-ai-control-setting-thsv</loc></url>
<url><loc>https://apartresearch.com/project/model-models-simulating-a-trusted-monitor-r682</loc></url>
<url><loc>https://apartresearch.com/project/debate-monitoring-comparitive-experiment-0sxl</loc></url>
<url><loc>https://apartresearch.com/project/collusion-and-mitigation-in-ai-control-pm60</loc></url>
<url><loc>https://apartresearch.com/project/eficas-wpfo</loc></url>
<url><loc>https://apartresearch.com/project/adding-document-summaries-to-control-arena-fggr</loc></url>
<url><loc>https://apartresearch.com/project/if-everythings-suspicious-nothing-is-28zn</loc></url>
<url><loc>https://apartresearch.com/project/stop-hitting-yourself-leveraging-helpful-assistance-as-an-attack-vector-w5rt</loc></url>
<url><loc>https://apartresearch.com/project/can-models-use-their-chainofthought-to-attack-overseers-prcv</loc></url>
<url><loc>https://apartresearch.com/project/interactive-monitoring-control-hackathon</loc></url>
<url><loc>https://apartresearch.com/project/schelling-coordination-via-agentic-loops-azvd</loc></url>
<url><loc>https://apartresearch.com/project/token-of-power-top-4ome</loc></url>
<url><loc>https://apartresearch.com/project/kernel-of-trust-evaluating-ai-control-protocols-using-opensource-data-148y</loc></url>
<url><loc>https://apartresearch.com/project/ai-control-through-majority-voting-uiaa</loc></url>
<url><loc>https://apartresearch.com/project/exploration-chatbased-social-engineering-fkqa</loc></url>
<url><loc>https://apartresearch.com/project/safety-metric-and-prompt-engineering-for-red-team-q2d6</loc></url>
<url><loc>https://apartresearch.com/project/deceptive-ai-a-new-control-setting-for-human-manipulation-in-decisionmaking-environments-ub38</loc></url>
<url><loc>https://apartresearch.com/project/ai-safety-escape-room</loc></url>
<url><loc>https://apartresearch.com/project/inspiring-people-to-go-into-rl-interp</loc></url>
<url><loc>https://apartresearch.com/project/a-noise-audit-of-llm-reasoning-in-legal-decisions</loc></url>
<url><loc>https://apartresearch.com/project/feature-based-analysis-of-cooperation-relevant-behaviour-in-prisoner-s-dilemma</loc></url>
<url><loc>https://apartresearch.com/project/red-teaming-with-mech-interpretability</loc></url>
<url><loc>https://apartresearch.com/project/attention-pattern-based-information-flow-visualization-tool-e19d</loc></url>
<url><loc>https://apartresearch.com/project/llm-military-decision-making-under-uncertainty-a-simulation-study</loc></url>
<url><loc>https://apartresearch.com/project/morph-ai-safety-education-adaptable-to-(almost)-anyone</loc></url>
<url><loc>https://apartresearch.com/project/interactive-assessments-for-ai-safety-a-gamified-approach-to-evaluation-and-personal-journey-mapping</loc></url>
<url><loc>https://apartresearch.com/project/mechanistic-interpretability-track-neuronal-pathway-coverage</loc></url>
<url><loc>https://apartresearch.com/project/preparing-for-accelerated-agi-timelines</loc></url>
<url><loc>https://apartresearch.com/project/identification-if-ai-generated-content</loc></url>
<url><loc>https://apartresearch.com/project/superposition-but-at-a-cross-mlp-layers-view</loc></url>
<url><loc>https://apartresearch.com/project/hikayat-interactive-stories-to-learn-ai-safety</loc></url>
<url><loc>https://apartresearch.com/project/medical-agent-controller</loc></url>
<url><loc>https://apartresearch.com/project/hallushield-a-mechanistic-approach-to-hallucination-resistant-models</loc></url>
<url><loc>https://apartresearch.com/project/searching-for-universality-and-equivariance-in-llms-using-sparse-autoencoder-found-features</loc></url>
<url><loc>https://apartresearch.com/project/debugging-language-models-with-saes</loc></url>
<url><loc>https://apartresearch.com/project/ai-through-the-human-lens-investigating-cognitive-theories-in-machine-psychology</loc></url>
<url><loc>https://apartresearch.com/project/u-reg-ai-you-regulate-it-or-you-regenerate-it</loc></url>
<url><loc>https://apartresearch.com/project/an-interpretable-classifier-based-on-large-scale-social-network-analysis</loc></url>
<url><loc>https://apartresearch.com/project/ai-bias-in-resume-screening</loc></url>
<url><loc>https://apartresearch.com/project/scam-detective-using-gamification-to-improve-ai-powered-scam-awareness</loc></url>
<url><loc>https://apartresearch.com/project/bluedot-impact-connect-a-comprehensive-ai-safety-community-platform</loc></url>
<url><loc>https://apartresearch.com/project/ai-society-tracker</loc></url>
<url><loc>https://apartresearch.com/project/detecting-malicious-ai-agents-through-simulated-interactions</loc></url>
<url><loc>https://apartresearch.com/project/beyond-statistical-parrots-unveiling-cognitive-similarities-and-exploring-ai-psychology-through-human-ai-interaction</loc></url>
<url><loc>https://apartresearch.com/project/latent-knowledge-analysis-via-feature-based-causal-tracing</loc></url>
<url><loc>https://apartresearch.com/project/safeai-academy-enhancing-ai-safety-awareness-through-interactive-learning</loc></url>
<url><loc>https://apartresearch.com/project/ai-hallucinations-in-healthcare-cross-cultural-and-linguistic-risks-of-llms-in-low-resource-languages</loc></url>
<url><loc>https://apartresearch.com/project/moral-wiggle-room-in-ai</loc></url>
<url><loc>https://apartresearch.com/project/ai-powered-policymaking-behavioral-nudges-and-democratic-accountability</loc></url>
<url><loc>https://apartresearch.com/project/buggy-supporting-ai-safety-education-through-gamified-learning</loc></url>
<url><loc>https://apartresearch.com/project/cotep-a-multi-modal-chain-of-thought-evaluation-platform-for-the-next-generation-of-sota-ai-models</loc></url>
<url><loc>https://apartresearch.com/project/safe-ai</loc></url>
<url><loc>https://apartresearch.com/project/ai-risk-management-assurance-network-(airman)</loc></url>
<url><loc>https://apartresearch.com/project/prompt-question-shield</loc></url>
<url><loc>https://apartresearch.com/project/scoped-llm-enhancing-adversarial-robustness-and-security-through-targeted-model-scoping</loc></url>
<url><loc>https://apartresearch.com/project/hitl-for-high-risk-ai-domains</loc></url>
<url><loc>https://apartresearch.com/project/neural-seal</loc></url>
<url><loc>https://apartresearch.com/project/securing-agi-deployment-and-mitigating-safety-risks</loc></url>
<url><loc>https://apartresearch.com/project/cite2root</loc></url>
<url><loc>https://apartresearch.com/project/vaultx-ai-driven-middleware-for-real-time-pii-detection-and-data-security</loc></url>
<url><loc>https://apartresearch.com/project/align-file</loc></url>
<url><loc>https://apartresearch.com/project/llm-prompt-optimiser-based-saas-platform-for-evaluations</loc></url>
<url><loc>https://apartresearch.com/project/navigating-the-agi-revolution-retraining-and-redefining-human-purpose</loc></url>
<url><loc>https://apartresearch.com/project/towards-an-agent-marketplace-for-alignment-research-(amar)</loc></url>
<url><loc>https://apartresearch.com/project/ai-safety-evaluation-benchmarking-framework</loc></url>
<url><loc>https://apartresearch.com/project/restriktai-enhancing-safety-and-control-for-autonomous-ai-agents</loc></url>
<url><loc>https://apartresearch.com/project/antimidas-building-commercially-viable-agents-for-alignment-dataset-generation</loc></url>
<url><loc>https://apartresearch.com/project/enhancing-human-intelligence-with-neurofeedback</loc></url>
<url><loc>https://apartresearch.com/project/building-bridges-for-ai-safety-proposal-for-a-collaborative-platform-for-alumni-and-researchers</loc></url>
<url><loc>https://apartresearch.com/project/modernizing-dc-s-emergency-communications</loc></url>
<url><loc>https://apartresearch.com/project/bias-mitigation-in-llm-by-steering-features</loc></url>
<url><loc>https://apartresearch.com/project/faithful-or-factual-tuning-mistake-acknowledgment-in-llms</loc></url>
<url><loc>https://apartresearch.com/project/improving-llama-3-8b-instruct-hallucination-robustness-in-medical-q-a-using-feature-steering</loc></url>
<url><loc>https://apartresearch.com/project/can-we-steer-a-model-s-behavior-with-just-one-prompt-investigating-sae-driven-auto-steering</loc></url>
<url><loc>https://apartresearch.com/project/autosteer-weight-preserving-reinforcement-learning-for-interpretable-model-control</loc></url>
<url><loc>https://apartresearch.com/project/utilitarian-decision-making-in-models-evaluation-and-steering</loc></url>
<url><loc>https://apartresearch.com/project/investigating-feature-effects-on-manipulation-susceptibility</loc></url>
<url><loc>https://apartresearch.com/project/sage-safe-adaptive-generation-engine-for-long-form-document-generation-in-collaborative-high-stakes-domains</loc></url>
<url><loc>https://apartresearch.com/project/bias-mitigation</loc></url>
<url><loc>https://apartresearch.com/project/analyzing-dataset-bias-with-saes</loc></url>
<url><loc>https://apartresearch.com/project/unveiling-latent-beliefs-using-sparse-autoencoders</loc></url>
<url><loc>https://apartresearch.com/project/classification-on-latent-feature-activation-for-detecting-adversarial-prompt-vulnerabilities</loc></url>
<url><loc>https://apartresearch.com/project/sparse-autoencoders-and-gemma-2-2b-pioneering-demographic-sensitive-language-modeling-for-opinion-qa</loc></url>
<url><loc>https://apartresearch.com/project/improving-llama-3-8b-hallucination-robustness-in-medical-q-a-using-feature-steering</loc></url>
<url><loc>https://apartresearch.com/project/assessing-language-model-cybersecurity-capabilities-with-feature-steering</loc></url>
<url><loc>https://apartresearch.com/project/math-speaks-all-languages-enhancing-llm-problem-solving-across-multilingual-contexts</loc></url>
<url><loc>https://apartresearch.com/project/edufire-personalized-education-platform-using-llm-steering</loc></url>
<url><loc>https://apartresearch.com/project/explaining-latents-in-turing-llm-1-0-254m-with-pre-defined-function-types</loc></url>
<url><loc>https://apartresearch.com/project/investigate-arithmetic-features-in-multi-lingual-llms</loc></url>
<url><loc>https://apartresearch.com/project/tentative-proposal-for-ai-control-with-weak-supervisors-trough-mechanistic-inspection</loc></url>
<url><loc>https://apartresearch.com/project/clear-thought-and-clear-speech-reducing-grammatical-scope-ambiguity</loc></url>
<url><loc>https://apartresearch.com/project/bbllm</loc></url>
<url><loc>https://apartresearch.com/project/let-llm-agents-perform-llm-surgery</loc></url>
<url><loc>https://apartresearch.com/project/steering-swiftly-to-safety-with-sparse-autoencoders</loc></url>
<url><loc>https://apartresearch.com/project/feature-tuning-versus-prompting-for-ambiguous-questions</loc></url>
<url><loc>https://apartresearch.com/project/auto-prompt-injection</loc></url>
<url><loc>https://apartresearch.com/project/feature-based-unlearning</loc></url>
<url><loc>https://apartresearch.com/project/recovering-goodfire-s-sae-feature-vectors-from-their-api</loc></url>
<url><loc>https://apartresearch.com/project/encouraging-chain-of-thought-reasoning</loc></url>
<url><loc>https://apartresearch.com/project/user-transparency-within-ai</loc></url>
<url><loc>https://apartresearch.com/project/community-first-a-rights-based-framework-for-ai-governance-in-india-s-welfare-systems</loc></url>
<url><loc>https://apartresearch.com/project/national-data-privacy-and-governance-act</loc></url>
<url><loc>https://apartresearch.com/project/promoting-school-level-accountability-for-the-responsible-deployment-of-ai-and-related-systems-in-k-12-education-mitigating-bias-and-increasing-transparency</loc></url>
<url><loc>https://apartresearch.com/project/implementing-a-human-centered-ai-assessment-framework-(haaf)-for-equitable-ai-development</loc></url>
<url><loc>https://apartresearch.com/project/a-critical-review-of-chips-for-peace-lessons-from-atoms-for-peace</loc></url>
<url><loc>https://apartresearch.com/project/ai-monitoring-as-a-rapid-and-scalable-policy-solution-weekly-global-bulletins-on-ai-developments</loc></url>
<url><loc>https://apartresearch.com/project/grandfather-paradox-in-ai-bias-mitigation-ethical-ai1</loc></url>
<url><loc>https://apartresearch.com/project/glia-for-healthcare-organisations</loc></url>
<url><loc>https://apartresearch.com/project/a-fundamental-rethinking-to-ai-evaluations-establishing-a-constitution-based-framework</loc></url>
<url><loc>https://apartresearch.com/project/advancing-global-governance-for-frontier-ai-a-proposal-for-an-aisi-led-working-group-under-the-ai-safety-summit-series</loc></url>
<url><loc>https://apartresearch.com/project/finding-circular-features-in-gemma-2-2b</loc></url>
<url><loc>https://apartresearch.com/project/digital-rebellion-analyzing-misaligned-ai-agent-cooperation-for-virtual-labor-strikes</loc></url>
<url><loc>https://apartresearch.com/project/mapping-intent-documenting-policy-adherence-with-ontology-extraction</loc></url>
<url><loc>https://apartresearch.com/project/safebites</loc></url>
<url><loc>https://apartresearch.com/project/applai</loc></url>
<url><loc>https://apartresearch.com/project/policy-analysis-ai-and-sustainability-climate-impact-monitoring</loc></url>
<url><loc>https://apartresearch.com/project/understanding-incentives-to-build-uninterruptible-agentic-ai-systems</loc></url>
<url><loc>https://apartresearch.com/project/ai-parliament</loc></url>
<url><loc>https://apartresearch.com/project/mheatlth-ai</loc></url>
<url><loc>https://apartresearch.com/project/next-gen-ai-enhanced-epidemic-intelligence</loc></url>
<url><loc>https://apartresearch.com/project/glia</loc></url>
<url><loc>https://apartresearch.com/project/ai-advisory-council-for-sustainable-economic-growth-and-ethical-innovation-in-the-dominican-republic-(cania)</loc></url>
<url><loc>https://apartresearch.com/project/robust-machine-unlearning-for-dangerous-capabilities</loc></url>
<url><loc>https://apartresearch.com/project/ai-and-public-health-tsa-pre-health-check</loc></url>
<url><loc>https://apartresearch.com/project/hero-journey-personalized-health-interventions-for-the-incarcerated</loc></url>
<url><loc>https://apartresearch.com/project/econavix</loc></url>
<url><loc>https://apartresearch.com/project/towards-a-unified-framework-for-cybersecurity-and-ai-safety-recommendations-for-secure-development-of-large-language-models</loc></url>
<url><loc>https://apartresearch.com/project/enviro-a-comprehensive-environmental-solution-using-policy-and-technology</loc></url>
<url><loc>https://apartresearch.com/project/enhancing-human-verification-systems-to-address-ai-agent-circumvention-and-attributability-concerns</loc></url>
<url><loc>https://apartresearch.com/project/reprocessing-nuclear-waste-from-small-modular-reactors-(smrs)</loc></url>
<url><loc>https://apartresearch.com/project/politicians-on-ai-safety</loc></url>
<url><loc>https://apartresearch.com/project/policy-framework-for-sustainable-ai-repurposing-waste-heat-from-data-centers-in-the-usa</loc></url>
<url><loc>https://apartresearch.com/project/predictive-analytics-imagery-for-environmental-monitoring</loc></url>
<url><loc>https://apartresearch.com/project/proposal-for-u-s-china-technical-cooperation-on-ai-safety</loc></url>
<url><loc>https://apartresearch.com/project/proposal-for-a-provisional-fda-designation-targeting-biomedical-products-evaluated-with-novel-methodologies</loc></url>
<url><loc>https://apartresearch.com/project/reparative-algorithmic-impact-assessments-a-human-centered-justice-oriented-accountability-framework</loc></url>
<url><loc>https://apartresearch.com/project/infectious-disease-outbreak-prediction-and-dashboard</loc></url>
<url><loc>https://apartresearch.com/project/pan-your-smart-sustainability-expert</loc></url>
<url><loc>https://apartresearch.com/project/very-cooperative-agent</loc></url>
<url><loc>https://apartresearch.com/project/cross-model-surveillance-for-emails-handling</loc></url>
<url><loc>https://apartresearch.com/project/inference-time-agent-security</loc></url>
<url><loc>https://apartresearch.com/project/diamonds-are-not-all-you-need</loc></url>
<url><loc>https://apartresearch.com/project/cop-n-shop</loc></url>
<url><loc>https://apartresearch.com/project/intent-inspector-protecting-against-prompt-injections-for-agent-tool-misuse</loc></url>
<url><loc>https://apartresearch.com/project/ai-honeypot</loc></url>
<url><loc>https://apartresearch.com/project/dynamic-risk-assessment-in-autonomous-agents-using-ontologies-and-ai</loc></url>
<url><loc>https://apartresearch.com/project/ocap-agents</loc></url>
<url><loc>https://apartresearch.com/project/ai-agent-capabilities-evolution</loc></url>
<url><loc>https://apartresearch.com/project/an-autonomous-agent-for-model-attribution</loc></url>
<url><loc>https://apartresearch.com/project/using-arc-agi-puzzles-as-captcha-task</loc></url>
<url><loc>https://apartresearch.com/project/llm-agent-security-jailbreaking-vulnerabilities-and-mitigation-strategies</loc></url>
<url><loc>https://apartresearch.com/project/interpreting-a-toy-model-for-finding-the-maximum-element-in-a-list</loc></url>
<url><loc>https://apartresearch.com/project/nnsight-transparent-debugging</loc></url>
<url><loc>https://apartresearch.com/project/mintranscoders</loc></url>
<url><loc>https://apartresearch.com/project/latent-space-clustering-and-summarization</loc></url>
<url><loc>https://apartresearch.com/project/tiny-model</loc></url>
<url><loc>https://apartresearch.com/project/thermesagent</loc></url>
<url><loc>https://apartresearch.com/project/attention-deficit-agreeable-agent</loc></url>
<url><loc>https://apartresearch.com/project/ramon</loc></url>
<url><loc>https://apartresearch.com/project/guardianai</loc></url>
<url><loc>https://apartresearch.com/project/devising-effective-bechmarks</loc></url>
<url><loc>https://apartresearch.com/project/simulation-operators-the-next-level-of-the-annotation-business</loc></url>
<url><loc>https://apartresearch.com/project/welma-open-world-environments-for-language-model-agents</loc></url>
<url><loc>https://apartresearch.com/project/steer-an-api-to-steer-open-llms</loc></url>
<url><loc>https://apartresearch.com/project/identity-system-for-ais</loc></url>
<url><loc>https://apartresearch.com/project/ai-safety-collective-crowdsourcing-solutions-for-critical-ai-safety-challenges</loc></url>
<url><loc>https://apartresearch.com/project/camara-a-comprehensive-adaptive-multi-agent-framework-for-red-teaming-and-adversarial-defense</loc></url>
<url><loc>https://apartresearch.com/project/amplified-wise-simulations-for-safe-training-and-deployment</loc></url>
<url><loc>https://apartresearch.com/project/lign-aligned-agent-based-workflows-via-collaboration-safety-protocols</loc></url>
<url><loc>https://apartresearch.com/project/jailbreaking-general-purpose-robots</loc></url>
<url><loc>https://apartresearch.com/project/darkforest-defending-the-authentic-and-humane-web</loc></url>
<url><loc>https://apartresearch.com/project/demonstrating-llm-code-injection-via-compromised-agent-tool</loc></url>
<url><loc>https://apartresearch.com/project/phish-tycoon-phishing-using-voice-cloning</loc></url>
<url><loc>https://apartresearch.com/project/misinformational-ai-generated-academic-papers</loc></url>
<url><loc>https://apartresearch.com/project/copirate</loc></url>
<url><loc>https://apartresearch.com/project/grandslam-usecases-not-technology</loc></url>
<url><loc>https://apartresearch.com/project/ai-agents-for-personalized-interaction-and-behavioral-analysis</loc></url>
<url><loc>https://apartresearch.com/project/speculative-consequences-of-a-i-misuse</loc></url>
<url><loc>https://apartresearch.com/project/llm-code-injection</loc></url>
<url><loc>https://apartresearch.com/project/redfluence</loc></url>
<url><loc>https://apartresearch.com/project/bbc-news-impersonator</loc></url>
<url><loc>https://apartresearch.com/project/unsolved-ai-safety-concepts-explorer</loc></url>
<url><loc>https://apartresearch.com/project/ai-research-paper-processor</loc></url>
<url><loc>https://apartresearch.com/project/sleeper-agents-detector</loc></url>
<url><loc>https://apartresearch.com/project/adgpt</loc></url>
<url><loc>https://apartresearch.com/project/general-pervasiveness</loc></url>
<url><loc>https://apartresearch.com/project/webcam</loc></url>
<url><loc>https://apartresearch.com/project/verifystream</loc></url>
<url><loc>https://apartresearch.com/project/web-app-for-interacting-with-refusal-ablated-language-model-agents</loc></url>
<url><loc>https://apartresearch.com/project/alignment-research-critiquer</loc></url>
<url><loc>https://apartresearch.com/project/pureprompt-an-easy-tool-for-prompt-robustness-and-eval-augmentation</loc></url>
<url><loc>https://apartresearch.com/project/llm-research-collaboration-recommender</loc></url>
<url><loc>https://apartresearch.com/project/data-massager</loc></url>
<url><loc>https://apartresearch.com/project/ai-alignment-toolkit-research-assistant</loc></url>
<url><loc>https://apartresearch.com/project/grant-application-simulator</loc></url>
<url><loc>https://apartresearch.com/project/ai-alignment-knowledge-graph</loc></url>
<url><loc>https://apartresearch.com/project/reflections-on-using-llms-to-read-a-paper</loc></url>
<url><loc>https://apartresearch.com/project/academic-weapon</loc></url>
<url><loc>https://apartresearch.com/project/detecting-lies-of-(c)omission</loc></url>
<url><loc>https://apartresearch.com/project/the-house-always-wins-a-framework-for-evaluating-strategic-deception-in-llms</loc></url>
<url><loc>https://apartresearch.com/project/detecting-and-controlling-deceptive-representation-in-llms-with-representational-engineering</loc></url>
<url><loc>https://apartresearch.com/project/sandbag-detection-through-model-degradation</loc></url>
<url><loc>https://apartresearch.com/project/detecting-deception-in-gpt-3-5-turbo-a-metadata-based-approach</loc></url>
<url><loc>https://apartresearch.com/project/can-language-models-sandbag-manipulation</loc></url>
<url><loc>https://apartresearch.com/project/deceptive-behavior-does-not-seem-to-be-reducible-to-a-single-vector</loc></url>
<url><loc>https://apartresearch.com/project/werewolf-benchmark</loc></url>
<url><loc>https://apartresearch.com/project/detecting-deception-with-ai-tics</loc></url>
<url><loc>https://apartresearch.com/project/eliciting-maximally-distressing-questions-for-deceptive-llms</loc></url>
<url><loc>https://apartresearch.com/project/evaluating-steering-methods-for-deceptive-behavior-control-in-llms</loc></url>
<url><loc>https://apartresearch.com/project/an-exploration-of-current-theory-of-mind-evals</loc></url>
<url><loc>https://apartresearch.com/project/sandbagging-llms-using-activation-steering</loc></url>
<url><loc>https://apartresearch.com/project/towards-a-benchmark-for-self-correction-on-model-attributed-misinformation</loc></url>
<url><loc>https://apartresearch.com/project/boosting-language-model-honesty-with-truthful-suffixes</loc></url>
<url><loc>https://apartresearch.com/project/detection-of-potentially-deceptive-attitudes-using-expression-style-analysis</loc></url>
<url><loc>https://apartresearch.com/project/from-sycophancy-(not)-to-sandbagging</loc></url>
<url><loc>https://apartresearch.com/project/gradient-based-deceptive-trigger-discovery</loc></url>
<url><loc>https://apartresearch.com/project/modelling-the-oversight-of-automated-interpretability-against-deceptive-agents-on-sparse-autoencoders</loc></url>
<url><loc>https://apartresearch.com/project/evaluating-and-inducing-steganography-in-llms</loc></url>
<url><loc>https://apartresearch.com/project/developing-a-deception-dataset</loc></url>
<url><loc>https://apartresearch.com/project/unsupervised-recovery-of-hidden-markov-models-from-transformers-with-evolutionary-algorithms</loc></url>
<url><loc>https://apartresearch.com/project/looking-forward-to-posterity-what-past-information-is-transferred-to-the-future</loc></url>
<url><loc>https://apartresearch.com/project/investigating-the-effect-of-model-capacity-constraints-on-belief-state-representations</loc></url>
<url><loc>https://apartresearch.com/project/belief-state-representations-in-transformer-models-on-nonergodic-data</loc></url>
<url><loc>https://apartresearch.com/project/rnns-represent-belief-state-geometry-in-hidden-state</loc></url>
<url><loc>https://apartresearch.com/project/steering-model-s-belief-states</loc></url>
<url><loc>https://apartresearch.com/project/handcrafting-a-network-to-predict-next-token-probabilities-for-the-random-random-xor-process</loc></url>
<url><loc>https://apartresearch.com/project/exploring-hierarchical-structure-representation-in-transformer-models-through-computational-mechanics</loc></url>
<url><loc>https://apartresearch.com/project/rainboltbench-benchmarking-user-location-inference-through-single-images</loc></url>
<url><loc>https://apartresearch.com/project/llm-benchmarking-with-single-agent-stochastic-dynamic-simulations</loc></url>
<url><loc>https://apartresearch.com/project/benchmark-for-emergent-capabilities-in-high-risk-scenarios-2</loc></url>
<url><loc>https://apartresearch.com/project/benchmark-for-emergent-capabilities-in-high-risk-scenarios</loc></url>
<url><loc>https://apartresearch.com/project/benchmarking-dark-patterns-in-llms</loc></url>
<url><loc>https://apartresearch.com/project/say-no-to-mass-destruction-benchmarking-refusals-to-answer-dangerous-questions</loc></url>
<url><loc>https://apartresearch.com/project/cybersecurity-persistence-benchmark</loc></url>
<url><loc>https://apartresearch.com/project/washbench-a-benchmark-for-assessing-softening-of-harmful-content-in-llm-generated-text-summaries</loc></url>
<url><loc>https://apartresearch.com/project/evaluating-the-ability-of-llms-to-follow-rules</loc></url>
<url><loc>https://apartresearch.com/project/black-box-detection-of-sleeper-agents</loc></url>
<url><loc>https://apartresearch.com/project/manifold-recovery-as-a-benchmark-for-text-embedding-models</loc></url>
<url><loc>https://apartresearch.com/project/anthroprobe</loc></url>
<url><loc>https://apartresearch.com/project/jekyll-and-haide-the-better-an-llm-is-at-identifying-misinformation-the-more-effective-it-is-at-worsening-it</loc></url>
<url><loc>https://apartresearch.com/project/the-role-of-ai-in-combating-political-deepfakes-in-african-democracies</loc></url>
<url><loc>https://apartresearch.com/project/legislaitor-a-tool-for-jailbreaking-the-legislative-process</loc></url>
<url><loc>https://apartresearch.com/project/subtle-and-simple-ways-to-shift-political-bias-in-llms</loc></url>
<url><loc>https://apartresearch.com/project/beyond-refusal-scrubbing-hazards-from-open-source-models</loc></url>
<url><loc>https://apartresearch.com/project/silent-curriculum</loc></url>
<url><loc>https://apartresearch.com/project/building-more-democratic-institutions-with-collaboratively-constructed-debate-moderation-tools</loc></url>
<url><loc>https://apartresearch.com/project/ai-misinformation-and-threats-to-democratic-rights</loc></url>
<url><loc>https://apartresearch.com/project/artificial-advocates-biasing-democratic-feedback-using-ai</loc></url>
<url><loc>https://apartresearch.com/project/assessing-algorithmic-bias-in-large-language-models-predictions-of-public-opinion-across-demographics</loc></url>
<url><loc>https://apartresearch.com/project/ai-misinformation-threatens-the-wisdom-of-the-crowd</loc></url>
<url><loc>https://apartresearch.com/project/trustworthy-or-knave-scoring-politicians-with-ai-in-real-time</loc></url>
<url><loc>https://apartresearch.com/project/unleashing-sleeper-agents</loc></url>
<url><loc>https://apartresearch.com/project/multilingual-bias-in-large-language-models-assessing-political-skew-across-languages</loc></url>
<url><loc>https://apartresearch.com/project/ai-in-the-newsroom-analyzing-the-increase-in-chatgpt-favored-words-in-news-articles</loc></url>
<url><loc>https://apartresearch.com/project/wndp-defense-weapons-of-mass-disruption</loc></url>
<url><loc>https://apartresearch.com/project/democracy-and-ai-ensuring-election-efficiency-in-nigeria-and-africa</loc></url>
<url><loc>https://apartresearch.com/project/universal-jailbreak-of-closed-source-llms-which-provide-an-end-point-to-finetune</loc></url>
<url><loc>https://apartresearch.com/project/ai-politician</loc></url>
<url><loc>https://apartresearch.com/project/a-framework-for-centralizing-forces-in-ai</loc></url>
<url><loc>https://apartresearch.com/project/digital-diplomacy-advancing-digital-peace-building-with-al-in-africa-2</loc></url>
<url><loc>https://apartresearch.com/project/digital-diplomacy-advancing-digital-peace-building-with-al-in-africa</loc></url>
<url><loc>https://apartresearch.com/project/investigating-detection-of-election-influencing-sleeper-agents-using-probes</loc></url>
<url><loc>https://apartresearch.com/project/no-place-is-safe-automated-investigation-of-private-communities</loc></url>
<url><loc>https://apartresearch.com/project/use-of-ai-in-political-campaigns-gap-assessment-and-recommendations</loc></url>
<url><loc>https://apartresearch.com/news/explaining-the-apart-research-fellowships</loc></url>
<url><loc>https://apartresearch.com/news/problem-areas-in-physics-and-ai-safety</loc></url>
<url><loc>https://apartresearch.com/news/apart-two-days-left-of-our-fundraiser</loc></url>
<url><loc>https://apartresearch.com/news/apart-fundraiser-extended</loc></url>
<url><loc>https://apartresearch.com/news/apart-fundraiser-update</loc></url>
<url><loc>https://apartresearch.com/news/beyond-monolithic-ai-the-case-for-an-expert-orchestration-architecture</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-transformative-ai-economics</loc></url>
<url><loc>https://apartresearch.com/news/engineering-a-world-designed-for-safe-superintelligence</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-our-biggest-event-ever</loc></url>
<url><loc>https://apartresearch.com/news/women-in-ai-safety-hackathon-round-up</loc></url>
<url><loc>https://apartresearch.com/news/mapping-ai-safety-research-an-open-source-knowledge-graph</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-san-francisco-edition</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-iclr-awards-women-in-ai-safety</loc></url>
<url><loc>https://apartresearch.com/news/uncovering-model-manipulation-with-darkbench</loc></url>
<url><loc>https://apartresearch.com/news/studio-progress-report</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-esben-at-iaseai-studio-progress-report</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-paris-ai-summit-catching-hackers</loc></url>
<url><loc>https://apartresearch.com/news/ai-safety-entrepreneurship-hackathon-round-up</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-ai-entrepreneurship-new-research</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-exclusive-interview-with-interpretability-insider</loc></url>
<url><loc>https://apartresearch.com/news/behind-the-features-goodfire-s-interpretability-tools-in-action</loc></url>
<url><loc>https://apartresearch.com/news/promising-results-from-latent-adversarial-training</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-new-lat-research-just-dropped</loc></url>
<url><loc>https://apartresearch.com/news/inside-the-first-ai-policy-hackathon-at-johns-hopkins</loc></url>
<url><loc>https://apartresearch.com/news/apart-in-2024</loc></url>
<url><loc>https://apartresearch.com/news/ai-hackers-in-the-wild-llm-agent-honeypot</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-hackathons-in-2025-preview</loc></url>
<url><loc>https://apartresearch.com/news/sparse-autoencoder-hackathon</loc></url>
<url><loc>https://apartresearch.com/news/rethinking-cyberseceval-an-llm-aided-approach-to-evaluation-critique</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-our-research-at-neurips</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-new-video-jacob-haimes-on-working-at-apart</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-2024-was-our-biggest-year-yet</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-how-impactful-are-we</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-new-papers-elections-goodfire</loc></url>
<url><loc>https://apartresearch.com/news/testing-llms-ability-to-find-security-flaws-in-cryptographic-protocols</loc></url>
<url><loc>https://apartresearch.com/news/how-impactful-is-donating-to-apart-research</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-announcing-apart-lab-studio</loc></url>
<url><loc>https://apartresearch.com/news/announcing-apart-lab-studio</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-ale-cash-prizes-the-uk-s-aisi</loc></url>
<url><loc>https://apartresearch.com/news/researcher-spotlight-alexandra-abbas</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-esben-winning-sprints-3cb</loc></url>
<url><loc>https://apartresearch.com/news/esben-on-agi-sentware-and-confident-optimism</loc></url>
<url><loc>https://apartresearch.com/news/3cb-the-catastrophic-cyber-capabilities-benchmark</loc></url>
<url><loc>https://apartresearch.com/news/ai-policy-hackathon-in-washington-d-c</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-finn-cyber-offense-johns-hopkins</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-clement-benchmarks-d-c</loc></url>
<url><loc>https://apartresearch.com/news/benchmark-inflation-revealing-llm-performance-gaps-using-retro-holdouts</loc></url>
<url><loc>https://apartresearch.com/news/researcher-spotlight-clement-neo</loc></url>
<url><loc>https://apartresearch.com/news/researcher-spotlight-akash-kundu</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-researcher-spotlight-new-team-member-bangalore</loc></url>
<url><loc>https://apartresearch.com/news/esben-on-agent-safety-research</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-agents-submissions-spain</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-new-research-neurips-papers-team-offsite</loc></url>
<url><loc>https://apartresearch.com/news/do-models-really-internalize-our-preferences</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-o1-awards-singapore</loc></url>
<url><loc>https://apartresearch.com/news/apart-news-ai-startups-india-concordia</loc></url>
<url><loc>https://apartresearch.com/news/can-startups-be-impactful-in-ai-safety</loc></url>
<url><loc>https://apartresearch.com/news/where-we-are-on-for-profit-ai-safety</loc></url>
<url><loc>https://apartresearch.com/news/finding-deception-in-language-models</loc></url>
<url><loc>https://apartresearch.com/news/code-red-llm-evaluations-hackathon-wrap-up-(metr-and-apart)</loc></url>
<url><loc>https://apartresearch.com/news/the-ultimate-guide-to-ai-safety-research-hackathons</loc></url>
<url><loc>https://apartresearch.com/news/join-us-at-the-ai-x-democracy-research-hackathon</loc></url>
<url><loc>https://apartresearch.com/news/join-the-ai-evaluation-tasks-bounty-hackathon-with-metr</loc></url>
<url><loc>https://apartresearch.com/news/how-to-organize-a-research-hackathon</loc></url>
<url><loc>https://apartresearch.com/news/researcher-spotlight-jacob-haimes</loc></url>
<url><loc>https://apartresearch.com/news/ai-safety-needs-to-scale-and-heres-how-you-can-do-it</loc></url>
<url><loc>https://apartresearch.com/news/for-profit-ai-safety</loc></url>
<url><loc>https://apartresearch.com/news/taking-your-next-steps-after-a-research-hackathon</loc></url>
<url><loc>https://apartresearch.com/news/why-organize-a-research-hackathon</loc></url>
<url><loc>https://apartresearch.com/news/updated-quickstart-guide-for-mechanistic-interpretability</loc></url>
<url><loc>https://apartresearch.com/news/results-from-the-scale-oversight-hackathon</loc></url>
<url><loc>https://apartresearch.com/news/results-from-the-ai-testing-hackathon</loc></url>
<url><loc>https://apartresearch.com/news/results-from-the-language-model-hackathon</loc></url>
<url><loc>https://apartresearch.com/news/results-from-the-interpretability-hackathon</loc></url>
</urlset>