<?xml version="1.0" encoding="UTF-8"?>
<!--
  Sitemap (sitemaps.org 0.9 schema) enumerating the pages of this site.

  NOTE(review): every <loc> below is a site-relative path (starts with "/").
  The sitemap protocol expects absolute URLs that include the scheme and
  host. The site's origin is not visible in this file; confirm the base URL
  configured for whatever produces this sitemap and regenerate.
-->
<urlset xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
        xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd"
        xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">

  <!-- Entries under /external/, each with a lastmod matching the date in its path. -->
  <url>
    <loc>/external/2024/2024-03-14-fsdp-qlora-deep-dive</loc>
    <lastmod>2024-03-14T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>/external/2024/2024-12-19-finally-replacement-for-bert</loc>
    <lastmod>2024-12-19T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>/external/2025/2025-02-10-masked-language-models-zero-shot</loc>
    <lastmod>2025-02-10T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>/external/2025/2025-11-14-openmidnight</loc>
    <lastmod>2025-11-14T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>/external/2025/2025-12-22-medmarks_01</loc>
    <lastmod>2025-12-22T00:00:00+00:00</lastmod>
  </url>

  <!-- Dated entries (/YYYY/MM/DD/slug.html), in ascending date order. -->
  <url>
    <loc>/2021/07/19/benchmarking-pytorch-native-mish.html</loc>
    <lastmod>2021-07-19T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>/2021/10/01/inference-with-fastai.html</loc>
    <lastmod>2021-10-01T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>/2021/12/08/testing-amazon-sagemaker-studio-lab.html</loc>
    <lastmod>2021-12-08T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>/2022/03/11/detecting-cloud-cover-via-satellite.html</loc>
    <lastmod>2022-03-11T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>/2022/06/06/introducing-fastxtend.html</loc>
    <lastmod>2022-06-06T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>/2022/06/14/debugging-pytorch-performance-decrease.html</loc>
    <lastmod>2022-06-14T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>/2022/07/14/tinkering-with-attention-pooling.html</loc>
    <lastmod>2022-07-14T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>/2022/08/07/remixed-art-history-with-stable-diffusion.html</loc>
    <lastmod>2022-08-07T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>/2022/08/31/training-atari-agents-faster.html</loc>
    <lastmod>2022-08-31T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>/2023/01/20/replicating-growing-cosine-unit.html</loc>
    <lastmod>2023-01-20T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>/2023/05/10/quickly-finetune-transformers.html</loc>
    <lastmod>2023-05-10T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>/2023/07/01/attention-mechanism.html</loc>
    <lastmod>2023-07-01T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>/2023/07/28/rest-of-the-transformer.html</loc>
    <lastmod>2023-07-28T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>/2023/08/16/flash-attention-compile.html</loc>
    <lastmod>2023-08-16T00:00:00+00:00</lastmod>
  </url>

  <!-- Top-level pages; these entries carry no lastmod. -->
  <url>
    <loc>/about.html</loc>
  </url>
  <url>
    <loc>/</loc>
  </url>
  <url>
    <loc>/papers.html</loc>
  </url>
  <url>
    <loc>/projects.html</loc>
  </url>

  <!-- Paginated pages under /all/ and /posts/; these entries carry no lastmod. -->
  <url>
    <loc>/all/all.html</loc>
  </url>
  <url>
    <loc>/all/page/2/all.html</loc>
  </url>
  <url>
    <loc>/all/page/3/all.html</loc>
  </url>
  <url>
    <loc>/all/page/4/all.html</loc>
  </url>
  <url>
    <loc>/posts/posts.html</loc>
  </url>
  <url>
    <loc>/posts/page/2/posts.html</loc>
  </url>
  <url>
    <loc>/posts/page/3/posts.html</loc>
  </url>
</urlset>
