<!-- CINXE.COM | Replicate - Blog -->
<!DOCTYPE html>
<html lang="en" class="">
<head>
  <meta charset="utf-8">
  <meta name="viewport" content="width=device-width, initial-scale=1">
  <title>Replicate - Blog</title>
  <meta name="description" content="Follow Replicate’s blog for product updates and feature announcements.">
  <!-- Open Graph metadata is keyed by the `property` attribute rather than `name`. -->
  <meta property="og:description" content="Follow Replicate’s blog for product updates and feature announcements.">
  <meta name="color-scheme" content="dark light">
  <!--
    Theme bootstrap. Inline classic script, so it executes while <head> is being parsed.
    It applies a 'light' or 'dark' theme to <html> (via data-theme when that attribute is
    present, otherwise via a class) and reorders the color-scheme meta content to match.
  -->
  <script>
    (() => {
      // 'light' only when the light-scheme media query matches; every other case is 'dark'.
      const theme = window.matchMedia("(prefers-color-scheme: light)").matches ? 'light' : 'dark';
      const cl = document.documentElement.classList;
      const dataAttr = document.documentElement.dataset.theme;
      if (dataAttr != null) {
        // <html> has a data-theme attribute: overwrite it unless it is already 'light' or 'dark'.
        const themeAlreadyApplied = dataAttr === 'light' || dataAttr === 'dark';
        if (!themeAlreadyApplied) {
          document.documentElement.dataset.theme = theme;
        }
      } else {
        // No data-theme attribute: use a 'light' / 'dark' class on <html> instead.
        const themeAlreadyApplied = cl.contains('light') || cl.contains('dark');
        if (!themeAlreadyApplied) {
          cl.add(theme);
        }
      }
      // Put the detected scheme first in the color-scheme meta tag, if that tag exists.
      const meta = document.querySelector('meta[name=color-scheme]');
      if (meta) {
        if (theme === 'dark') {
          meta.content = 'dark light';
        } else if (theme === 'light') {
          meta.content = 'light dark';
        }
      }
    })();
  </script>
  <link rel="stylesheet" href="/frontend-assets/glyph-loader-DeE7NgvF.css">
  <link rel="stylesheet" href="/frontend-assets/index-BBxItpE1.css">
  <link rel="stylesheet" href="/frontend-assets/nprogress-IQvgPhqq.css">
  <link rel="icon"
href="data:image/svg+xml,%3c?xml%20version='1.0'%20encoding='utf-8'?%3e%3csvg%20version='1.1'%20xmlns='http://www.w3.org/2000/svg'%20viewBox='0%200%20512%20512'%3e%3cstyle%3e%20polygon%20{%20fill:%20black;%20}%20@media%20(prefers-color-scheme:%20dark)%20{%20polygon%20{%20fill:%20white;%20}%20}%20%3c/style%3e%3cg%3e%3cpolygon%20points='512,218.9%20512,276.8%20308.9,276.8%20308.9,512%20244.2,512%20244.2,218.9'%20/%3e%3cpolygon%20points='512,109.5%20512,167.5%20186.8,167.5%20186.8,512%20122.1,512%20122.1,109.5'%20/%3e%3cpolygon%20points='512,0%20512,57.9%2064.7,57.9%2064.7,512%200,512%200,0'%20/%3e%3c/g%3e%3c/svg%3e" type="image/svg+xml">
</head>
<body>
  <!-- Site header: logo link, primary navigation and the "Menu" button. -->
  <header class="bg-white/80 dark:bg-r8-gray-a1 top-0 left-0 right-0 z-50 relative backdrop-blur-md md:fixed">
    <div class="h-[var(--header-height)] border-b border-r8-gray-6 dark:border-white/10 flex items-center">
      <div class="max-w-screen-2xl px-6 lg:px-16 w-full mx-auto flex items-center justify-between">
        <div class="flex items-center gap-2">
          <!-- The SVG <title> is the only text inside this link, so it provides the link's accessible name. -->
          <a href="https://replicate.com" class="text-black dark:text-white size-8 inline-flex items-center justify-center focus:bg-black focus:text-white dark:focus:bg-white text-r8-sm focus:outline-black dark:focus:outline-white dark:focus:text-black outline-offset-0 focus:outline outline-8"><div class="size-8"><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 0,0"></polygon></g></svg></div></a>
        </div>
        <!-- Labelled so the landmark is identifiable when several <nav> elements exist on the page. -->
        <nav class="hidden md:flex items-center gap-4" aria-label="Primary">
          <a class="link-focus group text-r8-gray-11 hover:text-r8-gray-12" href="https://replicate.com/explore">Explore</a>
          <a class="link-focus group text-r8-gray-11 hover:text-r8-gray-12" href="https://replicate.com/playground">Playground<span class="text-r8-xs ml-2 text-r8-green-a10 border border-r8-green-a10 rounded-full px-2 py-0.5 text-xs group-focus:text-r8-gray-1 group-focus:border-r8-gray-1 group-focus:bg-r8-gray-12 group-hover:bg-r8-green-10 group-hover:border-r8-green-1 group-hover:text-r8-green-1">Beta</span></a>
          <a class="link-focus group text-r8-gray-11 hover:text-r8-gray-12" href="https://replicate.com/pricing">Pricing</a>
          <a data-discover="true" class="link-focus group text-r8-gray-11 hover:text-r8-gray-12" href="/docs">Docs</a>
          <a data-discover="true" aria-current="page" class="link-focus group text-r8-gray-12 underline underline-offset-4" href="/blog">Blog</a>
          <a data-discover="true" class="link-focus group text-r8-gray-11 hover:text-r8-gray-12" href="/changelog">Changelog</a>
          <a class="link-focus group text-r8-gray-11 hover:text-r8-gray-12" href="https://replicate.com/signin">Sign in</a>
          <a class="link-focus group link-primary" href="https://replicate.com/signin?next=/docs">Get started</a>
        </nav>
        <div class="md:hidden">
          <!-- Explicit type: a bare <button> defaults to "submit". The icon is decorative next to the "Menu" text. -->
          <button type="button" aria-expanded="false" class="r8-btn r8-btn--outlined r8-btn--primary r8-btn--sm"><span class="r8-btn__icon"><svg aria-hidden="true" xmlns="http://www.w3.org/2000/svg" width="1em" height="1em" fill="currentColor" viewBox="0 0 256 256"><path d="M228,128a12,12,0,0,1-12,12H40a12,12,0,0,1,0-24H216A12,12,0,0,1,228,128ZM40,76H216a12,12,0,0,0,0-24H40a12,12,0,0,0,0,24ZM216,180H40a12,12,0,0,0,0,24H216a12,12,0,0,0,0-24Z"></path></svg></span>Menu</button>
        </div>
      </div>
    </div>
  </header>
  <!--
    Navigation panel that is delivered hidden (hidden attribute plus inline display:none).
    NOTE(review): presumably revealed by the "Menu" button above; the script that toggles it
    is not part of this markup, so confirm before wiring aria-controls to this id.
  -->
  <div id=":R4j5:" hidden class="md:hidden" style="display:none">
    <div class="bg-white dark:bg-r8-gray-1 border-b border-r8-gray-6">
      <div class="max-w-screen-2xl px-6 lg:px-16 mx-auto">
        <nav class="flex flex-col gap-3 py-4" aria-label="Primary">
          <a class="link-focus group text-r8-gray-11 hover:text-r8-gray-12" href="https://replicate.com/explore">Explore</a>
          <a class="link-focus group text-r8-gray-11 hover:text-r8-gray-12" href="https://replicate.com/playground">Playground<span class="text-r8-xs ml-2 text-r8-green-a10 border border-r8-green-a10 rounded-full px-2 py-0.5 text-xs group-focus:text-r8-gray-1 group-focus:border-r8-gray-1 group-focus:bg-r8-gray-12 group-hover:bg-r8-green-10 group-hover:border-r8-green-1 group-hover:text-r8-green-1">Beta</span></a>
          <a class="link-focus group text-r8-gray-11 hover:text-r8-gray-12" href="https://replicate.com/pricing">Pricing</a>
          <a data-discover="true" class="link-focus group text-r8-gray-11 hover:text-r8-gray-12" href="/docs">Docs</a>
          <a data-discover="true" aria-current="page" class="link-focus group text-r8-gray-12 underline underline-offset-4" href="/blog">Blog</a>
          <a data-discover="true" class="link-focus group text-r8-gray-11 hover:text-r8-gray-12" href="/changelog">Changelog</a>
          <a class="link-focus group text-r8-gray-11 hover:text-r8-gray-12" href="https://replicate.com/signin">Sign in</a>
          <a class="link-focus group link-primary" href="https://replicate.com/signin?next=/docs">Get started</a>
        </nav>
      </div>
    </div>
  </div>
  <!-- Page content: "Blog" heading with feed links, followed by the list of posts. -->
  <div class="container px-6 md:pt-[var(--header-height)] min-h-[calc(100dvh-var(--header-height))]">
    <div class="max-w-screen-xl py-8">
      <div class="max-w-3xl">
        <div>
          <div>
            <div class="mb-4 flex items-center gap-8">
              <h1 class="text-r8-4xl tracking-tight text-balance leading-tight font-heading font-semibold">Blog</h1>
              <div class="flex items-center gap-2">
                <a href="/blog/rss" class="r8-btn r8-btn--outlined r8-btn--primary r8-btn--sm"><span class="r8-btn__icon"><svg xmlns="http://www.w3.org/2000/svg" width="1em" height="1em" fill="currentColor" viewBox="0 0 256 256"><path
d="M106.91,149.09A71.53,71.53,0,0,1,128,200a8,8,0,0,1-16,0,56,56,0,0,0-56-56,8,8,0,0,1,0-16A71.53,71.53,0,0,1,106.91,149.09ZM56,80a8,8,0,0,0,0,16A104,104,0,0,1,160,200a8,8,0,0,0,16,0A120,120,0,0,0,56,80Zm118.79,1.21A166.9,166.9,0,0,0,56,32a8,8,0,0,0,0,16A151,151,0,0,1,163.48,92.52,151,151,0,0,1,208,200a8,8,0,0,0,16,0A166.9,166.9,0,0,0,174.79,81.21ZM60,184a12,12,0,1,0,12,12A12,12,0,0,0,60,184Z"></path></svg></span>RSS</a><a href="/blog/atom" class="r8-btn r8-btn--outlined r8-btn--primary r8-btn--sm"><span class="r8-btn__icon"><svg xmlns="http://www.w3.org/2000/svg" width="1em" height="1em" fill="currentColor" viewBox="0 0 256 256"><path d="M196.12,128c24.65-34.61,37.22-70.38,19.74-87.86S162.61,35.23,128,59.88C93.39,35.23,57.62,22.66,40.14,40.14S35.23,93.39,59.88,128c-24.65,34.61-37.22,70.38-19.74,87.86h0c5.63,5.63,13.15,8.14,21.91,8.14,18.48,0,42.48-11.17,66-27.88C151.47,212.83,175.47,224,194,224c8.76,0,16.29-2.52,21.91-8.14h0C233.34,198.38,220.77,162.61,196.12,128Zm8.43-76.55c7.64,7.64,2.48,32.4-18.52,63.28a300.33,300.33,0,0,0-21.19-23.57A300.33,300.33,0,0,0,141.27,70C172.15,49,196.91,43.8,204.55,51.45ZM176.29,128a289.14,289.14,0,0,1-22.76,25.53A289.14,289.14,0,0,1,128,176.29a289.14,289.14,0,0,1-25.53-22.76A289.14,289.14,0,0,1,79.71,128,298.62,298.62,0,0,1,128,79.71a289.14,289.14,0,0,1,25.53,22.76A289.14,289.14,0,0,1,176.29,128ZM51.45,51.45c2.2-2.21,5.83-3.35,10.62-3.35C73.89,48.1,92.76,55,114.72,70A304,304,0,0,0,91.16,91.16,300.33,300.33,0,0,0,70,114.73C49,83.85,43.81,59.09,51.45,51.45Zm0,153.1C43.81,196.91,49,172.15,70,141.27a300.33,300.33,0,0,0,21.19,23.57A304.18,304.18,0,0,0,114.73,186C83.85,207,59.09,212.2,51.45,204.55Zm153.1,0c-7.64,7.65-32.4,2.48-63.28-18.52a304.18,304.18,0,0,0,23.57-21.19A300.33,300.33,0,0,0,186,141.27C207,172.15,212.19,196.91,204.55,204.55ZM140,128a12,12,0,1,1-12-12A12,12,0,0,1,140,128Z"></path></svg></span>Atom</a></div></div><ol class="divide-y divide-r8-gray-6"><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" 
data-discover="true" href="/blog/fast-flux-fine-tunes"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/fast-flux-fine-tunes/out-0-11.webp" alt="FLUX fine-tunes are now fast"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">FLUX fine-tunes are now fast</h2><p class="text-r8-gray-11 max-w-xl">We've made running fine-tunes on Replicate much faster, and the optimizations are open-source.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>November 26, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/flux-tools"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/flux-tools/cover.png" alt="FLUX.1 Tools – Control and steerability for FLUX"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">FLUX.1 Tools – Control and steerability for FLUX</h2><p class="text-r8-gray-11 max-w-xl">A new set of image generation capabilities for FLUX models, including inpainting, outpainting, canny edge detection, and depth maps.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>November 21, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/nvidia-l40s-gpus-are-here"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/nvidia-l40s-gpus-are-here/cover.png" alt="NVIDIA L40S GPUs are 
here"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">NVIDIA L40S GPUs are here</h2><p class="text-r8-gray-11 max-w-xl">NVIDIA L40S GPUs are here, with better performance and lower cost.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>November 15, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/data-urls-in-our-sync-api"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div class="h-full flex items-center justify-center"><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8 undefined" preserveAspectRatio="none"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">We messed up: data URLs in our sync API</h2><p class="text-r8-gray-11 max-w-xl">We've decided to stop returning data URLs in sync API outputs based on feedback from users. 
We're going to take a few steps back and figure out the best way to get your model output as fast as possible.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>October 31, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/ideogram-v2-inpainting"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/ideogram-v2-inpainting/cover.png" alt="Ideogram v2 is an outstanding new inpainting model"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Ideogram v2 is an outstanding new inpainting model</h2><p class="text-r8-gray-11 max-w-xl">We've partnered with Ideogram to bring their inpainting model to Replicate's API.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>October 22, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/stable-diffusion-3-5-is-here"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/stable-diffusion-3-5-is-here/cover.webp" alt="Stable Diffusion 3.5 is here"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Stable Diffusion 3.5 is here</h2><p class="text-r8-gray-11 max-w-xl">Stability AI's latest text-to-image model is now available on Replicate and you can run it with an API.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>October 22, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col 
sm:flex-row gap-4 group" data-discover="true" href="/blog/flux-is-fast-and-open-source"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/flux-is-fast/cover.png" alt="FLUX is fast and it's open source"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">FLUX is fast and it's open source</h2><p class="text-r8-gray-11 max-w-xl">FLUX is now much faster on Replicate, and we’ve made our optimizations open-source so you can see exactly how they work and build upon them.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>October 10, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/flux-1-1-pro-is-here"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/flux-1-1-pro-is-here/cover.webp" alt="FLUX1.1 [pro] is here"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">FLUX1.1 [pro] is here</h2><p class="text-r8-gray-11 max-w-xl">Black Forest Labs continue to push boundaries with their latest release of FLUX.1 image generation model.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>October 3, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/using-synthetic-data-to-improve-flux-finetunes"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" 
src="/assets/blog/using-synthetic-data-to-improve-flux-finetunes/cover.jpg" alt="Using synthetic training data to improve Flux finetunes"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Using synthetic training data to improve Flux finetunes</h2><p class="text-r8-gray-11 max-w-xl">It's easy to fine-tune Flux, but sometimes you need to do a little more work to get the best results. This post covers techniques you can use to improve your fine-tuned Flux models.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>September 20, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/fine-tune-flux-with-an-api"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/fine-tune-flux-with-an-api/cover.jpg" alt="Fine-tune FLUX.1 with an API"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Fine-tune FLUX.1 with an API</h2><p class="text-r8-gray-11 max-w-xl">Create and run your own fine-tuned Flux models programmatically using Replicate's HTTP API.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>September 9, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/fine-tune-flux-with-faces"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/fine-tune-flux-with-faces/cover.jpg" alt="Fine-tune FLUX.1 to create images of yourself"/></div></div><div class="flex-1 min-w-0"><div 
class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Fine-tune FLUX.1 to create images of yourself</h2><p class="text-r8-gray-11 max-w-xl">Create your own fine-tuned Flux model to generate new images of yourself.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>August 30, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/replicate-intelligence-2024-08-23"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div class="h-full flex items-center justify-center"><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8 undefined" preserveAspectRatio="none"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Replicate Intelligence #12</h2><p class="text-r8-gray-11 max-w-xl">Flux LoRAs, Hot Zuck, and Replicate on Lex Fridman</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>August 23, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/replicate-intelligence-2024-08-16"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div class="h-full flex items-center justify-center"><svg version="1.1" 
xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8 undefined" preserveAspectRatio="none"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Replicate Intelligence #11</h2><p class="text-r8-gray-11 max-w-xl">Fine tune FLUX.1, generative video games, a vision for the metaverse</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>August 16, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/fine-tune-flux"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/fine-tune-flux/cover.jpg" alt="Fine-tune FLUX.1 with your own images"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Fine-tune FLUX.1 with your own images</h2><p class="text-r8-gray-11 max-w-xl">We've added fine-tuning (LoRA) support to FLUX.1 image generation models. 
You can train FLUX.1 on your own images with one line of code using Replicate's API.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>August 15, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/replicate-intelligence-2024-08-09"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div class="h-full flex items-center justify-center"><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8 undefined" preserveAspectRatio="none"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Replicate Intelligence #10</h2><p class="text-r8-gray-11 max-w-xl">Flux developments, Minecraft bot, Streamlit cookbook with Zeke</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>August 9, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/flux-first-impressions"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/flux-first-impressions/library.webp" alt="FLUX.1: First Impressions"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 
group-hover:underline">FLUX.1: First Impressions</h2><p class="text-r8-gray-11 max-w-xl">We explore FLUX.1's unique strengths and aesthetics to see what we can generate.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>August 2, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/replicate-intelligence-2024-08-02"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div class="h-full flex items-center justify-center"><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8 undefined" preserveAspectRatio="none"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Replicate Intelligence #9</h2><p class="text-r8-gray-11 max-w-xl">Open source frontier image model, cut objects from videos, new Python web framework from Jeremy Howard</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>August 2, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/flux-state-of-the-art-image-generation"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/flux/cover.jpg" alt="Run FLUX with an API"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between 
h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Run FLUX with an API</h2><p class="text-r8-gray-11 max-w-xl">FLUX.1 is a new text-to-image model from Black Forest Labs, the creators of Stable Diffusion, that exceeds the capabilities of previous open-source models.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>August 1, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/replicate-intelligence-2024-07-26"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div class="h-full flex items-center justify-center"><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8 undefined" preserveAspectRatio="none"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Replicate Intelligence #8</h2><p class="text-r8-gray-11 max-w-xl">A top-tier open-ish language model, new safety classifiers, model search API</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>July 26, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/run-llama-3-1-with-an-api"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" 
src="/assets/blog/llama-3-api/meta.png" alt="Run Meta Llama 3.1 405B with an API"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Run Meta Llama 3.1 405B with an API</h2><p class="text-r8-gray-11 max-w-xl">Llama 3.1 405B is the most powerful open-source language model from Meta. Learn how to run it in the cloud with one line of code.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>July 23, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/replicate-intelligence-2024-07-12"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div class="h-full flex items-center justify-center"><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8 undefined" preserveAspectRatio="none"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Replicate Intelligence #7</h2><p class="text-r8-gray-11 max-w-xl">Data curation, data generation, data data data</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>July 12, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" 
href="/blog/replicate-intelligence-2024-06-28"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div class="h-full flex items-center justify-center"><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8 undefined" preserveAspectRatio="none"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Replicate Intelligence #6</h2><p class="text-r8-gray-11 max-w-xl">Google's Gemma2 models, language model leaderboard, tips for Stable Diffusion 3</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>June 28, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/replicate-intelligence-2024-06-21"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div class="h-full flex items-center justify-center"><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8 undefined" preserveAspectRatio="none"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 
0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Replicate Intelligence #5</h2><p class="text-r8-gray-11 max-w-xl">Really good coding model, AI search breakthroughs, Discord support bot</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>June 21, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/get-the-best-from-stable-diffusion-3"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/get-the-best-from-stable-diffusion-3/get-the-best-from-stable-diffusion-3.webp" alt="How to get the best results from Stable Diffusion 3"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">How to get the best results from Stable Diffusion 3</h2><p class="text-r8-gray-11 max-w-xl">We show you how to use Stable Diffusion 3 to get the best images, including new techniques for prompting.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>June 18, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/run-stable-diffusion-3-on-apple-silicon-mac"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/sd3-mac-mps/cover.webp" alt="Run Stable Diffusion 3 on your Apple Silicon Mac"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold 
mb-0.5 group-hover:underline">Run Stable Diffusion 3 on your Apple Silicon Mac</h2><p class="text-r8-gray-11 max-w-xl">A step-by-step guide to generating images with Stable Diffusion 3 on your M-series Mac using MPS acceleration.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>June 18, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/push-a-custom-sd3"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/push-a-custom-sd3/push-a-custom-sd3.webp" alt="Push a custom version of Stable Diffusion 3"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Push a custom version of Stable Diffusion 3</h2><p class="text-r8-gray-11 max-w-xl">Create your own custom version of Stability's latest image generation model and run it on Replicate via the web or API.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>June 14, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/replicate-intelligence-2024-06-14"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div class="h-full flex items-center justify-center"><!-- Logo shown in place of a cover image; decorative, so hidden from assistive tech --><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8" preserveAspectRatio="none" aria-hidden="true"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 
0,1000 0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Replicate Intelligence #4</h2><p class="text-r8-gray-11 max-w-xl">Find concepts in GPT models, real-time speech to text in the browser, H100s are coming</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>June 14, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/run-sd3-on-comfyui"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/sd3-comfyui-steps/comfyui-sd3.webp" alt="Run Stable Diffusion 3 on your own machine with ComfyUI"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Run Stable Diffusion 3 on your own machine with ComfyUI</h2><p class="text-r8-gray-11 max-w-xl">Copy and paste a few commands into terminal to play with Stable Diffusion 3 on your own GPU-powered machine.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>June 14, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/h100s-are-coming"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/h100s-are-coming/h100s-are-coming.webp" alt="H100s are coming to Replicate"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">H100s are coming to 
Replicate</h2><p class="text-r8-gray-11 max-w-xl">We'll soon support NVIDIA's H100 GPUs for predictions and training. Let us know if you want early access.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>June 12, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/run-stable-diffusion-3-with-an-api"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/stable-diffusion-3-api/stability-ai.webp" alt="Run Stable Diffusion 3 with an API"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Run Stable Diffusion 3 with an API</h2><p class="text-r8-gray-11 max-w-xl">Stable Diffusion 3 is the latest text-to-image model from Stability, with improved image quality, typography, prompt understanding, and resource efficiency. 
Learn how to run it in the cloud with one line of code.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>June 12, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/replicate-intelligence-2024-06-07"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div class="h-full flex items-center justify-center"><!-- Logo shown in place of a cover image; decorative, so hidden from assistive tech --><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8" preserveAspectRatio="none" aria-hidden="true"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Replicate Intelligence #3</h2><p class="text-r8-gray-11 max-w-xl">Garden State Llama, applied LLMs guide, real-time image generation</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>June 7, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/replicate-intelligence-2024-05-31"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div class="h-full flex items-center justify-center"><!-- Logo shown in place of a cover image; decorative, so hidden from assistive tech --><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8" preserveAspectRatio="none" aria-hidden="true"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 
603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Replicate Intelligence #2</h2><p class="text-r8-gray-11 max-w-xl">Faster image generation, AI-powered world simulator, insights on AI dataset complexity</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>May 31, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/replicate-intelligence-2024-05-24"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div class="h-full flex items-center justify-center"><!-- Logo shown in place of a cover image; decorative, so hidden from assistive tech --><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8" preserveAspectRatio="none" aria-hidden="true"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Replicate Intelligence #1</h2><p class="text-r8-gray-11 max-w-xl">DIY Llama 3 implementation, open-source smart glasses, steering language models with dictionary learning</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>May 24, 
2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/shared-network-vulnerability-disclosure"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div class="h-full flex items-center justify-center"><!-- Logo shown in place of a cover image; decorative, so hidden from assistive tech --><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8" preserveAspectRatio="none" aria-hidden="true"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Shared network vulnerability disclosure</h2><p class="text-r8-gray-11 max-w-xl"></p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>May 23, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/run-arctic-with-an-api"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/arctic-api/snowflake_arctic.png" alt="Run Snowflake Arctic with an API"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Run Snowflake Arctic with an API</h2><p class="text-r8-gray-11 max-w-xl">Arctic is a new open-source language model from Snowflake. 
Learn how to run it in the cloud with one line of code.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>April 23, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/run-llama-3-with-an-api"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/llama-3-api/meta.png" alt="Run Meta Llama 3 with an API"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Run Meta Llama 3 with an API</h2><p class="text-r8-gray-11 max-w-xl">Llama 3 is the latest language model from Meta. Learn how to run it in the cloud with one line of code.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>April 18, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/run-codellama-with-an-api"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/codellama/codellama.png" alt="Run Code Llama 70B with an API"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Run Code Llama 70B with an API</h2><p class="text-r8-gray-11 max-w-xl">Code Llama 70B is one of the most powerful open-source code generation models. 
Learn how to run it in the cloud with one line of code.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>January 30, 2024</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/how-to-create-an-ai-narrator"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/ai-narrator/2023-12-01_at_11.58.52.png" alt="How to create an AI narrator for your life"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">How to create an AI narrator for your life</h2><p class="text-r8-gray-11 max-w-xl">Or, how I met a virtual David Attenborough.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>December 6, 2023</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/how-to-tune-a-realistic-voice-clone"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/how-to-tune-a-realistic-voice-clone/rvc.jpg" alt="Clone your voice using open-source models"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Clone your voice using open-source models</h2><p class="text-r8-gray-11 max-w-xl">We’ve added fine-tuning for realistic voice cloning (RVC). 
You can train RVC on your own dataset from a YouTube video with a few lines of code using Replicate's API.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>December 6, 2023</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/series-b"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/series-b/goo-logo.jpg" alt="Businesses are building on open-source AI"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Businesses are building on open-source AI</h2><p class="text-r8-gray-11 max-w-xl">We've raised a $40 million Series B led by a16z.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>December 5, 2023</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/run-yi-chat-with-api"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/run-yi-chat-with-api/Yi.svg" alt="How to run Yi chat models with an API"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">How to run Yi chat models with an API</h2><p class="text-r8-gray-11 max-w-xl">The Yi series models are large language models trained from scratch by developers at 01.AI. 
Learn how to run them in the cloud with one line of code.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>November 23, 2023</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/replicate-scaffold"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/ready-set-scaffold/scaffold-llama.jpg" alt="Scaffold Replicate apps with one command"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Scaffold Replicate apps with one command</h2><p class="text-r8-gray-11 max-w-xl">We've added a CLI command that makes it easy to get started with Replicate.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>November 22, 2023</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/run-bge-embedding-models"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/run-bge-embedding-models/cover.jpg" alt="Using open-source models for faster and cheaper text embeddings"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Using open-source models for faster and cheaper text embeddings</h2><p class="text-r8-gray-11 max-w-xl">An interactive example showing how to embed text using a state-of-the-art embedding model that beats OpenAI's embeddings API on price and performance.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>November 10, 2023</span></div></div></div></a></li><li 
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/generate-music-from-chord-progressions-musicgen-chord"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/generate-music-from-chord-progressions-musicgen-chord/cover.png" alt="Generate music from chord progressions and text prompts with MusicGen-Chord"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Generate music from chord progressions and text prompts with MusicGen-Chord</h2><p class="text-r8-gray-11 max-w-xl">We’ve added chord conditioning to Meta’s MusicGen model, so you can create automatic backing tracks in any style using text prompts and chord progressions.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>November 8, 2023</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/run-latent-consistency-model-on-mac"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/run-latent-consistency-model-on-mac/cover.webp" alt="Generate images in one second on your Mac using a latent consistency model"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Generate images in one second on your Mac using a latent consistency model</h2><p class="text-r8-gray-11 max-w-xl">How to run a latent consistency model on your M1 or M2 Mac</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>October 25, 2023</span></div></div></div></a></li><li class="py-12"><a class="flex 
flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/how-to-use-rag-with-chromadb-and-mistral-7b-instruct"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/how-to-use-rag-with-chromadb-and-mistral-7b-instruct/rag-cover-image.webp" alt="How to use retrieval augmented generation with ChromaDB and Mistral"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">How to use retrieval augmented generation with ChromaDB and Mistral</h2><p class="text-r8-gray-11 max-w-xl">In this post we'll explore the basics of retrieval augmented generation by creating an example app that uses bge-large-en for embeddings, ChromaDB for vector store, and mistral-7b-instruct for language model generation.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>October 17, 2023</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/fine-tune-musicgen"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/fine-tune-musicgen/fine-tune-musicgen.webp" alt="Fine-tune MusicGen to generate music in any style"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Fine-tune MusicGen to generate music in any style</h2><p class="text-r8-gray-11 max-w-xl">We’ve added fine-tuning support to MusicGen. 
You can train the small, medium and melody models on your own audio files using Replicate.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>October 13, 2023</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/llama-2-grammars"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/llama-2-grammars/llama2-grammar.webp" alt="Jet-setting with Llama 2 + Grammars"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Jet-setting with Llama 2 + Grammars</h2><p class="text-r8-gray-11 max-w-xl">How to use Llama 2 models with grammars for information extraction tasks.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>October 9, 2023</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/run-mistral-7b-with-api"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/demystifying-mistral-7b/mistral_box.jpeg" alt="How to run Mistral 7B with an API"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">How to run Mistral 7B with an API</h2><p class="text-r8-gray-11 max-w-xl">Mistral 7B is an open-source large language model. 
Learn what it's good at and how to run it in the cloud with one line of code.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>October 6, 2023</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/animatediff-interpolator"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/animatediff-interpolator/animatediff.webp" alt="Make smooth AI generated videos with AnimateDiff and an interpolator"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Make smooth AI generated videos with AnimateDiff and an interpolator</h2><p class="text-r8-gray-11 max-w-xl">Combine AnimateDiff and the ST-MFNet frame interpolator to create smooth and realistic videos from a text prompt</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>October 4, 2023</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/fine-tune-cold-boots"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/fine-tune-cold-boots/fast-llamas.webp" alt="Fine-tuned models now boot in less than one second"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Fine-tuned models now boot in less than one second</h2><p class="text-r8-gray-11 max-w-xl">We've made some dramatic improvements to cold boots for fine-tuned models.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>September 6, 
2023</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/painting-with-words-a-history-of-text-to-image-ai"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/painting-with-words-a-history-of-text-to-image-ai/sketch_of_internet_is_a_series_of_tubes_by_Leonardo_da_Vinci.png" alt="Painting with words: a history of text-to-image AI"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Painting with words: a history of text-to-image AI</h2><p class="text-r8-gray-11 max-w-xl">With the recent release of Stable Diffusion XL fine-tuning on Replicate, and today being the 1-year anniversary of Stable Diffusion, now feels like the perfect opportunity to take a step back and reflect on how text-to-image AI has improved over the last few years.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>August 22, 2023</span></div></div></div></a></li><li class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/cutting-prices-in-half"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/cutting-prices-in-half/out-3-1.png" alt="We're cutting our prices in half"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">We're cutting our prices in half</h2><p class="text-r8-gray-11 max-w-xl">The price of public models is being cut in half, and soon we'll start charging new users for setup and idle time on private models.</p></div><div class="pt-4 flex items-center 
gap-2 text-r8-gray-10"><span>August 16, 2023</span></div></div></div></a></li><!-- Archive cards: one per post, each a single link wrapping thumbnail, title, intro and date. These entries sit deep in the list, so every thumbnail opts into native lazy loading and async decoding. Lines are wrapped inside the li start tag so no whitespace text nodes are added between list items. --><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/how-to-prompt-llama"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/prompt-llama/llama-typing.png" alt="A guide to prompting Llama 2" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">A guide to prompting Llama 2</h2><p class="text-r8-gray-11 max-w-xl">Learn the art of the Llama prompt.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>August 14, 2023</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/streaming"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/streaming/streaming.jpg" alt="Streaming output for language models" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Streaming output for language models</h2><p class="text-r8-gray-11 max-w-xl">Our API now supports server-sent event streams for language models. Learn how to use them to make your apps more responsive.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>August 14, 2023</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/fine-tune-sdxl"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/fine-tune-sdxl/out-3-8.png" alt="Fine-tune SDXL with your own images" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Fine-tune SDXL with your own images</h2><p class="text-r8-gray-11 max-w-xl">We’ve added fine-tuning (Dreambooth, Textual Inversion and LoRA) support to SDXL 1.0. You can train SDXL on your own images with one line of code using the Replicate API.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>August 8, 2023</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/run-llama-2-with-an-api"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/llama-api/llama-clouds.png" alt="Run Llama 2 with an API" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Run Llama 2 with an API</h2><p class="text-r8-gray-11 max-w-xl">Llama 2 is the first open source language model of the same caliber as OpenAI’s models. Learn how to run it in the cloud with one line of code.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>July 27, 2023</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/run-sdxl-with-an-api"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/run-sdxl-with-an-api/astronaut-riding-unicorn.webp" alt="Run SDXL with an API" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Run SDXL with an API</h2><p class="text-r8-gray-11 max-w-xl">How to run Stable Diffusion XL 1.0 using the Replicate API</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>July 26, 2023</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/run-llama-locally"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/run-llama-locally/llama-captain.jpg" alt="A comprehensive guide to running Llama 2 locally" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">A comprehensive guide to running Llama 2 locally</h2><p class="text-r8-gray-11 max-w-xl">How to run Llama 2 on Mac, Linux, Windows, and your phone.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>July 22, 2023</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/fine-tune-llama-2"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/fine-tune-llama-2/llama-salon.png" alt="Fine-tune Llama 2 on Replicate" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Fine-tune Llama 2 on Replicate</h2><p class="text-r8-gray-11 max-w-xl">So you want to train a llama...</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>July 20, 2023</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/llama-2-roundup"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/llama-2-roundup/llama2.jpg" alt="What happened with Llama 2 in the last 24 hours? 🦙" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">What happened with Llama 2 in the last 24 hours? 🦙</h2><p class="text-r8-gray-11 max-w-xl">A roundup of recent developments from the llamaverse following the second major release of Meta's open-source large language model.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>July 19, 2023</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/turn-your-llm-into-a-poet"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/poet/poet.jpg" alt="Make any large language model a better poet" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Make any large language model a better poet</h2><p class="text-r8-gray-11 max-w-xl">Prompt engineering and training are often the first solutions we reach for to improve language model behavior, but they're not the only way.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>May 26, 2023</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/new-status-page"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/status-page/nines.jpg" alt="Status page" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Status page</h2><p class="text-r8-gray-11 max-w-xl">We've added a status page to provide real-time updates on the health of Replicate.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>May 18, 2023</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/language-model-roundup"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/language-model-roundup/language-model-roundup.jpg" alt="Language model roundup, April 2023" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Language model roundup, April 2023</h2><p class="text-r8-gray-11 max-w-xl">A roundup of recent developments from the world of open-source language models.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>April 21, 2023</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/autocog"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/autocog/autocog.png" alt="AutoCog — Generate Cog configuration with GPT-4" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">AutoCog — Generate Cog configuration with GPT-4</h2><p class="text-r8-gray-11 max-w-xl">Give it a machine learning directory and AutoCog will create predict.py and cog.yaml until it successfully runs a prediction</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>April 19, 2023</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/language-models"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/language-models/out-2.png" alt="Language models are on Replicate" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Language models are on Replicate</h2><p class="text-r8-gray-11 max-w-xl"></p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>April 5, 2023</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/fine-tune-alpaca-with-lora"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/fine-tune-alpaca-with-lora/alpaca-lora.jpg" alt="How to use Alpaca-LoRA to fine-tune a model like ChatGPT" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">How to use Alpaca-LoRA to fine-tune a model like ChatGPT</h2><p class="text-r8-gray-11 max-w-xl"></p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>March 23, 2023</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/llama-roundup"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/llama-roundup/llama-astronaut.jpg" alt="Week 3 of LLaMA 🦙" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Week 3 of LLaMA 🦙</h2><p class="text-r8-gray-11 max-w-xl">A roundup of recent developments from the llamaverse.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>March 18, 2023</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/fine-tune-llama-to-speak-like-homer-simpson"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/homer/robot-homer.webp" alt="Fine-tune LLaMA to speak like Homer Simpson" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Fine-tune LLaMA to speak like Homer Simpson</h2><p class="text-r8-gray-11 max-w-xl">With a small amount of data and an hour of training you can make LLaMA output text in the voice of the dataset.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>March 17, 2023</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/replicate-alpaca"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/replicate-alpaca/party-alpaca.png" alt="Train and run Stanford Alpaca on your own machine" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Train and run Stanford Alpaca on your own machine</h2><p class="text-r8-gray-11 max-w-xl">We'll show you how to train Alpaca, a fine-tuned version of LLaMA that can respond to instructions like ChatGPT.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>March 16, 2023</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/machine-learning-needs-better-tools"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/machine-learning-is-just-software/cover.png" alt="Machine learning needs better tools" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Machine learning needs better tools</h2><p class="text-r8-gray-11 max-w-xl">Lots of people want to build things with machine learning, but they don't have the expertise to use it.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>February 21, 2023</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/lora-faster-fine-tuning-of-stable-diffusion"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/lora-api/lora-api.png" alt="Introducing LoRA: A faster way to fine-tune Stable Diffusion" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Introducing LoRA: A faster way to fine-tune Stable Diffusion</h2><p class="text-r8-gray-11 max-w-xl">It's like DreamBooth, but much faster. And you can run it in the cloud on Replicate.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>February 7, 2023</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/dreambooth-api"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/dreambooth-api/Untitled.png" alt="Train and deploy a DreamBooth model on Replicate" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Train and deploy a DreamBooth model on Replicate</h2><p class="text-r8-gray-11 max-w-xl">With just a handful of images and a single API call, you can train a model, publish it to Replicate, and run predictions on it in the cloud.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>November 21, 2022</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/run-stable-diffusion-on-m1-mac"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/run-stable-diffusion-on-m1-mac/grid-0002.png" alt="Run Stable Diffusion on your M1 Mac’s GPU" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Run Stable Diffusion on your M1 Mac’s GPU</h2><p class="text-r8-gray-11 max-w-xl">How to run Stable Diffusion locally so you can hack on it</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>August 31, 2022</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/run-stable-diffusion-with-an-api"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/run-stable-diffusion-with-an-api/out-0-3.png" alt="Run Stable Diffusion with an API" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Run Stable Diffusion with an API</h2><p class="text-r8-gray-11 max-w-xl">How to use Replicate to integrate Stable Diffusion into hacks, apps, and projects</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>August 29, 2022</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/build-a-robot-artist-for-your-discord-server-with-stable-diffusion"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><img class="object-cover w-full h-full" src="/assets/blog/discord-bot/dreaming-of-rabbits.png" alt="Build a robot artist for your Discord server with Stable Diffusion, Replicate, and Fly.io" loading="lazy" decoding="async"/></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Build a robot artist for your Discord server with Stable Diffusion, Replicate, and Fly.io</h2><p class="text-r8-gray-11 max-w-xl">A tutorial for building a chat bot that replies to prompts with the output of a text-to-image model.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>August 25, 2022</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/uncanny-spaces"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div
class="h-full flex items-center justify-center"><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8" preserveAspectRatio="none" aria-hidden="true"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Join us at Uncanny Spaces</h2><p class="text-r8-gray-11 max-w-xl">We're bringing people together to explore what's being created with machine learning.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>August 11, 2022</span></div></div></div></a></li><!-- Cards in this run have no cover image and show the logo glyph as a placeholder. The glyph is decorative, so it is hidden from assistive technology and the link is named by its heading, intro and date only. --><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/grab-hundreds-of-images-with-clip-and-laion"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div class="h-full flex items-center justify-center"><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8" preserveAspectRatio="none" aria-hidden="true"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Automating image collection</h2><p class="text-r8-gray-11 max-w-xl">Using CLIP and LAION5B to collect thousands of captioned images.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>August 5, 2022</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/exploring-text-to-image-models"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div class="h-full flex items-center justify-center"><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8" preserveAspectRatio="none" aria-hidden="true"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Exploring text to image models</h2><p class="text-r8-gray-11 max-w-xl">The basics of using the API to create your own images from text.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>July 18, 2022</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/model-docs"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div class="h-full flex items-center justify-center"><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8" preserveAspectRatio="none" aria-hidden="true"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">A new template for model READMEs</h2><p class="text-r8-gray-11 max-w-xl">Inspired by model cards, we've created templates for documenting models on Replicate.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>July 5, 2022</span></div></div></div></a></li><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/constraining-clipdraw"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div class="h-full flex items-center justify-center"><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8" preserveAspectRatio="none" aria-hidden="true"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Constraining CLIPDraw</h2><p class="text-r8-gray-11 max-w-xl">An introduction to differentiable programming and the process of
refining generative art models.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>May 27, 2022</span></div></div></div></a></li><!-- Last archive card: no cover image, so the logo glyph is a decorative placeholder hidden from assistive technology. --><li
class="py-12"><a class="flex flex-col sm:flex-row gap-4 group" data-discover="true" href="/blog/hello-world"><div class="shrink-0 sm:size-32 md:size-40"><div class="aspect-square bg-r8-gray-6"><div class="h-full flex items-center justify-center"><svg version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" viewBox="0 0 1000 1000" fill="currentColor" class="w-8 h-8" preserveAspectRatio="none" aria-hidden="true"><title>Replicate logo</title><g><polygon points="1000,427.6 1000,540.6 603.4,540.6 603.4,1000 477,1000 477,427.6"></polygon><polygon points="1000,213.8 1000,327 364.8,327 364.8,1000 238.4,1000 238.4,213.8"></polygon><polygon points="1000,0 1000,113.2 126.4,113.2 126.4,1000 0,1000 0,0"></polygon></g></svg></div></div></div><div class="flex-1 min-w-0"><div class="flex flex-col justify-between h-full min-h-0"><div class="flex-1"><h2 class="text-r8-2xl text-balance font-heading font-semibold mb-0.5 group-hover:underline">Hello, world!</h2><p class="text-r8-gray-11 max-w-xl">We're a small team of engineers and machine learning enthusiasts working to make machine learning more accessible.</p></div><div class="pt-4 flex items-center gap-2 text-r8-gray-10"><span>May 16, 2022</span></div></div></div></a></li></ol></div></div></div></div></div><!-- Page footer: three icon-only buttons. Each has an explicit type and an accessible name; the icons themselves are hidden from assistive technology. NOTE(review): the labels are inferred from the laptop, sun and moon glyphs, so confirm them against the theme switcher component. --><footer class="border-t border-r8-gray-5 py-4 text-r8-sm mx-auto"><div class="container flex items-center justify-end"><div><button
class="r8-btn r8-btn--outlined r8-btn--primary r8-btn--md r8-btn--icon" type="button" aria-label="Use system theme"><span class="r8-btn__icon"><svg xmlns="http://www.w3.org/2000/svg" width="1em" height="1em" fill="currentColor" viewBox="0 0 256 256" aria-hidden="true"><path d="M232,168h-8V72a24,24,0,0,0-24-24H56A24,24,0,0,0,32,72v96H24a8,8,0,0,0-8,8v16a24,24,0,0,0,24,24H216a24,24,0,0,0,24-24V176A8,8,0,0,0,232,168ZM48,72a8,8,0,0,1,8-8H200a8,8,0,0,1,8,8v96H48ZM224,192a8,8,0,0,1-8,8H40a8,8,0,0,1-8-8v-8H224ZM152,88a8,8,0,0,1-8,8H112a8,8,0,0,1,0-16h32A8,8,0,0,1,152,88Z"></path></svg></span></button><span id=":Rjj5:" style="position:fixed" hidden=""></span><button
class="r8-btn r8-btn--clear r8-btn--primary r8-btn--md r8-btn--icon" type="button" aria-label="Use light theme"><span class="r8-btn__icon"><svg xmlns="http://www.w3.org/2000/svg" width="1em" height="1em" fill="currentColor" viewBox="0 0 256 256" aria-hidden="true"><path d="M120,40V16a8,8,0,0,1,16,0V40a8,8,0,0,1-16,0Zm72,88a64,64,0,1,1-64-64A64.07,64.07,0,0,1,192,128Zm-16,0a48,48,0,1,0-48,48A48.05,48.05,0,0,0,176,128ZM58.34,69.66A8,8,0,0,0,69.66,58.34l-16-16A8,8,0,0,0,42.34,53.66Zm0,116.68-16,16a8,8,0,0,0,11.32,11.32l16-16a8,8,0,0,0-11.32-11.32ZM192,72a8,8,0,0,0,5.66-2.34l16-16a8,8,0,0,0-11.32-11.32l-16,16A8,8,0,0,0,192,72Zm5.66,114.34a8,8,0,0,0-11.32,11.32l16,16a8,8,0,0,0,11.32-11.32ZM48,128a8,8,0,0,0-8-8H16a8,8,0,0,0,0,16H40A8,8,0,0,0,48,128Zm80,80a8,8,0,0,0-8,8v24a8,8,0,0,0,16,0V216A8,8,0,0,0,128,208Zm112-88H216a8,8,0,0,0,0,16h24a8,8,0,0,0,0-16Z"></path></svg></span></button><span id=":Rlj5:" style="position:fixed" hidden=""></span><button
class="r8-btn r8-btn--clear r8-btn--primary r8-btn--md r8-btn--icon" type="button" aria-label="Use dark theme"><span class="r8-btn__icon"><svg xmlns="http://www.w3.org/2000/svg" width="1em" height="1em" fill="currentColor" viewBox="0 0 256 256" aria-hidden="true"><path d="M233.54,142.23a8,8,0,0,0-8-2,88.08,88.08,0,0,1-109.8-109.8,8,8,0,0,0-10-10,104.84,104.84,0,0,0-52.91,37A104,104,0,0,0,136,224a103.09,103.09,0,0,0,62.52-20.88,104.84,104.84,0,0,0,37-52.91A8,8,0,0,0,233.54,142.23ZM188.9,190.34A88,88,0,0,1,65.66,67.11a89,89,0,0,1,31.4-26A106,106,0,0,0,96,56,104.11,104.11,0,0,0,200,160a106,106,0,0,0,14.92-1.06A89,89,0,0,1,188.9,190.34Z"></path></svg></span></button><span id=":Rnj5:" style="position:fixed" hidden=""></span></div></div></footer><link
rel="modulepreload" href="/frontend-assets/manifest-67830084.js"/><link
rel="modulepreload" href="/frontend-assets/entry.client-BS4mLQdq.js"/><link
rel="modulepreload" href="/frontend-assets/jsx-runtime-Dgm-cqF7.js"/><link
rel="modulepreload" href="/frontend-assets/exports-BZMQLlpl.js"/><link
rel="modulepreload" href="/frontend-assets/env-EKHJ7Xvn.js"/><link
rel="modulepreload" href="/frontend-assets/index-BXA5qGEp.js"/><link
rel="modulepreload" href="/frontend-assets/sitemap-frontend_._xml-D7Y4D-KF.js"/><link
rel="modulepreload" href="/frontend-assets/index-Cl8Rf4oY.js"/><link
rel="modulepreload" href="/frontend-assets/index-CbScJO5J.js"/><link
rel="modulepreload" href="/frontend-assets/components-BG4HJmcs.js"/><link
rel="modulepreload" href="/frontend-assets/index-DMRs56b-.js"/><link
rel="modulepreload" href="/frontend-assets/avatar-menu-BmsVaUxj.js"/><link
rel="modulepreload" href="/frontend-assets/glyph-loader-hQHK-gUp.js"/><link
rel="modulepreload" href="/frontend-assets/client-only-CTgu87Fw.js"/><link
rel="modulepreload" href="/frontend-assets/index-DqK8_yBz.js"/><link
rel="modulepreload" href="/frontend-assets/Warning-E3sNqDty.js"/><link
rel="modulepreload" href="/frontend-assets/bg-goo-kzFvpDYy.js"/><link
rel="modulepreload" href="/frontend-assets/index-g70-E7pN.js"/><link
rel="modulepreload" href="/frontend-assets/index-0wdBTNeh.js"/><link
rel="modulepreload" href="/frontend-assets/index-5DnRZ27y.js"/><link
rel="modulepreload" href="/frontend-assets/IconBase-BijvMpG7.js"/><link
rel="modulepreload" href="/frontend-assets/index-BJEPNQMR.js"/><link
rel="modulepreload" href="/frontend-assets/index-CX0QHlGP.js"/><link
rel="modulepreload" href="/frontend-assets/tooltip-provider-BMT24CM9.js"/><link
rel="modulepreload" href="/frontend-assets/CO7ZDQU2-BFuNuTN9.js"/><link
rel="modulepreload" href="/frontend-assets/string-CTc_OE_H.js"/><link
rel="modulepreload" href="/frontend-assets/OIB4PV4M-DQW3M9NW.js"/><link
rel="modulepreload" href="/frontend-assets/isBrowser-BQ9AB6EB.js"/><link rel="modulepreload" href="/frontend-assets/index-B_3ptoRv.js"/><link rel="modulepreload" href="/frontend-assets/use-in-view-B1669etU.js"/><link rel="modulepreload" href="/frontend-assets/resolve-element-CuSV-CWS.js"/><link rel="modulepreload" href="/frontend-assets/proxy-BbQZqLBY.js"/><link rel="modulepreload" href="/frontend-assets/root-BP_mC3Sm.js"/><link rel="modulepreload" href="/frontend-assets/index-IRMWvoiJ.js"/><link rel="modulepreload" href="/frontend-assets/index-CSvAeq6o.js"/><link rel="modulepreload" href="/frontend-assets/layout-lnCEgoRq.js"/><link rel="modulepreload" href="/frontend-assets/Rss-CYHcKmIx.js"/><link rel="modulepreload" href="/frontend-assets/logo-glyph-CLxWJ3ua.js"/><link rel="modulepreload" href="/frontend-assets/index-Cu5O9l-Z.js"/><script>window.__remixContext = {"basename":"/","future":{"v3_fetcherPersist":false,"v3_relativeSplatPath":false,"v3_throwAbortReason":false,"unstable_singleFetch":false,"unstable_lazyRouteDiscovery":false,"unstable_optimizeDeps":true},"isSpaMode":false,"state":{"loaderData":{"root":{"theme":null,"remixVersion":2},"routes/blog/layout":{"metadata":{"all-the-llamas":{"title":"What’s the difference between Llama 2 7B, 13B, and 70B?","authors":["zeke"],"intro":"Let's break down the differences between the Llama 2 models and help you choose the right one for your use case.","image":"assets/blog/all-the-llamas/all-the-llamas.jpg","published_at":"2023-08-04T00:00:00.000Z","unlisted":true,"publishedAtDisplay":"August 4, 2023"},"animatediff-interpolator":{"title":"Make smooth AI generated videos with AnimateDiff and an interpolator","authors":["fofr","zsxkib"],"intro":"Combine AnimateDiff and the ST-MFNet frame interpolator to create smooth and realistic videos from a text prompt","image":"assets/blog/animatediff-interpolator/animatediff.webp","published_at":"2023-10-04T00:00:00.000Z","publishedAtDisplay":"October 4, 
2023"},"autocog":{"title":"AutoCog — Generate Cog configuration with GPT-4","authors":["andreasjansson"],"intro":"Give it a machine learning directory and AutoCog will create predict.py and cog.yaml until it successfully runs a prediction","image":"assets/blog/autocog/autocog.png","published_at":"2023-04-19T00:00:00.000Z","publishedAtDisplay":"April 19, 2023"},"build-a-robot-artist-for-your-discord-server-with-stable-diffusion":{"title":"Build a robot artist for your Discord server with Stable Diffusion, Replicate, and Fly.io","authors":["zeke,","evilstreak","bfirsh"],"intro":"A tutorial for building a chat bot that replies to prompts with the output of a text-to-image model.","image":"assets/blog/discord-bot/dreaming-of-rabbits.png","published_at":"2022-08-25T00:00:00.000Z","publishedAtDisplay":"August 25, 2022"},"constraining-clipdraw":{"title":"Constraining CLIPDraw","authors":["evilstreak"],"intro":"An introduction to differentiable programming and the process of refining generative art models.","published_at":"2022-05-27T00:00:00.000Z","publishedAtDisplay":"May 27, 2022"},"cutting-prices-in-half":{"title":"We're cutting our prices in half","authors":["bfirsh"],"intro":"The price of public models is being cut in half, and soon we'll start charging new users for setup and idle time on private models.","image":"assets/blog/cutting-prices-in-half/out-3-1.png","published_at":"2023-08-16T00:00:00.000Z","publishedAtDisplay":"August 16, 2023"},"daily-news":{"title":"Illustrating the news with AI","authors":["vccheng2001"],"intro":"Creating a web app to illustrate news headlines with AI-generated visualizations","published_at":"2022-07-28T00:00:00.000Z","unlisted":true,"publishedAtDisplay":"July 28, 2022"},"data-urls-in-our-sync-api":{"title":"We messed up: data URLs in our sync API","authors":["nickstenning","evilstreak"],"intro":"We've decided to stop returning data URLs in sync API outputs based on feedback from users. 
We're going to take a few steps back and figure out the best way to get your model output as fast as possible.","published_at":"2024-10-31T00:00:00.000Z","publishedAtDisplay":"October 31, 2024"},"dreambooth-api":{"title":"Train and deploy a DreamBooth model on Replicate","authors":["bfirsh","zeke"],"intro":"With just a handful of images and a single API call, you can train a model, publish it to Replicate, and run predictions on it in the cloud.","image":"assets/blog/dreambooth-api/Untitled.png","published_at":"2022-11-21T00:00:00.000Z","publishedAtDisplay":"November 21, 2022"},"exploring-text-to-image-models":{"title":"Exploring text to image models","authors":["afiaka87","rossjillian"],"intro":"The basics of using the API to create your own images from text.","published_at":"2022-07-18T00:00:00.000Z","publishedAtDisplay":"July 18, 2022"},"fast-flux-fine-tunes":{"title":"FLUX fine-tunes are now fast","authors":["bfirsh"],"intro":"We've made running fine-tunes on Replicate much faster, and the optimizations are open-source.","image":"assets/blog/fast-flux-fine-tunes/out-0-11.webp","published_at":"2024-11-26T00:00:00.000Z","publishedAtDisplay":"November 26, 2024"},"fine-tune-alpaca-with-lora":{"title":"How to use Alpaca-LoRA to fine-tune a model like ChatGPT","authors":["andreasjansson","daanelson","zeke"],"intro":"","image":"assets/blog/fine-tune-alpaca-with-lora/alpaca-lora.jpg","published_at":"2023-03-23T00:00:00.000Z","publishedAtDisplay":"March 23, 2023"},"fine-tune-cold-boots":{"title":"Fine-tuned models now boot in less than one second","authors":["andreasjansson"],"intro":"We've made some dramatic improvements to cold boots for fine-tuned models.","image":"assets/blog/fine-tune-cold-boots/fast-llamas.webp","og_image":"assets/blog/fine-tune-cold-boots/fast-llamas.jpg","published_at":"2023-09-06T00:00:00.000Z","publishedAtDisplay":"September 6, 2023"},"fine-tune-flux-with-an-api":{"title":"Fine-tune FLUX.1 with an API","authors":["zeke"],"intro":"Create and 
run your own fine-tuned Flux models programmatically using Replicate's HTTP API.","image":"assets/blog/fine-tune-flux-with-an-api/cover.jpg","published_at":"2024-09-09T00:00:00.000Z","publishedAtDisplay":"September 9, 2024"},"fine-tune-flux-with-faces":{"title":"Fine-tune FLUX.1 to create images of yourself","authors":["zeke"],"intro":"Create your own fine-tuned Flux model to generate new images of yourself.","image":"assets/blog/fine-tune-flux-with-faces/cover.jpg","published_at":"2024-08-30T00:00:00.000Z","publishedAtDisplay":"August 30, 2024"},"fine-tune-flux":{"title":"Fine-tune FLUX.1 with your own images","authors":["deepfates"],"intro":"We've added fine-tuning (LoRA) support to FLUX.1 image generation models. You can train FLUX.1 on your own images with one line of code using Replicate's API.","image":"assets/blog/fine-tune-flux/cover.jpg","published_at":"2024-08-15T00:00:00.000Z","publishedAtDisplay":"August 15, 2024"},"fine-tune-llama-2":{"title":"Fine-tune Llama 2 on Replicate","authors":["cbh123"],"intro":"So you want to train a llama...","image":"assets/blog/fine-tune-llama-2/llama-salon.png","published_at":"2023-07-20T00:00:00.000Z","publishedAtDisplay":"July 20, 2023"},"fine-tune-llama-to-speak-like-homer-simpson":{"title":"Fine-tune LLaMA to speak like Homer Simpson","authors":["bfirsh"],"intro":"With a small amount of data and an hour of training you can make LLaMA output text in the voice of the dataset.","image":"assets/blog/homer/robot-homer.webp","og_image":"assets/blog/homer/robot-homer.jpg","published_at":"2023-03-17T00:00:00.000Z","publishedAtDisplay":"March 17, 2023"},"fine-tune-musicgen":{"title":"Fine-tune MusicGen to generate music in any style","authors":["fofr","sakemin"],"intro":"We’ve added fine-tuning support to MusicGen. 
You can train the small, medium and melody models on your own audio files using Replicate.","image":"assets/blog/fine-tune-musicgen/fine-tune-musicgen.webp","og_image":"assets/blog/fine-tune-musicgen/fine-tune-musicgen.jpg","published_at":"2023-10-13T00:00:00.000Z","publishedAtDisplay":"October 13, 2023"},"fine-tune-sdxl":{"title":"Fine-tune SDXL with your own images","authors":["andreasjansson","anotherjesse","cloneofsimo","daanelson"],"intro":"We’ve added fine-tuning (Dreambooth, Textual Inversion and LoRA) support to SDXL 1.0. You can train SDXL on your own images with one line of code using the Replicate API.","image":"assets/blog/fine-tune-sdxl/out-3-8.png","published_at":"2023-08-08T00:00:00.000Z","publishedAtDisplay":"August 8, 2023"},"flux-1-1-pro-is-here":{"title":"FLUX1.1 [pro] is here","authors":["zeke"],"intro":"Black Forest Labs continue to push boundaries with their latest release of FLUX.1 image generation model.","image":"assets/blog/flux-1-1-pro-is-here/cover.webp","published_at":"2024-10-03T00:00:00.000Z","publishedAtDisplay":"October 3, 2024"},"flux-first-impressions":{"title":"FLUX.1: First Impressions","authors":["deepfates"],"published_at":"2024-08-02T00:00:00.000Z","intro":"We explore FLUX.1's unique strengths and aesthetics to see what we can generate.","image":"assets/blog/flux-first-impressions/library.webp","publishedAtDisplay":"August 2, 2024"},"flux-is-fast-and-open-source":{"title":"FLUX is fast and it's open source","authors":["bfirsh"],"intro":"FLUX is now much faster on Replicate, and we’ve made our optimizations open-source so you can see exactly how they work and build upon them.","image":"assets/blog/flux-is-fast/cover.png","published_at":"2024-10-10T00:00:00.000Z","publishedAtDisplay":"October 10, 2024"},"flux-state-of-the-art-image-generation":{"title":"Run FLUX with an API","authors":["zeke","zsxkib"],"intro":"FLUX.1 is a new text-to-image model from Black Forest Labs, the creators of Stable Diffusion, that exceeds the 
capabilities of previous open-source models.","image":"assets/blog/flux/cover.jpg","published_at":"2024-08-01T00:00:00.000Z","publishedAtDisplay":"August 1, 2024"},"flux-tools":{"title":"FLUX.1 Tools – Control and steerability for FLUX","authors":["zeke","fofr"],"intro":"A new set of image generation capabilities for FLUX models, including inpainting, outpainting, canny edge detection, and depth maps.","image":"assets/blog/flux-tools/cover.png","published_at":"2024-11-21T00:00:00.000Z","publishedAtDisplay":"November 21, 2024"},"generate-music-from-chord-progressions-musicgen-chord":{"title":"Generate music from chord progressions and text prompts with MusicGen-Chord","authors":["sakemin"],"intro":"We’ve added chord conditioning to Meta’s MusicGen model, so you can create automatic backing tracks in any style using text prompts and chord progressions.","image":"assets/blog/generate-music-from-chord-progressions-musicgen-chord/cover.png","og_image":"assets/blog/generate-music-from-chord-progressions-musicgen-chord/cover.png","published_at":"2023-11-08T00:00:00.000Z","publishedAtDisplay":"November 8, 2023"},"get-the-best-from-stable-diffusion-3":{"title":"How to get the best results from Stable Diffusion 3","authors":["fofr"],"published_at":"2024-06-18T00:00:00.000Z","intro":"We show you how to use Stable Diffusion 3 to get the best images, including new techniques for prompting.","image":"assets/blog/get-the-best-from-stable-diffusion-3/get-the-best-from-stable-diffusion-3.webp","publishedAtDisplay":"June 18, 2024"},"grab-hundreds-of-images-with-clip-and-laion":{"title":"Automating image collection","authors":["afiaka87"],"intro":"Using CLIP and LAION5B to collect thousands of captioned images.","published_at":"2022-08-05T00:00:00.000Z","publishedAtDisplay":"August 5, 2022"},"h100s-are-coming":{"title":"H100s are coming to Replicate","authors":["zeke"],"intro":"We'll soon support NVIDIA's H100 GPUs for predictions and training. 
Let us know if you want early access.","image":"assets/blog/h100s-are-coming/h100s-are-coming.webp","published_at":"2024-06-12T00:00:00.000Z","publishedAtDisplay":"June 12, 2024"},"hello-world":{"title":"Hello, world!","authors":["evilstreak","zeke"],"intro":"We're a small team of engineers and machine learning enthusiasts working to make machine learning more accessible.","published_at":"2022-05-16T00:00:00.000Z","publishedAtDisplay":"May 16, 2022"},"how-to-create-an-ai-narrator":{"title":"How to create an AI narrator for your life","authors":["cbh123"],"intro":"Or, how I met a virtual David Attenborough.","image":"assets/blog/ai-narrator/2023-12-01_at_11.58.52.png","published_at":"2023-12-06T00:00:00.000Z","publishedAtDisplay":"December 6, 2023"},"how-to-prompt-llama":{"title":"A guide to prompting Llama 2","authors":["cbh123"],"intro":"Learn the art of the Llama prompt.","image":"assets/blog/prompt-llama/llama-typing.png","published_at":"2023-08-14T00:00:00.000Z","publishedAtDisplay":"August 14, 2023"},"how-to-tune-a-realistic-voice-clone":{"title":"Clone your voice using open-source models","authors":["zsxkib","fofr"],"intro":"We’ve added fine-tuning for realistic voice cloning (RVC). 
You can train RVC on your own dataset from a YouTube video with a few lines of code using Replicate's API.","image":"assets/blog/how-to-tune-a-realistic-voice-clone/rvc.jpg","published_at":"2023-12-06T00:00:00.000Z","publishedAtDisplay":"December 6, 2023"},"how-to-use-rag-with-chromadb-and-mistral-7b-instruct":{"title":"How to use retrieval augmented generation with ChromaDB and Mistral","authors":["jakedahn"],"intro":"In this post we'll explore the basics of retrieval augmented generation by creating an example app that uses bge-large-en for embeddings, ChromaDB for vector store, and mistral-7b-instruct for language model generation.","published_at":"2023-10-17T00:00:00.000Z","image":"assets/blog/how-to-use-rag-with-chromadb-and-mistral-7b-instruct/rag-cover-image.webp","og_image":"assets/blog/how-to-use-rag-with-chromadb-and-mistral-7b-instruct/rag-cover-image.jpg","publishedAtDisplay":"October 17, 2023"},"ideogram-v2-inpainting":{"title":"Ideogram v2 is an outstanding new inpainting model","authors":["andreasjansson"],"intro":"We've partnered with Ideogram to bring their inpainting model to Replicate's API.","image":"assets/blog/ideogram-v2-inpainting/cover.png","published_at":"2024-10-22T00:00:00.000Z","publishedAtDisplay":"October 22, 2024"},"language-model-roundup":{"title":"Language model roundup, April 2023","authors":["joehoover","mattt","zeke"],"intro":"A roundup of recent developments from the world of open-source language models.","image":"assets/blog/language-model-roundup/language-model-roundup.jpg","published_at":"2023-04-21T00:00:00.000Z","publishedAtDisplay":"April 21, 2023"},"language-models":{"title":"Language models are on Replicate","authors":["bfirsh"],"intro":"","image":"assets/blog/language-models/out-2.png","published_at":"2023-04-05T00:00:00.000Z","publishedAtDisplay":"April 5, 2023"},"llama-2-grammars":{"title":"Jet-setting with Llama 2 + Grammars","authors":["mattt"],"intro":"How to use Llama 2 models with grammars for information 
extraction tasks.","image":"assets/blog/llama-2-grammars/llama2-grammar.webp","og_image":"assets/blog/llama-2-grammars/llama2-grammar.jpg","published_at":"2023-10-09T00:00:00.000Z","publishedAtDisplay":"October 9, 2023"},"llama-2-roundup":{"title":"What happened with Llama 2 in the last 24 hours? 🦙","authors":["cbh123","zeke"],"intro":"A roundup of recent developments from the llamaverse following the second major release of Meta's open-source large language model.","image":"assets/blog/llama-2-roundup/llama2.jpg","published_at":"2023-07-19T00:00:00.000Z","publishedAtDisplay":"July 19, 2023"},"llama-roundup":{"title":"Week 3 of LLaMA 🦙","authors":["zeke"],"intro":"A roundup of recent developments from the llamaverse.","image":"assets/blog/llama-roundup/llama-astronaut.jpg","published_at":"2023-03-18T00:00:00.000Z","publishedAtDisplay":"March 18, 2023"},"lora-faster-fine-tuning-of-stable-diffusion":{"title":"Introducing LoRA: A faster way to fine-tune Stable Diffusion","authors":["cloneofsimo","andreasjansson","anotherjesse","zeke"],"intro":"It's like DreamBooth, but much faster. 
And you can run it in the cloud on Replicate.","image":"assets/blog/lora-api/lora-api.png","published_at":"2023-02-07T00:00:00.000Z","publishedAtDisplay":"February 7, 2023"},"machine-learning-needs-better-tools":{"title":"Machine learning needs better tools","authors":["bfirsh"],"intro":"Lots of people want to build things with machine learning, but they don't have the expertise to use it.","published_at":"2023-02-21T00:00:00.000Z","image":"assets/blog/machine-learning-is-just-software/cover.png","publishedAtDisplay":"February 21, 2023"},"model-docs":{"title":"A new template for model READMEs","authors":["rossjillian","zeke"],"intro":"Inspired by model cards, we've created templates for documenting models on Replicate.","published_at":"2022-07-05T00:00:00.000Z","publishedAtDisplay":"July 5, 2022"},"new-status-page":{"title":"Status page","authors":["nickstenning","zeke"],"intro":"We've added a status page to provide real-time updates on the health of Replicate.","image":"assets/blog/status-page/nines.jpg","published_at":"2023-05-18T00:00:00.000Z","publishedAtDisplay":"May 18, 2023"},"nvidia-l40s-gpus-are-here":{"title":"NVIDIA L40S GPUs are here","authors":["zeke"],"intro":"NVIDIA L40S GPUs are here, with better performance and lower cost.","image":"assets/blog/nvidia-l40s-gpus-are-here/cover.png","published_at":"2024-11-15T00:00:00.000Z","publishedAtDisplay":"November 15, 2024"},"official-models":{"title":"Explore Replicate’s official models","authors":["superhighfives"],"intro":"Replicate now has official models. Official models are always on, fast, and high quality. They have predictable pricing and dedicated support. 
They're a reliable choice to build projects on.","image":"assets/blog/official-models/cover.jpg","published_at":"2024-09-02T00:00:00.000Z","unlisted":true,"publishedAtDisplay":"September 2, 2024"},"painting-with-words-a-history-of-text-to-image-ai":{"title":"Painting with words: a history of text-to-image AI","authors":["jakedahn"],"intro":"With the recent release of Stable Diffusion XL fine-tuning on Replicate, and today being the 1-year anniversary of Stable Diffusion, now feels like the perfect opportunity to take a step back and reflect on how text-to-image AI has improved over the last few years.","image":"assets/blog/painting-with-words-a-history-of-text-to-image-ai/sketch_of_internet_is_a_series_of_tubes_by_Leonardo_da_Vinci.png","published_at":"2023-08-22T00:00:00.000Z","publishedAtDisplay":"August 22, 2023"},"push-a-custom-sd3":{"title":"Push a custom version of Stable Diffusion 3","authors":["zeke"],"intro":"Create your own custom version of Stability's latest image generation model and run it on Replicate via the web or API.","image":"assets/blog/push-a-custom-sd3/push-a-custom-sd3.webp","published_at":"2024-06-14T00:00:00.000Z","publishedAtDisplay":"June 14, 2024"},"replicate-alpaca":{"title":"Train and run Stanford Alpaca on your own machine","authors":["zeke"],"intro":"We'll show you how to train Alpaca, a fine-tuned version of LLaMA that can respond to instructions like ChatGPT.","image":"assets/blog/replicate-alpaca/party-alpaca.png","published_at":"2023-03-16T00:00:00.000Z","publishedAtDisplay":"March 16, 2023"},"replicate-intelligence-2024-05-24":{"authors":["deepfates"],"title":"Replicate Intelligence #1","intro":"DIY Llama 3 implementation, open-source smart glasses, steering language models with dictionary learning","published_at":"2024-05-24T00:00:00.000Z","publishedAtDisplay":"May 24, 2024"},"replicate-intelligence-2024-05-31":{"title":"Replicate Intelligence #2","authors":["deepfates"],"intro":"Faster image generation, AI-powered world 
simulator, insights on AI dataset complexity","published_at":"2024-05-31T00:00:00.000Z","publishedAtDisplay":"May 31, 2024"},"replicate-intelligence-2024-06-07":{"authors":["deepfates"],"title":"Replicate Intelligence #3","intro":"Garden State Llama, applied LLMs guide, real-time image generation","published_at":"2024-06-07T00:00:00.000Z","publishedAtDisplay":"June 7, 2024"},"replicate-intelligence-2024-06-14":{"authors":["deepfates"],"title":"Replicate Intelligence #4","intro":"Find concepts in GPT models, real-time speech to text in the browser, H100s are coming","published_at":"2024-06-14T00:00:00.000Z","publishedAtDisplay":"June 14, 2024"},"replicate-intelligence-2024-06-21":{"authors":["deepfates"],"title":"Replicate Intelligence #5","intro":"Really good coding model, AI search breakthroughs, Discord support bot","published_at":"2024-06-21T00:00:00.000Z","publishedAtDisplay":"June 21, 2024"},"replicate-intelligence-2024-06-28":{"authors":["deepfates"],"title":"Replicate Intelligence #6","intro":"Google's Gemma2 models, language model leaderboard, tips for Stable Diffusion 3","published_at":"2024-06-28T00:00:00.000Z","publishedAtDisplay":"June 28, 2024"},"replicate-intelligence-2024-07-12":{"authors":["deepfates"],"title":"Replicate Intelligence #7","intro":"Data curation, data generation, data data data","published_at":"2024-07-12T00:00:00.000Z","publishedAtDisplay":"July 12, 2024"},"replicate-intelligence-2024-07-26":{"authors":["deepfates"],"title":"Replicate Intelligence #8","intro":"A top-tier open-ish language model, new safety classifiers, model search API","published_at":"2024-07-26T00:00:00.000Z","publishedAtDisplay":"July 26, 2024"},"replicate-intelligence-2024-08-02":{"authors":["deepfates"],"title":"Replicate Intelligence #9","intro":"Open source frontier image model, cut objects from videos, new Python web framework from Jeremy Howard","published_at":"2024-08-02T00:00:00.000Z","publishedAtDisplay":"August 2, 
2024"},"replicate-intelligence-2024-08-09":{"authors":["deepfates"],"title":"Replicate Intelligence #10","intro":"Flux developments, Minecraft bot, Streamlit cookbook with Zeke","published_at":"2024-08-09T00:00:00.000Z","publishedAtDisplay":"August 9, 2024"},"replicate-intelligence-2024-08-16":{"authors":["deepfates"],"title":"Replicate Intelligence #11","intro":"Fine tune FLUX.1, generative video games, a vision for the metaverse","published_at":"2024-08-16T00:00:00.000Z","publishedAtDisplay":"August 16, 2024"},"replicate-intelligence-2024-08-23":{"authors":["deepfates"],"title":"Replicate Intelligence #12","intro":"Flux LoRAs, Hot Zuck, and Replicate on Lex Fridman","published_at":"2024-08-23T00:00:00.000Z","publishedAtDisplay":"August 23, 2024"},"replicate-scaffold":{"title":"Scaffold Replicate apps with one command","authors":["jakedahn","mattrothenberg"],"intro":"We've added a CLI command that makes it easy to get started with Replicate.","image":"assets/blog/ready-set-scaffold/scaffold-llama.jpg","published_at":"2023-11-22T00:00:00.000Z","publishedAtDisplay":"November 22, 2023"},"run-arctic-with-an-api":{"title":"Run Snowflake Arctic with an API","authors":["cbh123"],"intro":"Arctic is a new open-source language model from Snowflake. 
Learn how to run it in the cloud with one line of code.","image":"assets/blog/arctic-api/snowflake_arctic.png","published_at":"2024-04-23T00:00:00.000Z","publishedAtDisplay":"April 23, 2024"},"run-bge-embedding-models":{"title":"Using open-source models for faster and cheaper text embeddings","authors":["nateraw"],"intro":"An interactive example showing how to embed text using a state-of-the-art embedding model that beats OpenAI's embeddings API on price and performance.","image":"assets/blog/run-bge-embedding-models/cover.jpg","published_at":"2023-11-10T00:00:00.000Z","publishedAtDisplay":"November 10, 2023"},"run-codellama-with-an-api":{"title":"Run Code Llama 70B with an API","authors":["cbh123"],"intro":"Code Llama 70B is one of the powerful open-source code generation models. Learn how to run it in the cloud with one line of code.","image":"assets/blog/codellama/codellama.png","published_at":"2024-01-30T00:00:00.000Z","publishedAtDisplay":"January 30, 2024"},"run-latent-consistency-model-on-mac":{"title":"Generate images in one second on your Mac using a latent consistency model","authors":["fofr"],"intro":"How to run a latent consistency model on your M1 or M2 Mac","image":"assets/blog/run-latent-consistency-model-on-mac/cover.webp","og_image":"assets/blog/run-latent-consistency-model-on-mac/og.jpg","published_at":"2023-10-25T00:00:00.000Z","publishedAtDisplay":"October 25, 2023"},"run-llama-2-with-an-api":{"title":"Run Llama 2 with an API","authors":["joehoover"],"intro":"Llama 2 is the first open source language model of the same caliber as OpenAI’s models. Learn how to run it in the cloud with one line of code.","image":"assets/blog/llama-api/llama-clouds.png","published_at":"2023-07-27T00:00:00.000Z","publishedAtDisplay":"July 27, 2023"},"run-llama-3-1-with-an-api":{"title":"Run Meta Llama 3.1 405B with an API","authors":["deepfates"],"intro":"Llama 3.1 405B: is the most powerful open-source language model from Meta. 
Learn how to run it in the cloud with one line of code.","image":"assets/blog/llama-3-api/meta.png","published_at":"2024-07-23T00:00:00.000Z","publishedAtDisplay":"July 23, 2024"},"run-llama-3-with-an-api":{"title":"Run Meta Llama 3 with an API","authors":["cbh123"],"intro":"Llama 3 is the latest language model from Meta. Learn how to run it in the cloud with one line of code.","image":"assets/blog/llama-3-api/meta.png","published_at":"2024-04-18T00:00:00.000Z","publishedAtDisplay":"April 18, 2024"},"run-llama-locally":{"title":"A comprehensive guide to running Llama 2 locally","authors":["zeke"],"published_at":"2023-07-22T00:00:00.000Z","intro":"How to run Llama 2 on Mac, Linux, Windows, and your phone.","image":"assets/blog/run-llama-locally/llama-captain.jpg","publishedAtDisplay":"July 22, 2023"},"run-mistral-7b-with-api":{"title":"How to run Mistral 7B with an API","authors":["daanelson","zeke"],"published_at":"2023-10-06T00:00:00.000Z","intro":"Mistral 7B is an open-source large language model. 
Learn what it's good at and how to run it in the cloud with one line of code.","image":"assets/blog/demystifying-mistral-7b/mistral_box.jpeg","publishedAtDisplay":"October 6, 2023"},"run-nvidia-nim-models-on-replicate":{"title":"Simplified AI Inference APIs on Replicate with NVIDIA NIM","authors":["andreasjansson","zeke"],"published_at":"2024-06-02T00:00:00.000Z","intro":"","image":"assets/blog/run-nvidia-nim-models-on-replicate/nim-square.png","og_image":"assets/blog/run-nvidia-nim-models-on-replicate/nim-opengraph.png","unlisted":true,"publishedAtDisplay":"June 2, 2024"},"run-sd3-on-comfyui":{"title":"Run Stable Diffusion 3 on your own machine with ComfyUI","authors":["zsxkib","zeke"],"intro":"Copy and paste a few commands into terminal to play with Stable Diffusion 3 on your own GPU-powered machine.","image":"assets/blog/sd3-comfyui-steps/comfyui-sd3.webp","published_at":"2024-06-14T00:00:00.000Z","publishedAtDisplay":"June 14, 2024"},"run-sdxl-with-an-api":{"title":"Run SDXL with an API","authors":["fofr"],"published_at":"2023-07-26T00:00:00.000Z","intro":"How to run Stable Diffusion XL 1.0 using the Replicate API","image":"assets/blog/run-sdxl-with-an-api/astronaut-riding-unicorn.webp","og_image":"assets/blog/run-sdxl-with-an-api/astronaut-riding-unicorn.jpg","publishedAtDisplay":"July 26, 2023"},"run-stable-diffusion-3-on-apple-silicon-mac":{"title":"Run Stable Diffusion 3 on your Apple Silicon Mac","authors":["zsxkib"],"intro":"A step-by-step guide to generating images with Stable Diffusion 3 on your M-series Mac using MPS acceleration.","image":"assets/blog/sd3-mac-mps/cover.webp","published_at":"2024-06-18T00:00:00.000Z","publishedAtDisplay":"June 18, 2024"},"run-stable-diffusion-3-with-an-api":{"title":"Run Stable Diffusion 3 with an API","authors":["cbh123"],"intro":"Stable Diffusion 3 is the latest text-to-image model from Stability, with improved image quality, typography, prompt understanding, and resource efficiency. 
Learn how to run it in the cloud with one line of code.","image":"assets/blog/stable-diffusion-3-api/stability-ai.webp","published_at":"2024-06-12T00:00:00.000Z","publishedAtDisplay":"June 12, 2024"},"run-stable-diffusion-on-m1-mac":{"title":"Run Stable Diffusion on your M1 Mac’s GPU","authors":["bfirsh"],"intro":"How to run Stable Diffusion locally so you can hack on it","image":"assets/blog/run-stable-diffusion-on-m1-mac/grid-0002.png","published_at":"2022-08-31T00:00:00.000Z","publishedAtDisplay":"August 31, 2022"},"run-stable-diffusion-with-an-api":{"title":"Run Stable Diffusion with an API","authors":["zeke"],"intro":"How to use Replicate to integrate Stable Diffusion into hacks, apps, and projects","image":"assets/blog/run-stable-diffusion-with-an-api/out-0-3.png","published_at":"2022-08-29T00:00:00.000Z","publishedAtDisplay":"August 29, 2022"},"run-yi-chat-with-api":{"title":"How to run Yi chat models with an API","authors":["nateraw"],"published_at":"2023-11-23T00:00:00.000Z","intro":"The Yi series models are large language models trained from scratch by developers at 01.AI. 
Learn how to run them in the cloud with one line of code.","image":"assets/blog/run-yi-chat-with-api/Yi.svg","publishedAtDisplay":"November 23, 2023"},"series-b":{"title":"Businesses are building on open-source AI","authors":["bfirsh"],"published_at":"2023-12-05T00:00:00.000Z","intro":"We've raised a $40 million Series B led by a16z.","image":"assets/blog/series-b/goo-logo.jpg","publishedAtDisplay":"December 5, 2023"},"shared-network-vulnerability-disclosure":{"title":"Shared network vulnerability disclosure","authors":["nickstenning","philandstuff","zeke"],"published_at":"2024-05-23T00:00:00.000Z","publishedAtDisplay":"May 23, 2024"},"stable-diffusion-3-5-is-here":{"title":"Stable Diffusion 3.5 is here","authors":["deepfates"],"intro":"Stability AI's latest text-to-image model is now available on Replicate and you can run it with an API.","image":"assets/blog/stable-diffusion-3-5-is-here/cover.webp","published_at":"2024-10-22T00:00:00.000Z","publishedAtDisplay":"October 22, 2024"},"streaming":{"title":"Streaming output for language models","authors":["zeke"],"intro":"Our API now supports server-sent event streams for language models. 
Learn how to use them to make your apps more responsive.","image":"assets/blog/streaming/streaming.jpg","published_at":"2023-08-14T00:00:00.000Z","publishedAtDisplay":"August 14, 2023"},"turn-your-llm-into-a-poet":{"title":"Make any large language model a better poet","authors":["joehoover"],"published_at":"2023-05-26T00:00:00.000Z","intro":"Prompt engineering and training are often the first solutions we reach for to improve language model behavior, but they're not the only way.","image":"assets/blog/poet/poet.jpg","publishedAtDisplay":"May 26, 2023"},"uncanny-spaces":{"title":"Join us at Uncanny Spaces","authors":["rossjillian"],"intro":"We're bringing people together to explore what's being created with machine learning.","published_at":"2022-08-11T00:00:00.000Z","publishedAtDisplay":"August 11, 2022"},"using-synthetic-data-to-improve-flux-finetunes":{"title":"Using synthetic training data to improve Flux finetunes","authors":["zeke"],"intro":"It's easy to fine-tune Flux, but sometimes you need to do a little more work to get the best results. 
This post covers techniques you can use to improve your fine-tuned Flux models.","image":"assets/blog/using-synthetic-data-to-improve-flux-finetunes/cover.jpg","published_at":"2024-09-20T00:00:00.000Z","publishedAtDisplay":"September 20, 2024"}}},"routes/blog/index":{"posts":[{"slug":"fast-flux-fine-tunes","title":"FLUX fine-tunes are now fast","intro":"We've made running fine-tunes on Replicate much faster, and the optimizations are open-source.","image":"assets/blog/fast-flux-fine-tunes/out-0-11.webp","authors":["bfirsh"],"publishedAt":"2024-11-26T00:00:00.000Z","publishedAtDisplay":"November 26, 2024","unlisted":false},{"slug":"flux-tools","title":"FLUX.1 Tools – Control and steerability for FLUX","intro":"A new set of image generation capabilities for FLUX models, including inpainting, outpainting, canny edge detection, and depth maps.","image":"assets/blog/flux-tools/cover.png","authors":["zeke","fofr"],"publishedAt":"2024-11-21T00:00:00.000Z","publishedAtDisplay":"November 21, 2024","unlisted":false},{"slug":"nvidia-l40s-gpus-are-here","title":"NVIDIA L40S GPUs are here","intro":"NVIDIA L40S GPUs are here, with better performance and lower cost.","image":"assets/blog/nvidia-l40s-gpus-are-here/cover.png","authors":["zeke"],"publishedAt":"2024-11-15T00:00:00.000Z","publishedAtDisplay":"November 15, 2024","unlisted":false},{"slug":"data-urls-in-our-sync-api","title":"We messed up: data URLs in our sync API","intro":"We've decided to stop returning data URLs in sync API outputs based on feedback from users. 
We're going to take a few steps back and figure out the best way to get your model output as fast as possible.","authors":["nickstenning","evilstreak"],"publishedAt":"2024-10-31T00:00:00.000Z","publishedAtDisplay":"October 31, 2024","unlisted":false},{"slug":"ideogram-v2-inpainting","title":"Ideogram v2 is an outstanding new inpainting model","intro":"We've partnered with Ideogram to bring their inpainting model to Replicate's API.","image":"assets/blog/ideogram-v2-inpainting/cover.png","authors":["andreasjansson"],"publishedAt":"2024-10-22T00:00:00.000Z","publishedAtDisplay":"October 22, 2024","unlisted":false},{"slug":"stable-diffusion-3-5-is-here","title":"Stable Diffusion 3.5 is here","intro":"Stability AI's latest text-to-image model is now available on Replicate and you can run it with an API.","image":"assets/blog/stable-diffusion-3-5-is-here/cover.webp","authors":["deepfates"],"publishedAt":"2024-10-22T00:00:00.000Z","publishedAtDisplay":"October 22, 2024","unlisted":false},{"slug":"flux-is-fast-and-open-source","title":"FLUX is fast and it's open source","intro":"FLUX is now much faster on Replicate, and we’ve made our optimizations open-source so you can see exactly how they work and build upon them.","image":"assets/blog/flux-is-fast/cover.png","authors":["bfirsh"],"publishedAt":"2024-10-10T00:00:00.000Z","publishedAtDisplay":"October 10, 2024","unlisted":false},{"slug":"flux-1-1-pro-is-here","title":"FLUX1.1 [pro] is here","intro":"Black Forest Labs continue to push boundaries with their latest release of FLUX.1 image generation model.","image":"assets/blog/flux-1-1-pro-is-here/cover.webp","authors":["zeke"],"publishedAt":"2024-10-03T00:00:00.000Z","publishedAtDisplay":"October 3, 2024","unlisted":false},{"slug":"using-synthetic-data-to-improve-flux-finetunes","title":"Using synthetic training data to improve Flux finetunes","intro":"It's easy to fine-tune Flux, but sometimes you need to do a little more work to get the best results. 
This post covers techniques you can use to improve your fine-tuned Flux models.","image":"assets/blog/using-synthetic-data-to-improve-flux-finetunes/cover.jpg","authors":["zeke"],"publishedAt":"2024-09-20T00:00:00.000Z","publishedAtDisplay":"September 20, 2024","unlisted":false},{"slug":"fine-tune-flux-with-an-api","title":"Fine-tune FLUX.1 with an API","intro":"Create and run your own fine-tuned Flux models programmatically using Replicate's HTTP API.","image":"assets/blog/fine-tune-flux-with-an-api/cover.jpg","authors":["zeke"],"publishedAt":"2024-09-09T00:00:00.000Z","publishedAtDisplay":"September 9, 2024","unlisted":false},{"slug":"fine-tune-flux-with-faces","title":"Fine-tune FLUX.1 to create images of yourself","intro":"Create your own fine-tuned Flux model to generate new images of yourself.","image":"assets/blog/fine-tune-flux-with-faces/cover.jpg","authors":["zeke"],"publishedAt":"2024-08-30T00:00:00.000Z","publishedAtDisplay":"August 30, 2024","unlisted":false},{"slug":"replicate-intelligence-2024-08-23","title":"Replicate Intelligence #12","intro":"Flux LoRAs, Hot Zuck, and Replicate on Lex Fridman","authors":["deepfates"],"publishedAt":"2024-08-23T00:00:00.000Z","publishedAtDisplay":"August 23, 2024","unlisted":false},{"slug":"replicate-intelligence-2024-08-16","title":"Replicate Intelligence #11","intro":"Fine tune FLUX.1, generative video games, a vision for the metaverse","authors":["deepfates"],"publishedAt":"2024-08-16T00:00:00.000Z","publishedAtDisplay":"August 16, 2024","unlisted":false},{"slug":"fine-tune-flux","title":"Fine-tune FLUX.1 with your own images","intro":"We've added fine-tuning (LoRA) support to FLUX.1 image generation models. 
You can train FLUX.1 on your own images with one line of code using Replicate's API.","image":"assets/blog/fine-tune-flux/cover.jpg","authors":["deepfates"],"publishedAt":"2024-08-15T00:00:00.000Z","publishedAtDisplay":"August 15, 2024","unlisted":false},{"slug":"replicate-intelligence-2024-08-09","title":"Replicate Intelligence #10","intro":"Flux developments, Minecraft bot, Streamlit cookbook with Zeke","authors":["deepfates"],"publishedAt":"2024-08-09T00:00:00.000Z","publishedAtDisplay":"August 9, 2024","unlisted":false},{"slug":"flux-first-impressions","title":"FLUX.1: First Impressions","intro":"We explore FLUX.1's unique strengths and aesthetics to see what we can generate.","image":"assets/blog/flux-first-impressions/library.webp","authors":["deepfates"],"publishedAt":"2024-08-02T00:00:00.000Z","publishedAtDisplay":"August 2, 2024","unlisted":false},{"slug":"replicate-intelligence-2024-08-02","title":"Replicate Intelligence #9","intro":"Open source frontier image model, cut objects from videos, new Python web framework from Jeremy Howard","authors":["deepfates"],"publishedAt":"2024-08-02T00:00:00.000Z","publishedAtDisplay":"August 2, 2024","unlisted":false},{"slug":"flux-state-of-the-art-image-generation","title":"Run FLUX with an API","intro":"FLUX.1 is a new text-to-image model from Black Forest Labs, the creators of Stable Diffusion, that exceeds the capabilities of previous open-source models.","image":"assets/blog/flux/cover.jpg","authors":["zeke","zsxkib"],"publishedAt":"2024-08-01T00:00:00.000Z","publishedAtDisplay":"August 1, 2024","unlisted":false},{"slug":"replicate-intelligence-2024-07-26","title":"Replicate Intelligence #8","intro":"A top-tier open-ish language model, new safety classifiers, model search API","authors":["deepfates"],"publishedAt":"2024-07-26T00:00:00.000Z","publishedAtDisplay":"July 26, 2024","unlisted":false},{"slug":"run-llama-3-1-with-an-api","title":"Run Meta Llama 3.1 405B with an API","intro":"Llama 3.1 405B: is the most 
powerful open-source language model from Meta. Learn how to run it in the cloud with one line of code.","image":"assets/blog/llama-3-api/meta.png","authors":["deepfates"],"publishedAt":"2024-07-23T00:00:00.000Z","publishedAtDisplay":"July 23, 2024","unlisted":false},{"slug":"replicate-intelligence-2024-07-12","title":"Replicate Intelligence #7","intro":"Data curation, data generation, data data data","authors":["deepfates"],"publishedAt":"2024-07-12T00:00:00.000Z","publishedAtDisplay":"July 12, 2024","unlisted":false},{"slug":"replicate-intelligence-2024-06-28","title":"Replicate Intelligence #6","intro":"Google's Gemma2 models, language model leaderboard, tips for Stable Diffusion 3","authors":["deepfates"],"publishedAt":"2024-06-28T00:00:00.000Z","publishedAtDisplay":"June 28, 2024","unlisted":false},{"slug":"replicate-intelligence-2024-06-21","title":"Replicate Intelligence #5","intro":"Really good coding model, AI search breakthroughs, Discord support bot","authors":["deepfates"],"publishedAt":"2024-06-21T00:00:00.000Z","publishedAtDisplay":"June 21, 2024","unlisted":false},{"slug":"get-the-best-from-stable-diffusion-3","title":"How to get the best results from Stable Diffusion 3","intro":"We show you how to use Stable Diffusion 3 to get the best images, including new techniques for prompting.","image":"assets/blog/get-the-best-from-stable-diffusion-3/get-the-best-from-stable-diffusion-3.webp","authors":["fofr"],"publishedAt":"2024-06-18T00:00:00.000Z","publishedAtDisplay":"June 18, 2024","unlisted":false},{"slug":"run-stable-diffusion-3-on-apple-silicon-mac","title":"Run Stable Diffusion 3 on your Apple Silicon Mac","intro":"A step-by-step guide to generating images with Stable Diffusion 3 on your M-series Mac using MPS acceleration.","image":"assets/blog/sd3-mac-mps/cover.webp","authors":["zsxkib"],"publishedAt":"2024-06-18T00:00:00.000Z","publishedAtDisplay":"June 18, 2024","unlisted":false},{"slug":"push-a-custom-sd3","title":"Push a custom version of 
Stable Diffusion 3","intro":"Create your own custom version of Stability's latest image generation model and run it on Replicate via the web or API.","image":"assets/blog/push-a-custom-sd3/push-a-custom-sd3.webp","authors":["zeke"],"publishedAt":"2024-06-14T00:00:00.000Z","publishedAtDisplay":"June 14, 2024","unlisted":false},{"slug":"replicate-intelligence-2024-06-14","title":"Replicate Intelligence #4","intro":"Find concepts in GPT models, real-time speech to text in the browser, H100s are coming","authors":["deepfates"],"publishedAt":"2024-06-14T00:00:00.000Z","publishedAtDisplay":"June 14, 2024","unlisted":false},{"slug":"run-sd3-on-comfyui","title":"Run Stable Diffusion 3 on your own machine with ComfyUI","intro":"Copy and paste a few commands into terminal to play with Stable Diffusion 3 on your own GPU-powered machine.","image":"assets/blog/sd3-comfyui-steps/comfyui-sd3.webp","authors":["zsxkib","zeke"],"publishedAt":"2024-06-14T00:00:00.000Z","publishedAtDisplay":"June 14, 2024","unlisted":false},{"slug":"h100s-are-coming","title":"H100s are coming to Replicate","intro":"We'll soon support NVIDIA's H100 GPUs for predictions and training. Let us know if you want early access.","image":"assets/blog/h100s-are-coming/h100s-are-coming.webp","authors":["zeke"],"publishedAt":"2024-06-12T00:00:00.000Z","publishedAtDisplay":"June 12, 2024","unlisted":false},{"slug":"run-stable-diffusion-3-with-an-api","title":"Run Stable Diffusion 3 with an API","intro":"Stable Diffusion 3 is the latest text-to-image model from Stability, with improved image quality, typography, prompt understanding, and resource efficiency. 
Learn how to run it in the cloud with one line of code.","image":"assets/blog/stable-diffusion-3-api/stability-ai.webp","authors":["cbh123"],"publishedAt":"2024-06-12T00:00:00.000Z","publishedAtDisplay":"June 12, 2024","unlisted":false},{"slug":"replicate-intelligence-2024-06-07","title":"Replicate Intelligence #3","intro":"Garden State Llama, applied LLMs guide, real-time image generation","authors":["deepfates"],"publishedAt":"2024-06-07T00:00:00.000Z","publishedAtDisplay":"June 7, 2024","unlisted":false},{"slug":"replicate-intelligence-2024-05-31","title":"Replicate Intelligence #2","intro":"Faster image generation, AI-powered world simulator, insights on AI dataset complexity","authors":["deepfates"],"publishedAt":"2024-05-31T00:00:00.000Z","publishedAtDisplay":"May 31, 2024","unlisted":false},{"slug":"replicate-intelligence-2024-05-24","title":"Replicate Intelligence #1","intro":"DIY Llama 3 implementation, open-source smart glasses, steering language models with dictionary learning","authors":["deepfates"],"publishedAt":"2024-05-24T00:00:00.000Z","publishedAtDisplay":"May 24, 2024","unlisted":false},{"slug":"shared-network-vulnerability-disclosure","title":"Shared network vulnerability disclosure","authors":["nickstenning","philandstuff","zeke"],"publishedAt":"2024-05-23T00:00:00.000Z","publishedAtDisplay":"May 23, 2024","unlisted":false},{"slug":"run-arctic-with-an-api","title":"Run Snowflake Arctic with an API","intro":"Arctic is a new open-source language model from Snowflake. Learn how to run it in the cloud with one line of code.","image":"assets/blog/arctic-api/snowflake_arctic.png","authors":["cbh123"],"publishedAt":"2024-04-23T00:00:00.000Z","publishedAtDisplay":"April 23, 2024","unlisted":false},{"slug":"run-llama-3-with-an-api","title":"Run Meta Llama 3 with an API","intro":"Llama 3 is the latest language model from Meta. 
Learn how to run it in the cloud with one line of code.","image":"assets/blog/llama-3-api/meta.png","authors":["cbh123"],"publishedAt":"2024-04-18T00:00:00.000Z","publishedAtDisplay":"April 18, 2024","unlisted":false},{"slug":"run-codellama-with-an-api","title":"Run Code Llama 70B with an API","intro":"Code Llama 70B is one of the powerful open-source code generation models. Learn how to run it in the cloud with one line of code.","image":"assets/blog/codellama/codellama.png","authors":["cbh123"],"publishedAt":"2024-01-30T00:00:00.000Z","publishedAtDisplay":"January 30, 2024","unlisted":false},{"slug":"how-to-create-an-ai-narrator","title":"How to create an AI narrator for your life","intro":"Or, how I met a virtual David Attenborough.","image":"assets/blog/ai-narrator/2023-12-01_at_11.58.52.png","authors":["cbh123"],"publishedAt":"2023-12-06T00:00:00.000Z","publishedAtDisplay":"December 6, 2023","unlisted":false},{"slug":"how-to-tune-a-realistic-voice-clone","title":"Clone your voice using open-source models","intro":"We’ve added fine-tuning for realistic voice cloning (RVC). You can train RVC on your own dataset from a YouTube video with a few lines of code using Replicate's API.","image":"assets/blog/how-to-tune-a-realistic-voice-clone/rvc.jpg","authors":["zsxkib","fofr"],"publishedAt":"2023-12-06T00:00:00.000Z","publishedAtDisplay":"December 6, 2023","unlisted":false},{"slug":"series-b","title":"Businesses are building on open-source AI","intro":"We've raised a $40 million Series B led by a16z.","image":"assets/blog/series-b/goo-logo.jpg","authors":["bfirsh"],"publishedAt":"2023-12-05T00:00:00.000Z","publishedAtDisplay":"December 5, 2023","unlisted":false},{"slug":"run-yi-chat-with-api","title":"How to run Yi chat models with an API","intro":"The Yi series models are large language models trained from scratch by developers at 01.AI. 
Learn how to run them in the cloud with one line of code.","image":"assets/blog/run-yi-chat-with-api/Yi.svg","authors":["nateraw"],"publishedAt":"2023-11-23T00:00:00.000Z","publishedAtDisplay":"November 23, 2023","unlisted":false},{"slug":"replicate-scaffold","title":"Scaffold Replicate apps with one command","intro":"We've added a CLI command that makes it easy to get started with Replicate.","image":"assets/blog/ready-set-scaffold/scaffold-llama.jpg","authors":["jakedahn","mattrothenberg"],"publishedAt":"2023-11-22T00:00:00.000Z","publishedAtDisplay":"November 22, 2023","unlisted":false},{"slug":"run-bge-embedding-models","title":"Using open-source models for faster and cheaper text embeddings","intro":"An interactive example showing how to embed text using a state-of-the-art embedding model that beats OpenAI's embeddings API on price and performance.","image":"assets/blog/run-bge-embedding-models/cover.jpg","authors":["nateraw"],"publishedAt":"2023-11-10T00:00:00.000Z","publishedAtDisplay":"November 10, 2023","unlisted":false},{"slug":"generate-music-from-chord-progressions-musicgen-chord","title":"Generate music from chord progressions and text prompts with MusicGen-Chord","intro":"We’ve added chord conditioning to Meta’s MusicGen model, so you can create automatic backing tracks in any style using text prompts and chord progressions.","image":"assets/blog/generate-music-from-chord-progressions-musicgen-chord/cover.png","authors":["sakemin"],"publishedAt":"2023-11-08T00:00:00.000Z","publishedAtDisplay":"November 8, 2023","unlisted":false},{"slug":"run-latent-consistency-model-on-mac","title":"Generate images in one second on your Mac using a latent consistency model","intro":"How to run a latent consistency model on your M1 or M2 Mac","image":"assets/blog/run-latent-consistency-model-on-mac/cover.webp","authors":["fofr"],"publishedAt":"2023-10-25T00:00:00.000Z","publishedAtDisplay":"October 25, 
2023","unlisted":false},{"slug":"how-to-use-rag-with-chromadb-and-mistral-7b-instruct","title":"How to use retrieval augmented generation with ChromaDB and Mistral","intro":"In this post we'll explore the basics of retrieval augmented generation by creating an example app that uses bge-large-en for embeddings, ChromaDB for vector store, and mistral-7b-instruct for language model generation.","image":"assets/blog/how-to-use-rag-with-chromadb-and-mistral-7b-instruct/rag-cover-image.webp","authors":["jakedahn"],"publishedAt":"2023-10-17T00:00:00.000Z","publishedAtDisplay":"October 17, 2023","unlisted":false},{"slug":"fine-tune-musicgen","title":"Fine-tune MusicGen to generate music in any style","intro":"We’ve added fine-tuning support to MusicGen. You can train the small, medium and melody models on your own audio files using Replicate.","image":"assets/blog/fine-tune-musicgen/fine-tune-musicgen.webp","authors":["fofr","sakemin"],"publishedAt":"2023-10-13T00:00:00.000Z","publishedAtDisplay":"October 13, 2023","unlisted":false},{"slug":"llama-2-grammars","title":"Jet-setting with Llama 2 + Grammars","intro":"How to use Llama 2 models with grammars for information extraction tasks.","image":"assets/blog/llama-2-grammars/llama2-grammar.webp","authors":["mattt"],"publishedAt":"2023-10-09T00:00:00.000Z","publishedAtDisplay":"October 9, 2023","unlisted":false},{"slug":"run-mistral-7b-with-api","title":"How to run Mistral 7B with an API","intro":"Mistral 7B is an open-source large language model. 
Learn what it's good at and how to run it in the cloud with one line of code.","image":"assets/blog/demystifying-mistral-7b/mistral_box.jpeg","authors":["daanelson","zeke"],"publishedAt":"2023-10-06T00:00:00.000Z","publishedAtDisplay":"October 6, 2023","unlisted":false},{"slug":"animatediff-interpolator","title":"Make smooth AI generated videos with AnimateDiff and an interpolator","intro":"Combine AnimateDiff and the ST-MFNet frame interpolator to create smooth and realistic videos from a text prompt","image":"assets/blog/animatediff-interpolator/animatediff.webp","authors":["fofr","zsxkib"],"publishedAt":"2023-10-04T00:00:00.000Z","publishedAtDisplay":"October 4, 2023","unlisted":false},{"slug":"fine-tune-cold-boots","title":"Fine-tuned models now boot in less than one second","intro":"We've made some dramatic improvements to cold boots for fine-tuned models.","image":"assets/blog/fine-tune-cold-boots/fast-llamas.webp","authors":["andreasjansson"],"publishedAt":"2023-09-06T00:00:00.000Z","publishedAtDisplay":"September 6, 2023","unlisted":false},{"slug":"painting-with-words-a-history-of-text-to-image-ai","title":"Painting with words: a history of text-to-image AI","intro":"With the recent release of Stable Diffusion XL fine-tuning on Replicate, and today being the 1-year anniversary of Stable Diffusion, now feels like the perfect opportunity to take a step back and reflect on how text-to-image AI has improved over the last few years.","image":"assets/blog/painting-with-words-a-history-of-text-to-image-ai/sketch_of_internet_is_a_series_of_tubes_by_Leonardo_da_Vinci.png","authors":["jakedahn"],"publishedAt":"2023-08-22T00:00:00.000Z","publishedAtDisplay":"August 22, 2023","unlisted":false},{"slug":"cutting-prices-in-half","title":"We're cutting our prices in half","intro":"The price of public models is being cut in half, and soon we'll start charging new users for setup and idle time on private 
models.","image":"assets/blog/cutting-prices-in-half/out-3-1.png","authors":["bfirsh"],"publishedAt":"2023-08-16T00:00:00.000Z","publishedAtDisplay":"August 16, 2023","unlisted":false},{"slug":"how-to-prompt-llama","title":"A guide to prompting Llama 2","intro":"Learn the art of the Llama prompt.","image":"assets/blog/prompt-llama/llama-typing.png","authors":["cbh123"],"publishedAt":"2023-08-14T00:00:00.000Z","publishedAtDisplay":"August 14, 2023","unlisted":false},{"slug":"streaming","title":"Streaming output for language models","intro":"Our API now supports server-sent event streams for language models. Learn how to use them to make your apps more responsive.","image":"assets/blog/streaming/streaming.jpg","authors":["zeke"],"publishedAt":"2023-08-14T00:00:00.000Z","publishedAtDisplay":"August 14, 2023","unlisted":false},{"slug":"fine-tune-sdxl","title":"Fine-tune SDXL with your own images","intro":"We’ve added fine-tuning (Dreambooth, Textual Inversion and LoRA) support to SDXL 1.0. You can train SDXL on your own images with one line of code using the Replicate API.","image":"assets/blog/fine-tune-sdxl/out-3-8.png","authors":["andreasjansson","anotherjesse","cloneofsimo","daanelson"],"publishedAt":"2023-08-08T00:00:00.000Z","publishedAtDisplay":"August 8, 2023","unlisted":false},{"slug":"run-llama-2-with-an-api","title":"Run Llama 2 with an API","intro":"Llama 2 is the first open source language model of the same caliber as OpenAI’s models. 
Learn how to run it in the cloud with one line of code.","image":"assets/blog/llama-api/llama-clouds.png","authors":["joehoover"],"publishedAt":"2023-07-27T00:00:00.000Z","publishedAtDisplay":"July 27, 2023","unlisted":false},{"slug":"run-sdxl-with-an-api","title":"Run SDXL with an API","intro":"How to run Stable Diffusion XL 1.0 using the Replicate API","image":"assets/blog/run-sdxl-with-an-api/astronaut-riding-unicorn.webp","authors":["fofr"],"publishedAt":"2023-07-26T00:00:00.000Z","publishedAtDisplay":"July 26, 2023","unlisted":false},{"slug":"run-llama-locally","title":"A comprehensive guide to running Llama 2 locally","intro":"How to run Llama 2 on Mac, Linux, Windows, and your phone.","image":"assets/blog/run-llama-locally/llama-captain.jpg","authors":["zeke"],"publishedAt":"2023-07-22T00:00:00.000Z","publishedAtDisplay":"July 22, 2023","unlisted":false},{"slug":"fine-tune-llama-2","title":"Fine-tune Llama 2 on Replicate","intro":"So you want to train a llama...","image":"assets/blog/fine-tune-llama-2/llama-salon.png","authors":["cbh123"],"publishedAt":"2023-07-20T00:00:00.000Z","publishedAtDisplay":"July 20, 2023","unlisted":false},{"slug":"llama-2-roundup","title":"What happened with Llama 2 in the last 24 hours? 
🦙","intro":"A roundup of recent developments from the llamaverse following the second major release of Meta's open-source large language model.","image":"assets/blog/llama-2-roundup/llama2.jpg","authors":["cbh123","zeke"],"publishedAt":"2023-07-19T00:00:00.000Z","publishedAtDisplay":"July 19, 2023","unlisted":false},{"slug":"turn-your-llm-into-a-poet","title":"Make any large language model a better poet","intro":"Prompt engineering and training are often the first solutions we reach for to improve language model behavior, but they're not the only way.","image":"assets/blog/poet/poet.jpg","authors":["joehoover"],"publishedAt":"2023-05-26T00:00:00.000Z","publishedAtDisplay":"May 26, 2023","unlisted":false},{"slug":"new-status-page","title":"Status page","intro":"We've added a status page to provide real-time updates on the health of Replicate.","image":"assets/blog/status-page/nines.jpg","authors":["nickstenning","zeke"],"publishedAt":"2023-05-18T00:00:00.000Z","publishedAtDisplay":"May 18, 2023","unlisted":false},{"slug":"language-model-roundup","title":"Language model roundup, April 2023","intro":"A roundup of recent developments from the world of open-source language models.","image":"assets/blog/language-model-roundup/language-model-roundup.jpg","authors":["joehoover","mattt","zeke"],"publishedAt":"2023-04-21T00:00:00.000Z","publishedAtDisplay":"April 21, 2023","unlisted":false},{"slug":"autocog","title":"AutoCog — Generate Cog configuration with GPT-4","intro":"Give it a machine learning directory and AutoCog will create predict.py and cog.yaml until it successfully runs a prediction","image":"assets/blog/autocog/autocog.png","authors":["andreasjansson"],"publishedAt":"2023-04-19T00:00:00.000Z","publishedAtDisplay":"April 19, 2023","unlisted":false},{"slug":"language-models","title":"Language models are on 
Replicate","intro":"","image":"assets/blog/language-models/out-2.png","authors":["bfirsh"],"publishedAt":"2023-04-05T00:00:00.000Z","publishedAtDisplay":"April 5, 2023","unlisted":false},{"slug":"fine-tune-alpaca-with-lora","title":"How to use Alpaca-LoRA to fine-tune a model like ChatGPT","intro":"","image":"assets/blog/fine-tune-alpaca-with-lora/alpaca-lora.jpg","authors":["andreasjansson","daanelson","zeke"],"publishedAt":"2023-03-23T00:00:00.000Z","publishedAtDisplay":"March 23, 2023","unlisted":false},{"slug":"llama-roundup","title":"Week 3 of LLaMA 🦙","intro":"A roundup of recent developments from the llamaverse.","image":"assets/blog/llama-roundup/llama-astronaut.jpg","authors":["zeke"],"publishedAt":"2023-03-18T00:00:00.000Z","publishedAtDisplay":"March 18, 2023","unlisted":false},{"slug":"fine-tune-llama-to-speak-like-homer-simpson","title":"Fine-tune LLaMA to speak like Homer Simpson","intro":"With a small amount of data and an hour of training you can make LLaMA output text in the voice of the dataset.","image":"assets/blog/homer/robot-homer.webp","authors":["bfirsh"],"publishedAt":"2023-03-17T00:00:00.000Z","publishedAtDisplay":"March 17, 2023","unlisted":false},{"slug":"replicate-alpaca","title":"Train and run Stanford Alpaca on your own machine","intro":"We'll show you how to train Alpaca, a fine-tuned version of LLaMA that can respond to instructions like ChatGPT.","image":"assets/blog/replicate-alpaca/party-alpaca.png","authors":["zeke"],"publishedAt":"2023-03-16T00:00:00.000Z","publishedAtDisplay":"March 16, 2023","unlisted":false},{"slug":"machine-learning-needs-better-tools","title":"Machine learning needs better tools","intro":"Lots of people want to build things with machine learning, but they don't have the expertise to use it.","image":"assets/blog/machine-learning-is-just-software/cover.png","authors":["bfirsh"],"publishedAt":"2023-02-21T00:00:00.000Z","publishedAtDisplay":"February 21, 
2023","unlisted":false},{"slug":"lora-faster-fine-tuning-of-stable-diffusion","title":"Introducing LoRA: A faster way to fine-tune Stable Diffusion","intro":"It's like DreamBooth, but much faster. And you can run it in the cloud on Replicate.","image":"assets/blog/lora-api/lora-api.png","authors":["cloneofsimo","andreasjansson","anotherjesse","zeke"],"publishedAt":"2023-02-07T00:00:00.000Z","publishedAtDisplay":"February 7, 2023","unlisted":false},{"slug":"dreambooth-api","title":"Train and deploy a DreamBooth model on Replicate","intro":"With just a handful of images and a single API call, you can train a model, publish it to Replicate, and run predictions on it in the cloud.","image":"assets/blog/dreambooth-api/Untitled.png","authors":["bfirsh","zeke"],"publishedAt":"2022-11-21T00:00:00.000Z","publishedAtDisplay":"November 21, 2022","unlisted":false},{"slug":"run-stable-diffusion-on-m1-mac","title":"Run Stable Diffusion on your M1 Mac’s GPU","intro":"How to run Stable Diffusion locally so you can hack on it","image":"assets/blog/run-stable-diffusion-on-m1-mac/grid-0002.png","authors":["bfirsh"],"publishedAt":"2022-08-31T00:00:00.000Z","publishedAtDisplay":"August 31, 2022","unlisted":false},{"slug":"run-stable-diffusion-with-an-api","title":"Run Stable Diffusion with an API","intro":"How to use Replicate to integrate Stable Diffusion into hacks, apps, and projects","image":"assets/blog/run-stable-diffusion-with-an-api/out-0-3.png","authors":["zeke"],"publishedAt":"2022-08-29T00:00:00.000Z","publishedAtDisplay":"August 29, 2022","unlisted":false},{"slug":"build-a-robot-artist-for-your-discord-server-with-stable-diffusion","title":"Build a robot artist for your Discord server with Stable Diffusion, Replicate, and Fly.io","intro":"A tutorial for building a chat bot that replies to prompts with the output of a text-to-image 
model.","image":"assets/blog/discord-bot/dreaming-of-rabbits.png","authors":["zeke,","evilstreak","bfirsh"],"publishedAt":"2022-08-25T00:00:00.000Z","publishedAtDisplay":"August 25, 2022","unlisted":false},{"slug":"uncanny-spaces","title":"Join us at Uncanny Spaces","intro":"We're bringing people together to explore what's being created with machine learning.","authors":["rossjillian"],"publishedAt":"2022-08-11T00:00:00.000Z","publishedAtDisplay":"August 11, 2022","unlisted":false},{"slug":"grab-hundreds-of-images-with-clip-and-laion","title":"Automating image collection","intro":"Using CLIP and LAION5B to collect thousands of captioned images.","authors":["afiaka87"],"publishedAt":"2022-08-05T00:00:00.000Z","publishedAtDisplay":"August 5, 2022","unlisted":false},{"slug":"exploring-text-to-image-models","title":"Exploring text to image models","intro":"The basics of using the API to create your own images from text.","authors":["afiaka87","rossjillian"],"publishedAt":"2022-07-18T00:00:00.000Z","publishedAtDisplay":"July 18, 2022","unlisted":false},{"slug":"model-docs","title":"A new template for model READMEs","intro":"Inspired by model cards, we've created templates for documenting models on Replicate.","authors":["rossjillian","zeke"],"publishedAt":"2022-07-05T00:00:00.000Z","publishedAtDisplay":"July 5, 2022","unlisted":false},{"slug":"constraining-clipdraw","title":"Constraining CLIPDraw","intro":"An introduction to differentiable programming and the process of refining generative art models.","authors":["evilstreak"],"publishedAt":"2022-05-27T00:00:00.000Z","publishedAtDisplay":"May 27, 2022","unlisted":false},{"slug":"hello-world","title":"Hello, world!","intro":"We're a small team of engineers and machine learning enthusiasts working to make machine learning more accessible.","authors":["evilstreak","zeke"],"publishedAt":"2022-05-16T00:00:00.000Z","publishedAtDisplay":"May 16, 2022","unlisted":false}]}},"actionData":null,"errors":null}};</script><script 
type="module" async>
// Client bootstrap for this page.
// Loads the manifest script and the three route modules, publishes the route
// modules on window.__remixRouteModules, then loads the client entry script.
import "/frontend-assets/manifest-67830084.js";
import * as route0 from "/frontend-assets/root-BP_mC3Sm.js";
import * as route1 from "/frontend-assets/layout-lnCEgoRq.js";
import * as route2 from "/frontend-assets/index-Cu5O9l-Z.js";

// Module namespaces keyed by string id (presumably the route ids the client
// entry looks up -- confirm against the entry script).
window.__remixRouteModules = {"root":route0,"routes/blog/layout":route1,"routes/blog/index":route2};

// Dynamic import: starts loading only after the assignment above has run.
import("/frontend-assets/entry.client-BS4mLQdq.js");
</script><div style="position:fixed;z-index:9999;top:16px;left:16px;right:16px;bottom:16px;pointer-events:none"></div><script>
// Scroll restoration, run inline while the document is being parsed.
//
// STORAGE_KEY: sessionStorage key holding a JSON object that maps a key to a
//              numeric vertical scroll offset.
// restoreKey:  explicit key to look up; when falsy, the current history
//              entry's `state.key` is used instead.
((STORAGE_KEY, restoreKey) => {
  // Give the current history entry a random key if it does not have one, so
  // the lookup below always has something to index with.
  if (!window.history.state || !window.history.state.key) {
    let key = Math.random().toString(32).slice(2);
    window.history.replaceState({ key }, "");
  }

  try {
    let positions = JSON.parse(sessionStorage.getItem(STORAGE_KEY) || "{}");
    let storedY = positions[restoreKey || window.history.state.key];
    // Only scroll when a numeric offset was actually stored for this key.
    if (typeof storedY === "number") {
      window.scrollTo(0, storedY);
    }
  } catch (error) {
    console.error(error);
    // Drop the stored value so a corrupt entry is not re-parsed on the next
    // load. The cleanup is guarded separately: if the failure above was the
    // storage access itself being denied, touching sessionStorage again
    // throws too, and that second error must not escape as uncaught.
    try {
      sessionStorage.removeItem(STORAGE_KEY);
    } catch {
      // Storage is unavailable; there is nothing to clean up.
    }
  }
})("positions", null)
</script></body></html>