[{"@context":"https:\/\/schema.org\/","@type":"BlogPosting","@id":"https:\/\/blog.terabox.com\/insights\/future-of-ai-inference-base-10-tuhans-srivastava#BlogPosting","mainEntityOfPage":"https:\/\/blog.terabox.com\/insights\/future-of-ai-inference-base-10-tuhans-srivastava","headline":"AI Inference at Scale: Interview with Base 10 CEO","name":"AI Inference at Scale: Interview with Base 10 CEO","description":"\ud83d\udcfa Today\u2019s recommended deep-dive video: https:\/\/www.youtube.com\/watch?v=XAbKflCncDo Scaling the Frontier: Tuhans Srivastava on the Future of AI Inference and the Compute CrunchThe Transition to Custom AIThe Infrastructure Reality CheckTalent and the Multi-Chip FutureKey TakeawaysQ&A Scaling the Frontier: Tuhans Srivastava on the... ","datePublished":"2026-06-24","dateModified":"2026-06-24","author":{"@type":"Person","@id":"https:\/\/blog.terabox.com\/author\/flextech-admin\/#Person","name":"flextech-admin","url":"https:\/\/blog.terabox.com\/author\/flextech-admin\/","image":{"@type":"ImageObject","@id":"https:\/\/secure.gravatar.com\/avatar\/ad516503a11cd5ca435acc9bb6523536?s=150&d=mm&r=g&forcedefault=1","url":"https:\/\/secure.gravatar.com\/avatar\/ad516503a11cd5ca435acc9bb6523536?s=150&d=mm&r=g&forcedefault=1","height":96,"width":96}},"publisher":{"@type":"Organization","name":"terabox","logo":{"@type":"ImageObject","@id":"http:\/\/blog.terabox.com\/wp-content\/uploads\/2021\/11\/logo\u4ea7\u54c1\u540d-\u7ad6\u7248.png","url":"http:\/\/blog.terabox.com\/wp-content\/uploads\/2021\/11\/logo\u4ea7\u54c1\u540d-\u7ad6\u7248.png","width":900,"height":900}},"image":{"@type":"ImageObject","@id":"https:\/\/img.youtube.com\/vi\/XAbKflCncDo\/maxresdefault.jpg","url":"https:\/\/img.youtube.com\/vi\/XAbKflCncDo\/maxresdefault.jpg"},"url":"https:\/\/blog.terabox.com\/insights\/future-of-ai-inference-base-10-tuhans-srivastava","video":{"@context":"http:\/\/schema.org\/","@type":"VideoObject","@id":"https:\/\/www
.youtube.com\/watch?v=XAbKflCncDo#VideoObject","contentUrl":"https:\/\/www.youtube.com\/watch?v=XAbKflCncDo","name":"Baseten CEO Tuhin Srivastava on Custom Models, and Building the Inference Cloud","description":"Baseten CEO and co-founder Tuhin Srivastava sits down with Sarah Guo and Elad Gil to discuss the rapid growth of AI inference demand, Baseten\u2019s 30x growth, and why inference is becoming the strategic \u201clast market.\u201d Tuhin Srivastava argues the application layer will persist because companies with unique user signals can encode value into workflows and post-train specialized models, citing examples like Abridge and support workflows. The conversation covers GPU capacity constraints, Baseten\u2019s multi-cloud fabric across 18 clouds and 90 clusters, long-term contracting dynamics, the importance of the software layer for stickiness, evolving workloads, multichip possibilities, and operational lessons at scale.\nSign up for new podcasts every week. Email feedback to show@no-priors.com\nFollow us on Twitter: @NoPriorsPod | @Saranormous | @EladGil | @Tuhinone \nChapters:\n00:31 Baseten growth\n01:55 Why the app layer wins\n05:57 Serving frontier customers\n07:55 Open source model mix\n09:21 Chinese models and geopolitics\n13:07 Custom inference dominates\n14:22 Post training acquisition\n17:10 When to invest in custom models\n18:35 Supply crunch and data centers\n22:25 Longer GPU Contracts\n24:09 What Makes a Winner\n26:07 Multi Chip Future\n28:19 Runtime Roadmap\n31:08 Scaling Edge Cases\n33:48 Hiring and Leadership\n36:44 Operations Pager Culture\n38:19 Efficiency Drives Demand\n40:41 Concierge Everything Future\n42:34 
Conclusion","thumbnailUrl":["https:\/\/i.ytimg.com\/vi\/XAbKflCncDo\/default.jpg","https:\/\/i.ytimg.com\/vi\/XAbKflCncDo\/mqdefault.jpg","https:\/\/i.ytimg.com\/vi\/XAbKflCncDo\/hqdefault.jpg","https:\/\/i.ytimg.com\/vi\/XAbKflCncDo\/sddefault.jpg","https:\/\/i.ytimg.com\/vi\/XAbKflCncDo\/maxresdefault.jpg"],"uploadDate":"2026-05-01T15:07:25+00:00","duration":"PT42M58S","embedUrl":"https:\/\/www.youtube.com\/embed\/XAbKflCncDo","publisher":{"@type":"Organization","@id":"https:\/\/www.youtube.com\/channel\/UCSI7h9hydQ40K5MJHnCrQvw#Organization","url":"https:\/\/www.youtube.com\/channel\/UCSI7h9hydQ40K5MJHnCrQvw","name":"No Priors: AI, Machine Learning, Tech, & Startups","description":"Your guide to the AI revolution, co-hosts Elad Gil and Sarah Guo talk to the world's leading engineers, researchers and founders about the biggest questions:\n\nHow far away is AGI? What markets are at risk for disruption? How will commerce, culture, and society change? What\u2019s happening in state-of-the-art in research? Email feedback to show@no-priors.com.\n\nSarah Guo is a startup investor and the founder of Conviction, an investment firm purpose-built to serve intelligent software, or \"Software 3.0\" companies. She spent nearly a decade incubating and investing at venture firm Greylock Partners.\n\nElad Gil is a serial entrepreneur and a startup investor. He was co-founder of Color Health, Mixer Labs (which was acquired by Twitter). 
He has invested in over 40 companies now worth $1B or more each, and is also author of the High Growth Handbook.\n","logo":{"url":"https:\/\/yt3.ggpht.com\/HQXIpkLms_iVMi_Ob5Cie3PNcZ3smOT7HeNLIAWvBO-lZMdiax2N5LH1blWMxUtMrJCcXyNZ=s800-c-k-c0x00ffffff-no-rj","width":800,"height":800,"@type":"ImageObject","@id":"https:\/\/www.youtube.com\/watch?v=XAbKflCncDo#VideoObject_publisher_logo_ImageObject"}},"potentialAction":{"@type":"SeekToAction","@id":"https:\/\/www.youtube.com\/watch?v=XAbKflCncDo#VideoObject_potentialAction","target":"https:\/\/www.youtube.com\/watch?v=XAbKflCncDo&t={seek_to_second_number}","startOffset-input":"required name=seek_to_second_number"},"interactionStatistic":[{"@type":"InteractionCounter","@id":"https:\/\/www.youtube.com\/watch?v=XAbKflCncDo#VideoObject_interactionStatistic_WatchAction","interactionType":{"@type":"WatchAction"},"userInteractionCount":6715},{"@type":"InteractionCounter","@id":"https:\/\/www.youtube.com\/watch?v=XAbKflCncDo#VideoObject_interactionStatistic_LikeAction","interactionType":{"@type":"LikeAction"},"userInteractionCount":92}]},"about":["Insights","\u300eEnglish\u300f"],"wordCount":1336,"keywords":["download"]},{"@context":"https:\/\/schema.org\/","@type":"BreadcrumbList","itemListElement":[{"@type":"ListItem","position":1,"name":"Insights","item":"https:\/\/blog.terabox.com\/insights\/#breadcrumbitem"},{"@type":"ListItem","position":2,"name":"AI Inference at Scale: Interview with Base 10 CEO","item":"https:\/\/blog.terabox.com\/insights\/future-of-ai-inference-base-10-tuhans-srivastava#breadcrumbitem"}]}]