<!DOCTYPE html><html lang="en"><head><meta http-equiv="Content-Type" content="text/html; charset=UTF-8"><meta charset="UTF-8"><meta name="viewport" content="width=device-width"><meta name="x-apple-disable-message-reformatting"><title>TLDR Data</title><meta name="color-scheme" content="light dark"><meta name="supported-color-schemes" content="light dark"><style type="text/css">
/* ---------- Colour-scheme opt-in ---------- */
/* Declares that the document supports both light and dark schemes. */
:root {
  color-scheme: light dark;
  supported-color-schemes: light dark;
}

/* ---------- Global resets ---------- */
/* Border-box sizing for every element and its generated pseudo-elements. */
*, *:after, *:before {
  -webkit-box-sizing: border-box;
  -moz-box-sizing: border-box;
  box-sizing: border-box;
}

/* Pin vendor text-size adjustment to 100%. */
* {
  -ms-text-size-adjust: 100%;
  -webkit-text-size-adjust: 100%;
}

/* The page and the outer .document table fill the viewport with no margin or padding. */
html, body, .document {
  width: 100% !important;
  height: 100% !important;
  margin: 0;
  padding: 0;
}

/* Font rendering hints. */
body {
  -webkit-font-smoothing: antialiased;
  -moz-osx-font-smoothing: grayscale;
  text-rendering: optimizeLegibility;
}

/* Zero the margin of any div whose inline style contains "margin: 16px 0".
   NOTE(review): presumably a workaround for a client that injects that margin; confirm. */
div[style*="margin: 16px 0"] {
  margin: 0 !important;
}

/* ---------- Tables and images ---------- */
/* Remove the mso left/right table spacing. */
table, td {
  mso-table-lspace: 0pt;
  mso-table-rspace: 0pt;
}

/* Collapsed, fixed-layout tables centred with auto side margins. */
table {
  border-spacing: 0;
  border-collapse: collapse;
  table-layout: fixed;
  margin: 0 auto;
}

/* Images never exceed their container and carry no border. */
img {
  -ms-interpolation-mode: bicubic;
  max-width: 100%;
  border: 0;
}

/* ---------- Client-specific hooks ---------- */
/* Elements carrying the x-apple-data-detectors attribute inherit colour and lose decoration. */
*[x-apple-data-detectors] {
  color: inherit !important;
  text-decoration: none !important;
}

/* Strip the bottom border and pointer cursor from these client-added classes. */
.x-gmail-data-detectors, .x-gmail-data-detectors *, .aBn {
  border-bottom: 0 !important;
  cursor: default !important;
}

/* ---------- Buttons ---------- */
.btn {
  -webkit-transition: all 200ms ease;
  transition: all 200ms ease;
}

.btn:hover {
  background-color: #f67575;
  border-color: #f67575;
}

/* ---------- Base typography ---------- */
/* Applies to every element; inline styles override the size where needed. */
* {
  font-family: Arial, Helvetica, sans-serif;
  font-size: 18px;
}

/* ---------- Narrow screens (600px and below) ---------- */
@media screen and (max-width: 600px) {
  /* Containers become fluid. */
  .container {
    width: 100%;
    margin: auto;
  }

  /* .stack elements become full-width blocks. */
  .stack {
    display: block!important;
    width: 100%!important;
    max-width: 100%!important;
  }

  /* Buttons become full-width and centred. */
  .btn {
    display: block;
    width: 100%;
    text-align: center;
  }
}

/* ---------- Light palette (default) ---------- */
body, p, td, tr, .body, table, h1, h2, h3, h4, h5, h6, div, span {
  background-color: #FEFEFE !important;
  color: #010101 !important;
}

/* ---------- Dark palette ---------- */
/* Same selector list as the light palette, applied when the client reports a dark preference. */
@media (prefers-color-scheme: dark) {
  body, p, td, tr, .body, table, h1, h2, h3, h4, h5, h6, div, span {
    background-color: #27292D !important;
    color: #FEFEFE !important;
  }
}

/* ---------- Links ---------- */
/* Links take the surrounding text colour and are always underlined. */
a {
  color: inherit !important;
  text-decoration: underline !important;
}
</style><!--[if mso | ie]>
<style type="text/css">
  /* Explicit link colours for clients that evaluate the enclosing conditional comment. */
  a {
    background-color: #FEFEFE !important;
    color: #010101 !important;
  }

  /* Dark-preference counterpart of the link colours above. */
  @media (prefers-color-scheme: dark) {
    a {
      background-color: #27292D !important;
      color: #FEFEFE !important;
    }
  }
</style>
<![endif]--></head><body class="">
<div style="display: none; max-height: 0px; overflow: hidden;">Quack is a new client-server protocol that lets separate DuckDB instances communicate over HTTP instead of only running in-process β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β </div>
<div style="display: none; max-height: 0px; overflow: hidden;">
<br>
</div>
<table align="center" class="document"><tbody><tr><td valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" class="container" width="600"><tbody><tr class="inner-body"><td>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr class="header"><td bgcolor="" class="container">
<table width="100%"><tbody><tr><td class="container">
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" style="margin-top: 0px;" width="100%"><tbody><tr><td style="padding: 0px;">
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div style="text-align: center;">
<span style="margin-right: 0px;"><a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Ftldr.tech%2Fdata%3Futm_source=tldrdata/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/jUU6U1lWzTuUxPsaQ5h9qTpozHpPW91eVQuaNapcSoY=452" rel="noopener noreferrer" target="_blank"><span>Sign Up</span></a>
|<span style="margin-right: 2px; margin-left: 2px;"><a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fadvertise.tldr.tech%3Futm_source=tldrdata%26utm_medium=newsletter%26utm_campaign=advertisetopnav/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/_jFlxnLNZenlMP9vBfCf070eyOGVw4G38ehRMtKRR20=452" rel="noopener noreferrer" target="_blank"><span>Advertise</span></a></span>|<span style="margin-left: 2px;"><a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fa.tldrnewsletter.com%2Fweb-version%3Fep=1%26lc=1670a604-84b7-11f0-bcf5-55fc1d40139c%26p=777216a8-4f6f-11f1-a634-bf7d98d39e9f%26pt=campaign%26t=1778753289%26s=0e13df01d4b43d4d49b896cdd2fbc10ff806e02510c6a12e918d5136b4749796/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/WpevjiKGyPKbN2Im4a1sdRedJ_jPAcY_E3xVQJQfiCI=452"><span>View Online</span></a></span>
<br>
</span></div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="text-align: center;"><span data-darkreader-inline-color="" style="--darkreader-inline-color:#3db3ff; color: rgb(51, 175, 255) !important; font-size: 30px;">T</span><span style="font-size: 30px;"><span data-darkreader-inline-color="" style="color: rgb(232, 192, 96) !important; --darkreader-inline-color:#e8c163; font-size:30px;">L</span><span data-darkreader-inline-color="" style="color: rgb(101, 195, 173) !important; --darkreader-inline-color:#6ec7b2; font-size:30px;">D</span></span><span data-darkreader-inline-color="" style="--darkreader-inline-color:#dd6e6e; color: rgb(220, 107, 107) !important; font-size: 30px;">R</span>
<br>
</td></tr></tbody></table>
<br>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr id="together-with"><td align="center" height="20" style="vertical-align:middle !important;" valign="middle" width="100%"><strong style="vertical-align:middle !important; height: 100%;">Together With </strong>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.fivetran.com%2Fresources%2Freports%2Fthe-2026-agentic-ai-readiness-index/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/48QsbUfwG1m2P4dkGK9j-EI68wUlaV38ogkhxbk9N9o=452"><img src="https://images.tldr.tech/fivetran.png" valign="middle" style="vertical-align: middle !important; height: 100%;" alt="Fivetran"></a></td></tr></tbody></table>
<table style="table-layout: fixed; width:100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;">
<div style="text-align: center;">
<h1><strong>TLDR Data <span id="date">2026-05-14</span></strong></h1>
</div>
</td></tr></tbody></table>
<table style="table-layout: fixed; width:100%;" width="100%"><tbody><tr id="sponsy-copy"><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.fivetran.com%2Fresources%2Freports%2Fthe-2026-agentic-ai-readiness-index/2/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/q35mDgQQ31tXaU7OFHuQPfYzSTHTL00GG9Zz6hOsFfE=452">
<span>
<strong>Fewer than 1 in 6 companies have the data foundation for agentic AI. $$$ is being spent anyway (Sponsor)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
<strong>Nearly half of orgs say data quality & lineage are the biggest obstacle to scaling agentic AI. Most are investing millions to tens of millions of $ anyway.</strong><p></p><p><a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.fivetran.com%2Fresources%2Freports%2Fthe-2026-agentic-ai-readiness-index/3/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/x5omch1Wb3vaLnRBUIWuscy7ufekksea4c1wVPG-gW4=452" rel="noopener noreferrer nofollow" target="_blank"><span>Fivetran's agentic AI readiness index</span></a> shows why most companies aren't realizing the full value of AI. Read it to learn why:</p>
<ul>
<li>Only 15% of teams are prepared for agentic AI at scale</li>
<li>Governance and compliance issues are stalling AI projects</li>
<li><a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.fivetran.com%2Fblog%2Fwhat-is-open-data-infrastructure/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/i1tAAI62TpLA5dWwYy0kXAuBsLm0OJTL3hwTHEEaOGg=452" rel="noopener noreferrer nofollow" target="_blank"><span>Open Data Infrastructure</span></a> is emerging as the new agentic standard</li>
</ul>
<p>If you're trying to deliver autonomous AI systems, start with the foundation. <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.fivetran.com%2Fresources%2Freports%2Fthe-2026-agentic-ai-readiness-index/4/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/xe70Urp9gFWiTnhl2RAsG1AmT1RmE8lhQLPxv03UPRA=452" rel="noopener noreferrer nofollow" target="_blank"><span>Get the index</span></a><strong> </strong>and <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Ffivetran.com%2Fsignup%3Futm_medium=paid_listing%26utm_source=tldr%26utm_campaign=2026-May-14-TLDR-Data-sponsorship%26utm_content=newsletter%26utm_term=default/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/tQ33RudKo42Jr5vuuSBwTQ3BB6y-5oaRb6WVfP36Mk8=452" rel="noopener noreferrer nofollow" target="_blank"><span>try Fivetran with a free account</span></a>.
</p>
</span></span></div>
</td></tr></tbody></table>
</td></tr></tbody></table>
</td></tr></tbody></table>
</td></tr>
<tr bgcolor=""><td class="container">
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td style="padding: 0px;">
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">📱</span></div></div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;">
<h1><strong>Deep Dives</strong></h1>
</div>
</div>
</td></tr></tbody></table>
<table style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Flinks.tldrnewsletter.com%2FTs162V/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/NLhBseeuvR7Lri5q3fiZ7aM5tLtZZQtoYjvfrH37Ep4=452">
<span>
<strong>Data Projects: Managing Data Assets at Netflix Scale (6 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Netflix introduced Data Projects to replace brittle ACLs and human-owned workflow identities across millions of tables and thousands of jobs. Projects group tables, workflows, secrets, and assets under durable team-owned app identities, with scoped roles and tokens to reduce permission churn.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Flinks.tldrnewsletter.com%2FBdrSPI/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/tuiLD93JT4Eb66HxHavVQr52X9b3jMr01xyklXdG8dY=452">
<span>
<strong>When 36,000 Tiny Files Break Your Spark Pipeline: A Deep Dive into S3 DNS Exhaustion and the Small File Problem (9 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Thousands of tiny Parquet files on S3 can break Spark reads with UnknownHostException, even when networking is fine, by overwhelming DNS, S3 LIST/GET calls, and driver/task metadata. Spark partition tuning can help stabilize reads, but the real fix is compaction and table formats like Delta Lake or Iceberg.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Flinks.tldrnewsletter.com%2FnSa2pQ/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/F4Py2IVtMaenbpIQRxzjUrai7jP2buFszXcvd2H_VpA=452">
<span>
<strong>Why your AI agent has amnesia and why forgetting is the fix (16 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Enterprise AI agents fail in long workflows because they reset, lose context, and rely on bloated prompts or flat vector search. Microsoft's memory architecture uses consolidation, forgetting, and delayed maturation to keep high-value events, reaching 97.2% retention precision and stabilizing around 400 to 500 memories.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fengineering.fb.com%2F2026%2F05%2F12%2Fdata-infrastructure%2Fmigrating-data-ingestion-systems-at-meta-scale%2F%3Futm_source=tldrdata/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/cJ1MkFny0txQGC5MyWZrNsCO2VCuYBYSmedOH2NiJ_Q=452">
<span>
<strong>Migrating Data Ingestion Systems at Meta Scale (8 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Meta migrated its massive data ingestion system from legacy customer-owned pipelines to a simpler self-managed service using a phased Shadow → Reverse Shadow → Cleanup lifecycle, row count and checksum checks, automated promotion tooling, custom debugging infrastructure, and rollback mechanisms to prevent bad CDC data propagation.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">🚀</span></div>
</div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;">
<h1><strong>Opinions & Advice</strong></h1>
</div>
</div>
</td></tr></tbody></table>
<table style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linkedin.com%2Fpulse%2Flakehouse-statistics-why-query-engines-get-lost-neil-carson-agnac%2F%3Futm_source=tldrdata/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/qjjQW3DvgYV6Pz9JeDMM00By4OvBr-qLRO_9F1gozck=452">
<span>
<strong>Lakehouse statistics and why query engines get lost (6 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Lakehouse query engines often struggle because the statistical metadata they need to plan queries, skip irrelevant data, size joins, and handle skew is optional, inconsistent, or missing across formats like Iceberg, Delta Lake, and Parquet. Without reliable stats, engines are forced to guess, leading to bad query plans, wasted reads, higher costs, memory issues, and slow or failed queries.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fpracticaldatamodeling.substack.com%2Fp%2Fapril-2026-pdc-state-of-data-modeling%3Futm_source=tldrdata/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/z7_chI_idql1Tqg5XdBgfPJw6Sj0VSC3hrUvY1P43i4=452">
<span>
<strong>April 2026 PDC State of Data Modeling Survey Results Are In! (9 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
A 334-response April 2026 pulse survey shows data modeling pain is overwhelmingly organizational, not tooling: 28.1% want training, 24.6% clearer requirements, 21.6% more time, 21.0% dedicated ownership, and only 4.8% better tools. Modeling is often owned by whoever builds pipelines (42.5%), while only 19.2% have a dedicated modeler or architect, and 68.3% refactor only occasionally or rarely. Teams with enforced standards are about 5x more likely to say their models hold up.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fdatabased.pedramnavid.com%2Fp%2Fwe-need-to-talk-about-dbt%3Futm_source=tldrdata/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/geuqMLJ_5e3i1pYfCkt9SRlq7vwCI4_CBBsYn9aCZ4w=452">
<span>
<strong>We need to talk about dbt (5 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
dbt's growth has created tension between its practitioner-led roots and enterprise ambitions. dbt must better protect community trust, improve dbt Core, strengthen integrations, fix developer ergonomics, and make dbt Cloud feel like a real IDE. The risk is not adoption, but alienating the users who made dbt valuable.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">💻</span></div>
</div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;">
<h1><strong>Launches & Tools</strong></h1>
</div>
</div>
</td></tr></tbody></table>
<table style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fduckdb.org%2F2026%2F05%2F12%2Fquack-remote-protocol.html%3Futm_source=tldrdata/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/-rRCTxwrNb3ChDHpx7PURI_Wv9acikHMyrKOS5NCPQ4=452">
<span>
<strong>Quack: The DuckDB Client-Server Protocol (12 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Quack is a new client-server protocol that lets separate DuckDB instances communicate over HTTP instead of only running in-process. It uses a request/response model with custom application/duckdb serialization, default token-based auth, localhost binding, and no SSL by default for local use, while supporting remote connections through standard HTTP infrastructure.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fboringsql.com%2Fposts%2Fstrong-views%2F%3Futm_source=tldrdata/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/BLKNk3ylKJIaOzUwFtoxatmf92GF9i34dEpHze89SXk=452">
<span>
<strong>Strong views on PostgreSQL VIEWs (19 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Views are just stored rewrite rules (macros) that get expanded at query time. They behave like tables for simple cases, but create hidden complexity through nested spirals, fragile dependencies on attribute numbers, painful schema changes, and limited writability, often leading to the classic advice: “use them, but don't treat them like tables.”
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.streamingdata.tech%2Fp%2Fcan-kafka-queues-make-consumers-faster-part-2%3Futm_source=tldrdata/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/tIt5frVfVsuhdf9aDqco13xkv3OSYtfH6lXDsl7qBHw=452">
<span>
<strong>Can Kafka Queues Make Consumers Faster? Part 2: Head-Of-Line Blocking (4 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Kafka Queues (Share Groups) shine when consumer processing involves delays or external I/O that causes Head-Of-Line Blocking. By allowing more consumer instances than partitions, share groups enable linear scaling of throughput (tested up to 8x with 32 instances) with no noticeable per-instance overhead, making them very effective for I/O-bound workloads.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">🎁</span></div></div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><h1><strong>Miscellaneous</strong></h1></div>
</div>
</td></tr></tbody></table>
<table bgcolor="" style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="http://tracking.tldrnewsletter.com/CL0/http:%2F%2Fsoftwaredoug.com%2Fblog%2F2026%2F05%2F11%2Fthe-new-agentic-search-models.html%3Futm_source=tldrdata/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/XB4ciBxetWDXW5XDnEaE-hhUOnjoYFraFX4Uyld6GHE=452">
<span>
<strong>Agentic search models (3 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Agentic search models are emerging to orchestrate the full retrieval workflow, replacing today's brittle stack of embeddings, rerankers, query classifiers, and BM25 with thinner backend primitives. Unlike frontier LLMs that handle the “80% case,” models trained specifically for search can encode domain-specific intent and the “last 20%” of retrieval nuances, improving relevance in narrow contexts like e-commerce or job search. Early examples such as SID-1 and Waldo emphasize smaller size and lower latency.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.datagibberish.com%2Fp%2Fstop-starting-data-projects%3Futm_source=tldrdata/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/IZLLB9bslnIggRI9k5qUGxFVYLxMe2f6iDIaImYsT_I=452">
<span>
<strong>Stop Starting Data Projects (9 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Many data projects fail not because of technical issues, but because engineers jump straight into building without properly understanding the stakeholders' real needs and processes. Instead, start by asking the stakeholder to walk through their current workflow, create a one-sentence Definition of Done, ship an ugly MVP, and iterate on it to turn vague requests into shipped, adopted work while dramatically reducing wasted effort.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">⚡</span></div></div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;">
<h1><strong>Quick Links</strong></h1>
</div>
</div>
</td></tr></tbody></table>
<table bgcolor="" style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linkedin.com%2Fposts%2Fmedriscoll_aicouncil-share-7460452137131565056-NUMB%2F%3Futm_source=tldrdata/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/FVYfiuZNZzWYFJxRgMppc1DxXF5aqRNm4jYzQkajh7E=452">
<span>
<strong>Postgres has had a good 30-year run — is DuckDB coming for its crown? (2 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
DuckDB is no longer just an embedded analytics database.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fperformancede.substack.com%2Fp%2Fcomplete-end-to-end-build-of-etl%3Futm_source=tldrdata/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/7EdnZgV1Y-PxsJQLiZBIMCm0qhYAF2ONuvJiEVb29No=452">
<span>
<strong>Complete End-To-End Build of ETL Pipeline in AWS (12 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
A reusable AWS ETL pattern is built with ECS Fargate, DuckDB, ECR, EventBridge, CloudWatch, Secrets Manager, and Terraform, targeting single-node jobs rather than Spark-heavy Glue.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td align="left" style="word-break: break-word; vertical-align: top; padding: 5px 10px;">
<p style="padding: 0; margin: 0; font-size: 22px; color: #000000; line-height: 1.6; font-weight: bold;">
Want to advertise in TLDR? 📰
</p>
<div class="text-block" style="margin-top: 10px;">
If your company is interested in reaching an audience of data engineering professionals and decision makers, you may want to <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fadvertise.tldr.tech%2F%3Futm_source=tldrdata%26utm_medium=newsletter%26utm_campaign=advertisecta/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/GT7qFX1ZG1ivr9aqA2MUJFtRBt_4VTcnI4plOwdubEk=452"><strong><span>advertise with us</span></strong></a>.
</div>
<br>
<!-- New "Want to work at TLDR?" section -->
<p style="padding: 0; margin: 0; font-size: 22px; color: #000000; line-height: 1.6; font-weight: bold;">
Want to work at TLDR? 💼
</p>
<div class="text-block" style="margin-top: 10px;">
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fjobs.ashbyhq.com%2Ftldr.tech/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/VX-8LeSjjBZ5pC2JDkuW5pwKpDIeYwbXQ5POGwgREdE=452" rel="noopener noreferrer" style="color: #0000EE; text-decoration: underline;" target="_blank"><strong>Apply here</strong></a>,
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fjobs.ashbyhq.com%2Ftldr.tech%2Fc227b917-a6a4-40ce-8950-d3e165357871/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/96zYhKWeD7C1xN-y1KS3fw9KbS3hjVZpnJJ1pZzB1wE=452" rel="noopener noreferrer" style="color: #0000EE; text-decoration: underline;" target="_blank"><strong>create your own role</strong></a> or send a friend's resume to <a href="mailto:jobs@tldr.tech" style="color: #0000EE; text-decoration: underline;">jobs@tldr.tech</a> and get $1k if we hire them! TLDR is one of <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linkedin.com%2Ffeed%2Fupdate%2Furn:li:activity:7401699691039830016%2F/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/n3f0Xqzp1L6G-esqLdiFnkRiQgs7BJYt1gjWmwCgoqE=452" rel="noopener noreferrer" style="color: #0000EE; text-decoration: underline;" target="_blank"><strong>Inc.'s Best Bootstrapped businesses</strong></a> of 2025.
</div>
<br>
<div class="text-block">
If you have any comments or feedback, just respond to this email!
<br>
<br> Thanks for reading,
<br>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linkedin.com%2Fin%2Fjoelvanveluwen%2F/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/wegdGWSb01EwzeHC7VQkg8Ea7iu4CeNdnlpxk_zC5TE=452"><span>Joel Van Veluwen</span></a>, <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linkedin.com%2Fin%2Fjennytzurueyching%2F/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/C52ndRZ2izc5j-Y_fsniMsaVkOK4xdxHltW3ty_3qYI=452"><span>Tzu-Ruey Ching</span></a> & <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linkedin.com%2Fin%2Fremi-turpaud%2F/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/HTzbQWUWbYijTCPVOxWX1JkihehCWWPb2uP54h-Jnlc=452"><span>Remi Turpaud</span></a>
<br>
<br>
</div>
<br>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block" id="testing-id">
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Ftldr.tech%2Fdata%2Fmanage%3Femail=silk.theater.56%2540fwdnl.com/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/fg1b3pFTMoy4aJTevyQtU18al8k4K2eJVhb5s-j9DKg=452">Manage your subscriptions</a> to our other newsletters on tech, startups, and programming. Or if TLDR Data isn't for you, please <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fa.tldrnewsletter.com%2Funsubscribe%3Fep=1%26l=037ede50-92cc-11ee-b0f2-b761aa2217ad%26lc=1670a604-84b7-11f0-bcf5-55fc1d40139c%26p=777216a8-4f6f-11f1-a634-bf7d98d39e9f%26pt=campaign%26pv=4%26spa=1778752839%26t=1778753289%26s=c638585604054906cc20870360e07368720d359c4c54a25db8317ab1da986ff2/1/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/dYpX5UpKa4w7m4LRPE9ssElOebhrXMU_udsIuRLmgcs=452">unsubscribe</a>.
<br>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
</td></tr></tbody></table>
</td></tr></tbody></table>
</td></tr></tbody></table>
<img alt="" src="http://tracking.tldrnewsletter.com/CI0/0100019e25f53c0e-9efef70a-0e1b-4a4c-aa1b-04902dd11556-000000/DeTJpCSUcztsUIvUYg8a0oOesyr3F2YIl33Se8b6Xm4=452" style="display: none; width: 1px; height: 1px;">
</body></html>