<!DOCTYPE html><html lang="en"><head><meta http-equiv="Content-Type" content="text/html charset=UTF-8"><meta charset="UTF-8"><meta name="viewport" content="width=device-width"><meta name="x-apple-disable-message-reformatting"><title>TLDR Data</title><meta name="color-scheme" content="light dark"><meta name="supported-color-schemes" content="light dark"><style type="text/css">
:root {
color-scheme: light dark; supported-color-schemes: light dark;
}
*,
*:after,
*:before {
-webkit-box-sizing: border-box; -moz-box-sizing: border-box; box-sizing: border-box;
}
* {
-ms-text-size-adjust: 100%; -webkit-text-size-adjust: 100%;
}
html,
body,
.document {
width: 100% !important; height: 100% !important; margin: 0; padding: 0;
}
body {
-webkit-font-smoothing: antialiased; -moz-osx-font-smoothing: grayscale; text-rendering: optimizeLegibility;
}
div[style*="margin: 16px 0"] {
margin: 0 !important;
}
table,
td {
mso-table-lspace: 0pt; mso-table-rspace: 0pt;
}
table {
border-spacing: 0; border-collapse: collapse; table-layout: fixed; margin: 0 auto;
}
img {
-ms-interpolation-mode: bicubic; max-width: 100%; border: 0;
}
*[x-apple-data-detectors] {
color: inherit !important; text-decoration: none !important;
}
.x-gmail-data-detectors,
.x-gmail-data-detectors *,
.aBn {
border-bottom: 0 !important; cursor: default !important;
}
.btn {
-webkit-transition: all 200ms ease; transition: all 200ms ease;
}
.btn:hover {
background-color: #f67575; border-color: #f67575;
}
* {
font-family: Arial, Helvetica, sans-serif; font-size: 18px;
}
@media screen and (max-width: 600px) {
.container {
width: 100%; margin: auto;
}
.stack {
display: block!important; width: 100%!important; max-width: 100%!important;
}
.btn {
display: block; width: 100%; text-align: center;
}
}
body,
p,
td,
tr,
.body,
table,
h1,
h2,
h3,
h4,
h5,
h6,
div,
span {
background-color: #FEFEFE !important; color: #010101 !important;
}
@media (prefers-color-scheme: dark) {
body,
p,
td,
tr,
.body,
table,
h1,
h2,
h3,
h4,
h5,
h6,
div,
span {
background-color: #27292D !important; color: #FEFEFE !important;
}
}
a {
color: inherit !important; text-decoration: underline !important;
}
</style><!--[if mso | ie]>
<style type="text/css">
a {
background-color: #FEFEFE !important; color: #010101 !important;
}
@media (prefers-color-scheme: dark) {
a {
background-color: #27292D !important; color: #FEFEFE !important;
}
}
</style>
<![endif]--></head><body class="">
<div style="display: none; max-height: 0px; overflow: hidden;">Stripe runs DocDB on open-source MongoDB to support 5 million QPS, 2,000+ shards, and 99.9995% reliability while processing $1.4T in payments in 2024 β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β </div>
<div style="display: none; max-height: 0px; overflow: hidden;">
<br>
</div>
<table align="center" class="document"><tbody><tr><td valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" class="container" width="600"><tbody><tr class="inner-body"><td>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr class="header"><td bgcolor="" class="container">
<table width="100%"><tbody><tr><td class="container">
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" style="margin-top: 0px;" width="100%"><tbody><tr><td style="padding: 0px;">
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div style="text-align: center;">
<span style="margin-right: 0px;"><a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Ftldr.tech%2Fdata%3Futm_source=tldrdata/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/kGq7mffYasEeQRtWRuqu1N1nYcArLElp9xwPxpjtf2o=452" rel="noopener noreferrer" target="_blank"><span>Sign Up</span></a>
|<span style="margin-right: 2px; margin-left: 2px;"><a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fadvertise.tldr.tech%3Futm_source=tldrdata%26utm_medium=newsletter%26utm_campaign=advertisetopnav/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/QTT9wp4xz0vYFYCsx6sd0o6DaRJszITFGDrt1hqrYV8=452" rel="noopener noreferrer" target="_blank"><span>Advertise</span></a></span>|<span style="margin-left: 2px;"><a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fa.tldrnewsletter.com%2Fweb-version%3Fep=1%26lc=1670a604-84b7-11f0-bcf5-55fc1d40139c%26p=159ab312-4769-11f1-bf34-a10f63a237bd%26pt=campaign%26t=1777889268%26s=1bba7e95fcbe3149ee55f90686b7e3e736572ea88d403346561c7ce25a3cdd9c/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/RofYtW0Ph4KQYaoT9_bX5tDQxgPEaggdEH7G_nN3vHs=452"><span>View Online</span></a></span>
<br>
</span></div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="text-align: center;"><span data-darkreader-inline-color="" style="--darkreader-inline-color:#3db3ff; color: rgb(51, 175, 255) !important; font-size: 30px;">T</span><span style="font-size: 30px;"><span data-darkreader-inline-color="" style="color: rgb(232, 192, 96) !important; --darkreader-inline-color:#e8c163; font-size:30px;">L</span><span data-darkreader-inline-color="" style="color: rgb(101, 195, 173) !important; --darkreader-inline-color:#6ec7b2; font-size:30px;">D</span></span><span data-darkreader-inline-color="" style="--darkreader-inline-color:#dd6e6e; color: rgb(220, 107, 107) !important; font-size: 30px;">R</span>
<br>
</td></tr></tbody></table>
<br>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr id="together-with"><td align="center" height="20" style="vertical-align:middle !important;" valign="middle" width="100%"><strong style="vertical-align:middle !important; height: 100%;">Together With </strong>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fai4.io%2Fregister%2F%3Futm_source=paid_partner%26utm_campaign=TLDR_Data%26utm_term=newsletter/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/oaWOvInSNo8KxAm5RlNeykTwRHn0JPmPvW5zr89OB1o=452"><img src="https://images.tldr.tech/ai4.png" valign="middle" style="vertical-align: middle !important; height: 100%;" alt="Ai4"></a></td></tr></tbody></table>
<table style="table-layout: fixed; width:100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;">
<div style="text-align: center;">
<h1><strong>TLDR Data <span id="date">2026-05-04</span></strong></h1>
</div>
</td></tr></tbody></table>
<table style="table-layout: fixed; width:100%;" width="100%"><tbody><tr id="sponsy-copy"><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fai4.io%2Fregister%2F%3Futm_source=paid_partner%26utm_campaign=TLDR_Data%26utm_term=newsletter/2/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/ReGoJD1G4EXINZzhH-qwe8v7ow57bMsdz8w78aFomsU=452">
<span>
<strong>Don't miss Ai4 2026 β America's largest AI conference! (Sponsor)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Join 12,000+ attendees, 1,000+ speakers, and 400+ exhibits spanning every layer of the modern AI stack. Go deep on AI agents, RAG, world models, MLOps, and applied ML with technical sessions and case studies from Fortune 500 teams shipping AI in production. Don't missβ¦<p></p><p>> Dedicated content tracks for <strong>data scientists </strong>and <strong>ML engineers</strong>, amongst other technical roles</p><p>> Keynotes from AI greats including <strong>Geoffrey Hinton</strong>,<strong> Fei-Fei Li,</strong> and <strong>Andrew Ng</strong></p><p>> <strong>Peer-to-peer networking</strong> opportunities with those solving the same problems you are</p><p>Taking place at the <strong>Venetian in Las Vegas, August 4-6</strong>. Save $1200<strong> </strong>off final prices. <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fai4.io%2Fregister%2F%3Futm_source=paid_partner%26utm_campaign=TLDR_Data%26utm_term=newsletter/3/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/PyLRo9i1mTJSszCx1udSxDJwn4XEb03VaItyTRaj3QU=452" rel="noopener noreferrer nofollow" target="_blank"><span><strong>Learn more and register now!</strong></span></a>
</p>
</span></span></div>
</td></tr></tbody></table>
</td></tr></tbody></table>
</td></tr></tbody></table>
</td></tr>
<tr bgcolor=""><td class="container">
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td style="padding: 0px;">
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">π±</span></div></div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;">
<h1><strong>Deep Dives</strong></h1>
</div>
</div>
</td></tr></tbody></table>
<table style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.infoq.com%2Fpresentations%2Fdocdb-online-database%2F%3Futm_source=tldrdata/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/SY4hzvK-goKcBthvjCZCVqKxTEFjRS2n2QR7utdFyx8=452">
<span>
<strong>Stripe's DocDB: How Zero-Downtime Data Movement Powers Trillion-Dollar Payment Processing (44 minute video)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Stripe runs DocDB on open-source MongoDB to support 5 million QPS, 2,000+ shards, and 99.9995% reliability while processing $1.4T in payments in 2024. Its zero-downtime data movement platform enables horizontal sharding, version upgrades, and single-tenant/multi-tenant migrations without interrupting traffic using point-in-time snapshots, CDC-based replication, and version-gated cutovers.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Flinks.tldrnewsletter.com%2FOlYn1D/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/hLrXYtZLeiVcjws1E5ALd_xwaQEKYTSbQYIP_sL_YZY=452">
<span>
<strong>Optimizing ML Workload Network Efficiency (Part I): Feature Trimmer (14 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Pinterest built Feature Trimmer to dynamically remove low-value or redundant features from large-scale ML training and inference requests, dramatically reducing network bandwidth usage and cost while maintaining model performance. It combines offline feature importance analysis with online trimming logic, resulting in substantial network bandwidth reduction and improved client-side latency.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fengineering.grab.com%2Fdata-mesh-2%3Futm_source=tldrdata/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/SwNACAa43K4lk6KktS9efw35wx583NiYmkWfZ-Y7itU=452">
<span>
<strong>Data Mesh at Grab Part II: The Foundational Tools behind Certification (10 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Grab operationalizes data mesh certification with an event-driven metadata graph built on DataHub, Kafka-backed metadata events, DataHub Actions for continuous certification, Temporal for validation workflows, and Airflow/Lighthouse pipeline-completion events to trigger quality checks. The key idea: trust is computed from live ownership, lineage, contracts, SLAs, and test health, not manually assigned, and contract rules link to concrete health endpoints.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Flinks.tldrnewsletter.com%2F7Mg1ij/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/y_Rczz2HzqGGe61DuDEjn-gR9YVTJNRXYzU4XqOe-0I=452">
<span>
<strong>How we rebuilt search ranking at Faire with deep learning (11 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Faire rebuilt its search ranking stack from XGBoost to deep learning to better optimize competing goals like relevance, freshness, brand discovery, and cross-surface consistency. The migration required reworking data pipelines, observability, and production serving, including custom Docker-based infrastructure, shared-memory embeddings, and CPU sandboxing to cut startup latency from 20β30 minutes to a few minutes. The new stack delivered measurable gains, including a ~2% order volume boost on Product Search.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">π</span></div>
</div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;">
<h1><strong>Opinions & Advice</strong></h1>
</div>
</div>
</td></tr></tbody></table>
<table style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fhex.tech%2Fblog%2Fautomated-data-validation%2F%3Futm_source=tldrdata/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/_2uOLD6LVkjKw1glLrlH22oqTh8ptJg6HYhtOwL4_HI=452">
<span>
<strong>We automated data validation β Here's how we did it (12 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
AI is becoming useful for analytics engineering not by replacing human judgment, but by removing the repetitive audit work around validation. The best pattern is agent-assisted, evidence-heavy workflows where AI runs checks, investigates changes, shows its work, and humans still decide what is acceptable.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fghostinthedata.info%2Fposts%2F2026%2F2026-05-02-five-worlds-data-engineering%2F%3Futm_source=tldrdata/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/OvUaTPwEop6G113Uq9YHI6mwj2rKph7wcgB5I382EV4=452">
<span>
<strong>Five Worlds of Data Engineering (10 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Data engineering advice often fails because it's written for one of five very different operating models: startup-style analytics teams, legacy enterprise environments, outcome-critical product/data systems, regulated businesses, or platform/data-mesh organizations. Each has different priorities (speed, stability, consequence, auditability, or adoption) and practices that are βbestβ in one can be dangerous in another. Classify your environment before applying guidance, so architecture, governance, and delivery practices match the actual constraints.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Flinks.tldrnewsletter.com%2F6UXi9A/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/usxdQXA7N-E24UM8YTj1688YDgq7bo_1ucNh_Mff1lQ=452">
<span>
<strong>How We Built an AI Second Brain for 60K Knowledge Workers (8 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Meta built an internal AI Second Brain to help its knowledge workers quickly find, synthesize, and reason over vast amounts of internal company information and documents. The system combines retrieval-augmented generation (RAG), advanced search, and agentic capabilities, with careful attention to privacy, accuracy, and enterprise-grade controls.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">π»</span></div>
</div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;">
<h1><strong>Launches & Tools</strong></h1>
</div>
</div>
</td></tr></tbody></table>
<table style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwelodata.ai%2Fmultilingual-ai%2F%3Futm_source=tldr-ai%26utm_medium=email%26utm_content=tldr-data-secondary%26utm_campaign=2026-ad-welo-data-multilingual-and-culture/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/-yTymqG3iAUBypMKnheebuAVxOKK_xtxrYV8UCLXYXA=452">
<span>
<strong>Your model scores great on evals. But they were built for English. Does that performance hold in Arabic? (Sponsor)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
<strong>4β5Γ performance degradation</strong> in low-resource languages often stays hidden until production. <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwelodata.ai%2Fmultilingual-ai%2F%3Futm_source=tldr-ai%26utm_medium=email%26utm_content=tldr-data-secondary%26utm_campaign=2026-ad-welo-data-multilingual-and-culture/2/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/yEXipSIXM0il57Oq9Dw-OpFbLgv5_g6d6zzo6UIhEm0=452" rel="noopener noreferrer nofollow" target="_blank"><span>Native-language training data & human evals</span></a> in 155+ locales help you benchmark against real users, not just English ones. <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwelodata.ai%2Fmultilingual-ai%2F%3Futm_source=tldr-ai%26utm_medium=email%26utm_content=tldr-data-secondary%26utm_campaign=2026-ad-welo-data-multilingual-and-culture/3/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/O01Ul0xywBAMudJ8a9LngJ4qUkWhsRnwPhGJnovO_AA=452" rel="noopener noreferrer nofollow" target="_blank"><span>Don't ship blind β Welo Data</span></a>
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fgithub.com%2Fraulcd%2Fdatanomy%3Futm_source=tldrdata/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/WGL3xC93iEDfjM2mGUc8SRYgNki0M9J66KI1G_gkGng=452">
<span>
<strong>Datanomy (GitHub Repo)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Datanomy is a terminal tool for inspecting Parquet files. It shows schemas, metadata, data, statistics, and internal structures in an interactive view.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.decodingai.com%2Fp%2Fship-rag-with-weave-cli%3Futm_source=tldrdata/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/rSPR3o8WxiKjCuilf16hbrYmxfH92org9zCA1bU_kAo=452">
<span>
<strong>What Held Up at 3 AM: One Engineer's RAG Case Study (17 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Most RAG systems fail in production because teams hard-code a vector DB, embedding model, and chunking strategy without observability or repeatable evals. Weave CLI addresses this by unifying 11 vector databases, 5 embedding providers, and swappable agents behind a single config-driven interface. OpenTelemetry and Opik tracing is baked in from day one.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fpola.rs%2Fposts%2Fschema-evolution%2F%3Futm_source=tldrdata/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/V78A_PivHTsg0fhIhA441J4psRhtbgrHnAYnjh4NYTE=452">
<span>
<strong>Handling Schema Issues in Polars (6 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Polars has strong built-in support for schema evolution for changes like new or missing columns, type drifts, and breaking changes. Depending on the data format, use parameters such as missing_columns="insert", schema_mode="merge", ScanCastOptions, and diagonal_relaxed concat, so pipelines don't break when upstream schemas change.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">π</span></div></div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><strong><h1>Miscellaneous</h1></strong></div>
</div>
</td></tr></tbody></table>
<table bgcolor="" style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Flinks.tldrnewsletter.com%2FKCi5GW/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/SUF7KV44ISSZ-jUzdBccq6ktPJDOCjAxQD0y1H2LtNM=452">
<span>
<strong>Bottling the River: Apache Fluss on EKS (6 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Apache Fluss is an βindexable Kafkaβ that combines horizontally scalable streaming ingestion with columnar storage, primary-key tables, CDC, and optional tiering to S3 or lakehouse formats like Iceberg and Paimon. In production on EKS, integrating it with Flink requires fixing several issues, such as missing connector JARs, S3 credential/delegation-token issues, and extra dependencies. Fluss can significantly simplify stateful streaming and lookup workloads, but 0.9-era production use still needs careful operational tuning.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Flinks.tldrnewsletter.com%2FzM5sdJ/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/Y9w7oH4NZed0LjG7_49cLeBcJ_O0XYr-k5P6Z34swUg=452">
<span>
<strong>Effective KV Compression with TurboQuant (4 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
TurboQuant is a quantization and compression algorithm for Key-Value (KV) caches in large language models and vector search systems. It uses PolarQuant to first map vectors into polar coordinates, followed by QJL (Quantized Johnson-Lindenstrauss), which applies a minimal 1-bit correction to remove hidden biases, enabling compression down to ~3 bits per value with virtually no loss in accuracy.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">β‘</span></div></div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;">
<h1><strong>Quick Links</strong></h1>
</div>
</div>
</td></tr></tbody></table>
<table bgcolor="" style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.theseattledataguy.com%2Fdoes-elt-vs-etl-even-still-matter%2F%23page-content%3Futm_source=tldrdata/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/EtEfdOgUUKFRXyFXjvMERYnHNj-AKM3XxQqxEp00-KM=452">
<span>
<strong>Does ELT vs. ETL Even Still Matter? (6 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Cloud data platforms like Snowflake, BigQuery, Redshift, and Databricks have made ELT the default because it is simpler, faster to iterate on, and lets teams use scalable warehouse compute for transformations.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fneo4j.com%2Fblog%2Fdeveloper%2Fintroducing-neo4j-agent-skills%2F%3Futm_source=tldrdata/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/WStK6RgNj53PONd0veKCGBcqeXAglxNPXkvEcXKQs2I=452">
<span>
<strong>Introducing Neo4j Agent Skills (3 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Neo4j has released a first wave of Agent Skills to keep coding agents current with Cypher 25 and recent GQL-aligned syntax, including SHORTEST 3, REPEATABLE ELEMENTS, quantified path patterns, and path projections.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td align="left" style="word-break: break-word; vertical-align: top; padding: 5px 10px;">
<p style="padding: 0; margin: 0; font-size: 22px; color: #000000; line-height: 1.6; font-weight: bold;">
Want to advertise in TLDR? π°
</p>
<div class="text-block" style="margin-top: 10px;">
If your company is interested in reaching an audience of data engineering professionals and decision makers, you may want to <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fadvertise.tldr.tech%2F%3Futm_source=tldrdata%26utm_medium=newsletter%26utm_campaign=advertisecta/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/isTy_85UtR2dk6BRVu4vi07EfLDZeDzNGh-1bCniE5w=452"><strong><span>advertise with us</span></strong></a>.
</div>
<br>
<!-- New "Want to work at TLDR?" section -->
<p style="padding: 0; margin: 0; font-size: 22px; color: #000000; line-height: 1.6; font-weight: bold;">
Want to work at TLDR? πΌ
</p>
<div class="text-block" style="margin-top: 10px;">
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fjobs.ashbyhq.com%2Ftldr.tech/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/B-ul-hZT-_XgcJRXT6zEzpsl5w_UBeVa3eCWihG80mg=452" rel="noopener noreferrer" style="color: #0000EE; text-decoration: underline;" target="_blank"><strong>Apply here</strong></a>,
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fjobs.ashbyhq.com%2Ftldr.tech%2Fc227b917-a6a4-40ce-8950-d3e165357871/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/LPB_C_bVOoGuxP212Op8ixbmWLikruu_C6eBXCaIDP8=452" rel="noopener noreferrer" style="color: #0000EE; text-decoration: underline;" target="_blank"><strong>create your own role</strong></a> or send a friend's resume to <a href="mailto:jobs@tldr.tech" style="color: #0000EE; text-decoration: underline;">jobs@tldr.tech</a> and get $1k if we hire them! TLDR is one of <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linkedin.com%2Ffeed%2Fupdate%2Furn:li:activity:7401699691039830016%2F/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/4zVR4IVLo56sZhk4EfThnqNZav-_gv0GMM_3PdUjouw=452" rel="noopener noreferrer" style="color: #0000EE; text-decoration: underline;" target="_blank"><strong>Inc.'s Best Bootstrapped businesses</strong></a> of 2025.
</div>
<br>
<div class="text-block">
If you have any comments or feedback, just respond to this email!
<br>
<br> Thanks for reading,
<br>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linkedin.com%2Fin%2Fjoelvanveluwen%2F/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/Al3v4qUuvyLLzXoR5AFKqLb_Bs1PNV5YemzC-F0Zwg4=452"><span>Joel Van Veluwen</span></a>, <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linkedin.com%2Fin%2Fjennytzurueyching%2F/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/3QO9ISng1R4Jmj_hwo71gnxCr1_EfpYoDmb3pSdFVJQ=452"><span>Tzu-Ruey Ching</span></a> & <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linkedin.com%2Fin%2Fremi-turpaud%2F/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/FHkLTmocsi73VHqhQ4Qf0YSokDEWmKNaCkxmBZsoNpA=452"><span>Remi Turpaud</span></a>
<br>
<br>
</div>
<br>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block" id="testing-id">
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Ftldr.tech%2Fdata%2Fmanage%3Femail=silk.theater.56%2540fwdnl.com/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/A5d0VAlrSE0Ipudp3-_WI7vUxJ1iD3-r5IEO_ddmFUY=452">Manage your subscriptions</a> to our other newsletters on tech, startups, and programming. Or if TLDR Data isn't for you, please <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fa.tldrnewsletter.com%2Funsubscribe%3Fep=1%26l=037ede50-92cc-11ee-b0f2-b761aa2217ad%26lc=1670a604-84b7-11f0-bcf5-55fc1d40139c%26p=159ab312-4769-11f1-bf34-a10f63a237bd%26pt=campaign%26pv=4%26spa=1777888830%26t=1777889268%26s=3abf8ddb47f205515d9deb2c0916478c775a11f9e04f971f51b0d7bceda78314/1/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/eqaX6Ofx_WtR8IFqvuTpzdDMUmAKC3SYmCaJoUyzINE=452">unsubscribe</a>.
<br>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
</td></tr></tbody></table>
</td></tr></tbody></table>
</td></tr></tbody></table>
<img alt="" src="http://tracking.tldrnewsletter.com/CI0/0100019df275535f-b654d679-b134-48d5-90a3-c1eb4f5cd25e-000000/MBLEuLdnGP4EPFJFqdjJijSWDHSDbuRS2WSEXN8UNq0=452" style="display: none; width: 1px; height: 1px;">
</body></html>