<!DOCTYPE html><html lang="en"><head><meta http-equiv="Content-Type" content="text/html charset=UTF-8"><meta charset="UTF-8"><meta name="viewport" content="width=device-width"><meta name="x-apple-disable-message-reformatting"><title>TLDR Data</title><meta name="color-scheme" content="light dark"><meta name="supported-color-schemes" content="light dark"><style type="text/css">
:root {
color-scheme: light dark; supported-color-schemes: light dark;
}
*,
*:after,
*:before {
-webkit-box-sizing: border-box; -moz-box-sizing: border-box; box-sizing: border-box;
}
* {
-ms-text-size-adjust: 100%; -webkit-text-size-adjust: 100%;
}
html,
body,
.document {
width: 100% !important; height: 100% !important; margin: 0; padding: 0;
}
body {
-webkit-font-smoothing: antialiased; -moz-osx-font-smoothing: grayscale; text-rendering: optimizeLegibility;
}
div[style*="margin: 16px 0"] {
margin: 0 !important;
}
table,
td {
mso-table-lspace: 0pt; mso-table-rspace: 0pt;
}
table {
border-spacing: 0; border-collapse: collapse; table-layout: fixed; margin: 0 auto;
}
img {
-ms-interpolation-mode: bicubic; max-width: 100%; border: 0;
}
*[x-apple-data-detectors] {
color: inherit !important; text-decoration: none !important;
}
.x-gmail-data-detectors,
.x-gmail-data-detectors *,
.aBn {
border-bottom: 0 !important; cursor: default !important;
}
.btn {
-webkit-transition: all 200ms ease; transition: all 200ms ease;
}
.btn:hover {
background-color: #f67575; border-color: #f67575;
}
* {
font-family: Arial, Helvetica, sans-serif; font-size: 18px;
}
@media screen and (max-width: 600px) {
.container {
width: 100%; margin: auto;
}
.stack {
display: block!important; width: 100%!important; max-width: 100%!important;
}
.btn {
display: block; width: 100%; text-align: center;
}
}
body,
p,
td,
tr,
.body,
table,
h1,
h2,
h3,
h4,
h5,
h6,
div,
span {
background-color: #FEFEFE !important; color: #010101 !important;
}
@media (prefers-color-scheme: dark) {
body,
p,
td,
tr,
.body,
table,
h1,
h2,
h3,
h4,
h5,
h6,
div,
span {
background-color: #27292D !important; color: #FEFEFE !important;
}
}
a {
color: inherit !important; text-decoration: underline !important;
}
</style><!--[if mso | ie]>
<style type="text/css">
a {
background-color: #FEFEFE !important; color: #010101 !important;
}
@media (prefers-color-scheme: dark) {
a {
background-color: #27292D !important; color: #FEFEFE !important;
}
}
</style>
<![endif]--></head><body class="">
<div style="display: none; max-height: 0px; overflow: hidden;">Databricks Lakehouse//RT is a real-time data warehouse powered by Reyden that delivers millisecond query performance directly on lakehouse data β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β </div>
<div style="display: none; max-height: 0px; overflow: hidden;">
<br>
</div>
<table align="center" class="document"><tbody><tr><td valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" class="container" width="600"><tbody><tr class="inner-body"><td>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr class="header"><td bgcolor="" class="container">
<table width="100%"><tbody><tr><td class="container">
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" style="margin-top: 0px;" width="100%"><tbody><tr><td style="padding: 0px;">
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div style="text-align: center;">
<span style="margin-right: 0px;"><a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Ftldr.tech%2Fdata%3Futm_source=tldrdata/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/7tZCB6wGVuIwmwMJZWZfurFxERhKZk3TU9T1_WmuNxM=452" rel="noopener noreferrer" target="_blank"><span>Sign Up</span></a>
|<span style="margin-right: 2px; margin-left: 2px;"><a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fadvertise.tldr.tech%3Futm_source=tldrdata%26utm_medium=newsletter%26utm_campaign=advertisetopnav/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/hrn2IupcfT0ySTe02ufv0bG5OM8INXxuVoPxfUy5yJM=452" rel="noopener noreferrer" target="_blank"><span>Advertise</span></a></span>|<span style="margin-left: 2px;"><a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fa.tldrnewsletter.com%2Fweb-version%3Fep=1%26lc=1670a604-84b7-11f0-bcf5-55fc1d40139c%26p=7f007f30-6ae1-11f1-8139-8b6863562637%26pt=campaign%26t=1781777301%26s=a0b7f2a7d8bd13458e6f5ffe8b99187e2c58597e568a0f746fd2780daf47ffac/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/SA7EbC8kKxTqBFmTveqxdMu_YIBh5hvb5LPsyYk21aE=452"><span>View Online</span></a></span>
<br>
</span></div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="text-align: center;"><span data-darkreader-inline-color="" style="--darkreader-inline-color:#3db3ff; color: rgb(51, 175, 255) !important; font-size: 30px;">T</span><span style="font-size: 30px;"><span data-darkreader-inline-color="" style="color: rgb(232, 192, 96) !important; --darkreader-inline-color:#e8c163; font-size:30px;">L</span><span data-darkreader-inline-color="" style="color: rgb(101, 195, 173) !important; --darkreader-inline-color:#6ec7b2; font-size:30px;">D</span></span><span data-darkreader-inline-color="" style="--darkreader-inline-color:#dd6e6e; color: rgb(220, 107, 107) !important; font-size: 30px;">R</span>
<br>
</td></tr></tbody></table>
<br>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody></tbody></table>
<table style="table-layout: fixed; width:100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;">
<div style="text-align: center;">
<h1><strong>TLDR Data <span id="date">2026-06-18</span></strong></h1>
</div>
</td></tr></tbody></table>
<table style="table-layout: fixed; width:100%;" width="100%"><tbody></tbody></table>
</td></tr></tbody></table>
</td></tr></tbody></table>
</td></tr>
<tr bgcolor=""><td class="container">
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td style="padding: 0px;">
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">π±</span></div></div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;">
<h1><strong>Deep Dives</strong></h1>
</div>
</div>
</td></tr></tbody></table>
<table style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Flinks.tldrnewsletter.com%2F5Frijj/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/ko_xf7GioG30qaguFHu1ThuS0ckM_W60zVz58Qnj3Yk=452">
<span>
<strong>Predicting model behavior before release by simulating deployment (6 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
OpenAI's Deployment Simulation is a new pre-release safety technique that replays real (de-identified) user conversation prefixes from previous deployments and generates responses with a candidate model to predict how it will actually behave in production, providing far more realistic coverage and better rate estimates of undesired behaviors than traditional evaluations.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Flinks.tldrnewsletter.com%2F6oCNbG/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/lDBddf1iLgHDC_VuQqNhS38_fR5-gw9Nk4MwS9RLsqw=452">
<span>
<strong>Building an AI Database for Agentic GTM Operations (11 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Rippling rebuilt its go-to-market data foundation into an AI Database on a lakehouse to power agentic operations, replacing fragmented warehouses and manual processes with a unified intelligence layer. Key elements include ML-based entity resolution across third-party sources, medallion architecture, semantic search over enriched conversation data, and a natural-language Genie interface used by AI agents.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Ftech.instacart.com%2Ffrom-scoring-to-spelling-rebuilding-ads-retrieval-at-instacart-cf36b4e8d1bb%3Futm_source=tldrdata/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/GUHYHn4h5huWr6axGeZuDR7MnbJq8Pq0sndrp7tCStg=452">
<span>
<strong>From Scoring to Spelling: Rebuilding Ads Retrieval at Instacart (12 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Instacart rebuilt its ads retrieval system by moving from a scoring-based BERT model (that scored every product ID) to a generative approach that βspells outβ recommendations token-by-token using Instacart Semantic IDs. This shift solved vocabulary bottlenecks, cold-start problems, and structural drift, enabling better generalization, full catalog coverage, and stronger session understanding.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Flinks.tldrnewsletter.com%2FJmhIBi/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/SjVih8RLhVK1m6Uefi6BUfj4eUagLpnrc5ED5Kzj86s=452">
<span>
<strong>Federated Query Platform for ML at Scale: Architecture and Multi-Tenancy (8 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Guidewire used Apache Trino to federate SQL across Iceberg, Redshift, OpenSearch, and customer S3 buckets, speeding exploratory ML workflows. Domain catalogs and Lake Formation ABAC plus Trino RBAC handled isolation, but Trino's S3 layer exposed a governance gap.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">π</span></div>
</div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;">
<h1><strong>Opinions & Advice</strong></h1>
</div>
</div>
</td></tr></tbody></table>
<table style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Flinks.tldrnewsletter.com%2FmvGXjY/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/yd8uznyPN2XfPU5UyX8_mjGIjQCUwYbi8lvyDaoVASY=452">
<span>
<strong>Why We Moved from Hive-Style Data Lakes to Apache Iceberg? (12 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Moving from a Hive-style partitioned data lake (Parquet files on S3 + AWS Glue Catalog) to Apache Iceberg after AWS strengthened its ecosystem support (including S3 Tables) solved long-standing pain points with Hive-style architectures. Iceberg enables efficient pruning, seamless schema and partition evolution, time travel, and better query planning performance.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fanyscale.com%2Fblog%2Fdata-processing-becoming-gpu-workload%3Futm_source=tldrdata/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/hh7tGwZq_oY1iqtmq4XAHz-F7U0Co1Hqdi300a39mTg=452">
<span>
<strong>Data Processing is Becoming a GPU Workload (6 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Data processing is moving from CPU-centric SQL ETL to GPU-heavy inference pipelines for video, audio, PDFs, Slack, and sensor data. Models now curate data first, creating embeddings, labels, summaries, and structured records for SQL and vector systems, which pushes platforms toward mixed compute, streaming, and API-aware concurrency.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fmoderndata101.substack.com%2Fp%2Fthe-identity-crisis-entity-resolution%3Futm_source=tldrdata/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/VHk8kDX3PfbZ7kWjd9kUnlDNkE8bdeDQP8P_JC2MjJA=452">
<span>
<strong>The Identity Crisis: Why Entity Resolution Is the Missing Foundation of Every Data Product Stack (10 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Identity resolution and warehouse-native MDM are core infrastructure for trusted data products, AI, and compliance. At enterprise scale, local checks fall short, creating duplicate customers, phantom entities, and model-poisoning risk. The pattern combines blocking, rule-based and ML matching, graph clustering, and human review inside the warehouse.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">π»</span></div>
</div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;">
<h1><strong>Launches & Tools</strong></h1>
</div>
</div>
</td></tr></tbody></table>
<table style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Ffandf.co%2F4vGuPvZ%3Futm_source=tldrdata/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/dTJBA6T6tjg-KVRQ2-rq4zKOPAOzj_MjwvglqmMatvA=452">
<span>
<strong>Insights from the 2026 State of Analytics Engineering (Sponsor)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
AI is reshaping analytics engineering, but organizations continue to face challenges around trust, governance, and cost management. Drawing on insights from hundreds of analytics and data professionals, this report examines the trends, priorities, and practices defining the next generation of data teams. <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Ffandf.co%2F4vGuPvZ/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/3yaee53dJ1ifLpA0InhEN9Ja9mOrkig29I331SC0ZgQ=452" rel="noopener noreferrer nofollow" target="_blank"><span>Read the dbt Labs report</span></a>
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.databricks.com%2Fblog%2Fintroducing-lakehousert-real-time-performance-unified-lakehouse%3Futm_source=tldrdata/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/LsfZxBvxy0vCuJzzudk7Q3C3W8tqlkXpz9FxzhQ7ASM=452">
<span>
<strong>Introducing Lakehouse//RT: Real-Time Performance on a Unified Lakehouse (13 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Databricks Lakehouse//RT is a real-time data warehouse powered by Reyden that delivers millisecond query performance directly on lakehouse data without separate serving layers or data movement. It aims to simplify real-time analytics, BI, app serving, and observability by keeping performance, governance, and open data formats inside the Databricks Lakehouse.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fgithub.com%2Fbjonesdataliteracy%2Fdatapitfalls%3Futm_source=tldrdata/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/_64DlgQ2WepNVBsDDJqEzFn8dlhPNPw4eWGbe2AhBDs=452">
<span>
<strong>datapitfalls (GitHub Repo)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
datapitfalls is an open-source Claude-powered tool that audits charts, code, written analysis, and documents for common data mistakes across the full reasoning chain, from question framing to communication. It goes beyond chart linting by using Ben Jones' Avoiding Data Pitfalls taxonomy to identify issues like bias, silent pipeline failures, bad aggregation, statistical errors, misleading visuals, and unclear presentation, then explains severity and fixes.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.postgresql.org%2Fabout%2Fnews%2Fpg_kpart-version-10-3316%2F%3Futm_source=tldrdata/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/sJnpq6wz_UkfoA0_M7ItNIEhYi6nCru1twkL52AKQOY=452">
<span>
<strong>pg_kpart version 1.0 (2 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
pg_kpart blocks PostgreSQL partitioned-table queries unless the planner can prune by partition key, preventing accidental full scans and I/O storms. It supports audit rollout, whitelist/blacklist scoping, SQLSTATE handling, and is Linux-only.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">π</span></div></div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><strong><h1>Miscellaneous</h1></strong></div>
</div>
</td></tr></tbody></table>
<table bgcolor="" style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fengineering.salesforce.com%2Fhow-data-360-segmentation-processes-a-quadrillion-records-across-arbitrary-customer-data-models%2F%3Futm_source=tldrdata/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/-8P0AmHVuO4jRKZR0brnJW22_IE_pQvmvFCdSjH0tNc=452">
<span>
<strong>How Data 360 Segmentation Processes a Quadrillion Records Across Arbitrary Customer Data Models (6 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Salesforce's Data 360 segmentation processes 1 quadrillion records per month across arbitrary customer schemas, relationship graphs, and storage systems, while running about 3 million Spark jobs monthly. Metadata became the bottleneck, with some environments hitting 3,000 to 6,000 tables, 500+ MB metadata payloads, and billions of candidate query plans.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.heidihealth.com%2Fblog%2Fclinical-ai-model-fine-tuning%3Futm_source=tldrdata/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/B-6gQb4Nd7FTYQw_5KY7zEteBbr8O8IxZaUrOzebrMk=452">
<span>
<strong>Fine-tuning a clinical AI model to frontier parity (8 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Heidi AI fine-tuned a smaller clinical model to match a frontier model in blinded clinician preference tests. Its edge comes from proprietary clinician feedback, safety checks, and a product loop tuned to real clinical judgment.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">β‘</span></div></div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;">
<h1><strong>Quick Links</strong></h1>
</div>
</div>
</td></tr></tbody></table>
<table bgcolor="" style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fboringsql.com%2Fposts%2Fnot-in-null%2F%3Futm_source=tldrdata/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/9kC7RvyQkceSkVz8LlNVXbLTM8ZvWaF6KsMVbzscjak=452">
<span>
<strong>The NULL in your NOT IN (13 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
NOT IN in PostgreSQL is a classic gotcha: a single NULL in the subquery (or left side) causes the entire query to return zero rows due to three-valued logic.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.probably.dev%2F%3Futm_source=tldrdata/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/8fDfH3XI4Pgynzt-1bRTfWHO6MMuMX0Vx0NkKQlJP_I=452">
<span>
<strong>Probably (Tool)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: "Helvetica Neue", Helvetica, Arial, Verdana, sans-serif;">
Probably is a local data agent for natural-language analysis across files and warehouses.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td align="left" style="word-break: break-word; vertical-align: top; padding: 5px 10px;">
<p style="padding: 0; margin: 0; font-size: 22px; color: #000000; line-height: 1.6; font-weight: bold;">
Want to advertise in TLDR? π°
</p>
<div class="text-block" style="margin-top: 10px;">
If your company is interested in reaching an audience of data engineering professionals and decision makers, you may want to <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fadvertise.tldr.tech%2F%3Futm_source=tldrdata%26utm_medium=newsletter%26utm_campaign=advertisecta/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/JByzGMF6cZ0iqIDFPSzW-3Y0OvFNt9x8ZiDV6MXck7o=452"><strong><span>advertise with us</span></strong></a>.
</div>
<br>
<!-- New "Want to work at TLDR?" section -->
<p style="padding: 0; margin: 0; font-size: 22px; color: #000000; line-height: 1.6; font-weight: bold;">
Want to work at TLDR? πΌ
</p>
<div class="text-block" style="margin-top: 10px;">
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fjobs.ashbyhq.com%2Ftldr.tech/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/Iz4K0gOe97R_C_MXFjIJWq5psQvlHc9AHiY7o2sVWdw=452" rel="noopener noreferrer" style="color: #0000EE; text-decoration: underline;" target="_blank"><strong>Apply here</strong></a>,
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fjobs.ashbyhq.com%2Ftldr.tech%2Fc227b917-a6a4-40ce-8950-d3e165357871/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/sa1d0I4MxjeuGyHQeHR8_zOLBISZDW5Q_E0fiMiVtLo=452" rel="noopener noreferrer" style="color: #0000EE; text-decoration: underline;" target="_blank"><strong>create your own role</strong></a> or send a friend's resume to <a href="mailto:jobs@tldr.tech" style="color: #0000EE; text-decoration: underline;">jobs@tldr.tech</a> and get $1k if we hire them! TLDR is one of <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linkedin.com%2Ffeed%2Fupdate%2Furn:li:activity:7401699691039830016%2F/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/8N5eNQ98esgr2aRnhiteIADy8WrlxFqw_erDiQ1OPCM=452" rel="noopener noreferrer" style="color: #0000EE; text-decoration: underline;" target="_blank"><strong>Inc.'s Best Bootstrapped businesses</strong></a> of 2025.
</div>
<br>
<div class="text-block">
If you have any comments or feedback, just respond to this email!
<br>
<br> Thanks for reading,
<br>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linkedin.com%2Fin%2Fjoelvanveluwen%2F/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/tK1a3JiUkFIv0XjTc1sUJ_pcYfysMVS7i2Iusfa-OZg=452"><span>Joel Van Veluwen</span></a>, <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linkedin.com%2Fin%2Fjennytzurueyching%2F/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/Pj9lF5qU_-DvH-8wpbzabGAeu-T5qubcp7OzX5R_d6M=452"><span>Tzu-Ruey Ching</span></a> & <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linkedin.com%2Fin%2Fremi-turpaud%2F/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/umapUOAGaoNq4T8g4W0Ep58MTY6R7pIIKG3DtzzDyPA=452"><span>Remi Turpaud</span></a>
<br>
<br>
</div>
<br>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block" id="testing-id">
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Ftldr.tech%2Fdata%2Fmanage%3Femail=silk.theater.56%2540fwdnl.com/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/BTZlbLd9qUs2p5TXQ79RQyye_Ef5qVR_rZrmeCfrDGM=452">Manage your subscriptions</a> to our other newsletters on tech, startups, and programming. Or if TLDR Data isn't for you, please <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fa.tldrnewsletter.com%2Funsubscribe%3Fep=1%26l=037ede50-92cc-11ee-b0f2-b761aa2217ad%26lc=1670a604-84b7-11f0-bcf5-55fc1d40139c%26p=7f007f30-6ae1-11f1-8139-8b6863562637%26pt=campaign%26pv=4%26spa=1781776840%26t=1781777301%26s=91d65fc742c96a1b995c14accdce91d329d2e8042aca2041e5732a4c0acce6ea/1/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/8qwI6fKGrVoP4MKdGlzM64WUIYnitLTHs-PJ6szVZLE=452">unsubscribe</a>.
<br>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
</td></tr></tbody></table>
</td></tr></tbody></table>
</td></tr></tbody></table>
<img alt="" src="http://tracking.tldrnewsletter.com/CI0/0100019eda33ff6a-d0d5ce4f-c777-45d5-9083-fb434bd3b3a5-000000/0SQaQYF311AyvsoHmIoyxFfJF0BYQO9bpuVZWY7Hpb0=452" style="display: none; width: 1px; height: 1px;">
</body></html>