<!DOCTYPE html><html lang="en"><head><meta http-equiv="Content-Type" content="text/html; charset=UTF-8"><meta charset="UTF-8"><meta name="viewport" content="width=device-width"><meta name="x-apple-disable-message-reformatting"><title>TLDR Data</title><meta name="color-scheme" content="light dark"><meta name="supported-color-schemes" content="light dark"><style type="text/css">
/* Declare that the document supports both light and dark colour schemes. */
:root {
  color-scheme: light dark;
  supported-color-schemes: light dark;
}

/* Border-box sizing for every element and its :before/:after content. */
*, *:after, *:before {
  -webkit-box-sizing: border-box;
  -moz-box-sizing: border-box;
  box-sizing: border-box;
}

/* Keep text-size adjustment fixed at 100% on every element. */
* {
  -ms-text-size-adjust: 100%;
  -webkit-text-size-adjust: 100%;
}

/* The root, the body and the outer .document table fill the viewport. */
html, body, .document {
  width: 100% !important;
  height: 100% !important;
  margin: 0;
  padding: 0;
}

/* Font-rendering hints for the body text. */
body {
  -webkit-font-smoothing: antialiased;
  -moz-osx-font-smoothing: grayscale;
  text-rendering: optimizeLegibility;
}

/* Remove the margin from any div whose inline style contains
   "margin: 16px 0" (presumably a wrapper injected by a mail client;
   TODO confirm which one). */
div[style*="margin: 16px 0"] {
  margin: 0 !important;
}

/* Zero the mso-* table side spacing on tables and cells. */
table, td {
  mso-table-lspace: 0pt;
  mso-table-rspace: 0pt;
}

/* Tables: collapsed borders, fixed layout, horizontally centred. */
table {
  border-spacing: 0;
  border-collapse: collapse;
  table-layout: fixed;
  margin: 0 auto;
}

/* Images never exceed their container and carry no border. */
img {
  -ms-interpolation-mode: bicubic;
  max-width: 100%;
  border: 0;
}

/* Elements carrying an x-apple-data-detectors attribute keep the
   surrounding text colour and lose their underline. */
*[x-apple-data-detectors] {
  color: inherit !important;
  text-decoration: none !important;
}

/* Same idea for the .x-gmail-data-detectors / .aBn hooks (class names
   look like Gmail's auto-detected links; verify before relying on it). */
.x-gmail-data-detectors, .x-gmail-data-detectors *, .aBn {
  border-bottom: 0 !important;
  cursor: default !important;
}

/* Buttons animate every property change over 200ms. */
.btn {
  -webkit-transition: all 200ms ease;
  transition: all 200ms ease;
}

/* Hovered buttons switch fill and border to the same colour. */
.btn:hover {
  background-color: #f67575;
  border-color: #f67575;
}

/* Base typography, applied to every element (headings included). */
* {
  font-family: Arial, Helvetica, sans-serif;
  font-size: 18px;
}

/* Screens up to 600px wide: fluid container, stacked columns and
   full-width, centred buttons. */
@media screen and (max-width: 600px) {
  .container {
    width: 100%;
    margin: auto;
  }

  .stack {
    display: block !important;
    width: 100% !important;
    max-width: 100% !important;
  }

  .btn {
    display: block;
    width: 100%;
    text-align: center;
  }
}

/* Default (light) palette, forced with !important on all text and
   layout elements. */
body, p, td, tr, .body, table,
h1, h2, h3, h4, h5, h6,
div, span {
  background-color: #FEFEFE !important;
  color: #010101 !important;
}

/* Dark palette: same selector list, swapped colours. */
@media (prefers-color-scheme: dark) {
  body, p, td, tr, .body, table,
  h1, h2, h3, h4, h5, h6,
  div, span {
    background-color: #27292D !important;
    color: #FEFEFE !important;
  }
}

/* Links take the surrounding text colour and are always underlined.
   Being !important, this wins over inline link colours that are not
   themselves marked !important. */
a {
  color: inherit !important;
  text-decoration: underline !important;
}
</style><!--[if mso | ie]>
<style type="text/css">
  /* This block sits inside the surrounding [if mso | ie] conditional
     comment, so it is only seen by clients that honour that condition.
     Links get explicit colours here instead of inheriting them. */
  a {
    background-color: #FEFEFE !important;
    color: #010101 !important;
  }

  /* Dark palette for the same links. */
  @media (prefers-color-scheme: dark) {
    a {
      background-color: #27292D !important;
      color: #FEFEFE !important;
    }
  }
</style>
<![endif]--></head><body class="">
<div style="display: none; max-height: 0px; overflow: hidden;">Omnigent is an open-source meta-harness that makes agents like Claude Code, Codex, Pi, and custom agents work together through one shared layer β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β β </div>
<div style="display: none; max-height: 0px; overflow: hidden;">
<br>
</div>
<table align="center" class="document"><tbody><tr><td valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" class="container" width="600"><tbody><tr class="inner-body"><td>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr class="header"><td bgcolor="" class="container">
<table width="100%"><tbody><tr><td class="container">
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" style="margin-top: 0px;" width="100%"><tbody><tr><td style="padding: 0px;">
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div style="text-align: center;">
<span style="margin-right: 0px;"><a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Ftldr.tech%2Fdata%3Futm_source=tldrdata/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/1j6VunLYA3aw90M8JKqtOFlFsvQPkeb7lZ9OcHFuN2w=452" rel="noopener noreferrer" target="_blank"><span>Sign Up</span></a>
|<span style="margin-right: 2px; margin-left: 2px;"><a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fadvertise.tldr.tech%3Futm_source=tldrdata%26utm_medium=newsletter%26utm_campaign=advertisetopnav/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/e29CnMyqW1NQDKDe25GjVe6h5wb3hIA84KxkyLjN2W4=452" rel="noopener noreferrer" target="_blank"><span>Advertise</span></a></span>|<span style="margin-left: 2px;"><a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fa.tldrnewsletter.com%2Fweb-version%3Fep=1%26lc=1670a604-84b7-11f0-bcf5-55fc1d40139c%26p=1a2815ca-6873-11f1-8df6-efa7c1aecb22%26pt=campaign%26t=1781518078%26s=4d33175c53830dde8cd56bf727e9dc68d4b5c655b91f7ac2b76e29cc8efb6b4c/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/0PYW7yCBJtx1wHY2Uva_7th4RF4ki4ehvmxrceIBpW0=452"><span>View Online</span></a></span>
<br>
</span></div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="text-align: center;"><span data-darkreader-inline-color="" style="--darkreader-inline-color:#3db3ff; color: rgb(51, 175, 255) !important; font-size: 30px;">T</span><span style="font-size: 30px;"><span data-darkreader-inline-color="" style="color: rgb(232, 192, 96) !important; --darkreader-inline-color:#e8c163; font-size:30px;">L</span><span data-darkreader-inline-color="" style="color: rgb(101, 195, 173) !important; --darkreader-inline-color:#6ec7b2; font-size:30px;">D</span></span><span data-darkreader-inline-color="" style="--darkreader-inline-color:#dd6e6e; color: rgb(220, 107, 107) !important; font-size: 30px;">R</span>
<br>
</td></tr></tbody></table>
<br>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody></tbody></table>
<table style="table-layout: fixed; width:100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;">
<div style="text-align: center;">
<h1><strong>TLDR Data <span id="date">2026-06-15</span></strong></h1>
</div>
</td></tr></tbody></table>
<table style="table-layout: fixed; width:100%;" width="100%"><tbody></tbody></table>
</td></tr></tbody></table>
</td></tr></tbody></table>
</td></tr>
<tr bgcolor=""><td class="container">
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td style="padding: 0px;">
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">📱</span></div></div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;">
<h1><strong>Deep Dives</strong></h1>
</div>
</div>
</td></tr></tbody></table>
<table style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linkedin.com%2Fblog%2Fengineering%2Fai%2Fsemantic-search-for-ai-agents-at-scale-retrieval-and-ranking-for-linkedins-hiring-assistant%3Futm_source=tldrdata/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/M77AZroQtWXgETt8TVLdBGhUQQ_oWNR33a2M-zzxxqA=452">
<span>
<strong>Semantic Search for AI Agents at Scale: Retrieval and Ranking for LinkedIn's Hiring Assistant (15 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
LinkedIn built MUSE (Member Understanding Semantic Embeddings) to power semantic search inside Hiring Assistant. It uses a dual-tower Matryoshka embedding model trained on millions of high-quality labels from an LLM Teacher grounded in product policy, combining embedding-based retrieval with a downstream engagement-optimized ranker.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fengineering.atspotify.com%2F2026%2F6%2Fencoding-your-domain-expert-the-context-layer-behind-spotifys-data-assistant%2F%3Futm_source=tldrdata/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/oArUnU_TmVTVgTU3CWwu8ObEEXA7WnDxOOpUzaKq-xo=452">
<span>
<strong>Encoding Your Domain Expert: The Context Layer Behind Spotify's Data Assistant (6 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Spotify built Vedder, an AI data assistant for 2,100+ users across 177 clusters, to move beyond schema-only RAG across 70,000 datasets. Domain experts curate each cluster with datasets, vetted question-SQL pairs, and business docs. Only 12.5% of mined query pairs were accepted, so health scoring tracks drift, validity, coverage, and reproducibility to keep context reliable.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.junaideffendi.com%2Fp%2Fhow-feldera-works-a-true-incremental%3Futm_source=tldrdata/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/yQ4DZ45Ocj4yTJ5V62xtYD64JMhO_4-RCgfZswGLds8=452">
<span>
<strong>How Feldera Works: A True Incremental View Maintenance Engine (3 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Feldera treats streams as incremental SQL views, using DBSP to propagate deltas instead of recomputing joins and aggregations. Inserts, deletes, and updates become Z-set changes, so only affected rows are updated. The result is batch-SQL-like semantics for continuous pipelines with lower CPU, less memory pressure, and predictable latency.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">🚀</span></div>
</div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;">
<h1><strong>Opinions & Advice</strong></h1>
</div>
</div>
</td></tr></tbody></table>
<table style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fsnscratchpad.com%2Fposts%2Ffrontier-ecosystem%2F%3Futm_source=tldrdata/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/QGZqq31c66XXHT1H3AAKGqXNQZhB2u4DzM81p4g0bHk=452">
<span>
<strong>A frontier without an ecosystem is not stable (4 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Companies need to compound human expertise and AI capability, not just rely on the best model. By owning their workflows, evals, and institutional knowledge, firms can keep improving while avoiding a future where all value flows to a few frontier models.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwesmckinney.com%2Fblog%2Fmythical-agent-month%2F%3Futm_source=tldrdata/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/0XjDh17ruUe2uT_OHU7O-qrIow1-qP3caENiIhJLuUs=452">
<span>
<strong>The Mythical Agent-Month (10 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
AI coding agents reduce coding labor, but not the hardest parts of software: design judgment, scope control, testing, and maintainability. They reduce accidental complexity, but can create technical debt, architectural drift, and bloated codebases at machine speed. The edge shifts to experts who can steer the model, say no, and keep systems production-ready.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fcockroachlabs.com%2Fblog%2Fagentic-ai-costs-at-scale%3Futm_source=tldrdata/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/n0Qh-xEji8ZhY-YdtsHc2I6ooRghmdAFAfsfyS6S1mQ=452">
<span>
<strong>The Bill Arrives: How to Manage Agentic AI Costs at Scale (17 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Uber's AI budget blowout shows agentic AI is a task-economics problem, not a token-pricing problem. Claude Code adoption hit 84% across 5,000 engineers, exhausting the annual AI budget by mid-April. With spend hidden in re-sent context, retrieval, orchestration, governance, and retries, teams need to measure value per task, control context, and build stateful agent infrastructure.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">💻</span></div>
</div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;">
<h1><strong>Launches & Tools</strong></h1>
</div>
</div>
</td></tr></tbody></table>
<table style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="http://tracking.tldrnewsletter.com/CL0/http:%2F%2Fwww.matia.io%2Fwebinars-events%2Funified-data-ops%3Futm_source=TLDR%2520campaign%26utm_medium=media%26utm_campaign=newsletter%26utm_content=webinar/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/IImcY7x5D95Ssc8ST_XlX7H5kw5OnmHkG0r6Q90bzp0=452">
<span>
<strong>Join renowned data strategist Doug Laney and Matia CEO Benjamin Segal for a discussion on the future of the data stack. (Sponsor)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Your data stack is held together with duct tape. You know it. Your team knows it. <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.matia.io%2Fwebinars-events%2Funified-data-ops%3Futm_source=TLDR%2520campaign%26utm_medium=media%26utm_campaign=newsletter%26utm_content=webinar/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/WE_gee__7Iyd2DWAjQWjV1BUlX0mjrSxE9rcTaw1lYo=452" rel="noopener noreferrer nofollow" target="_blank"><span>On June 24th,</span></a> Matia CEO Benjamin Segal and Doug Laney, author of <em>Infonomics</em> and <em>Data Juice</em>, are doing a live fireside on what comes next.
<br>
<br><a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.matia.io%2Fwebinars-events%2Funified-data-ops%3Futm_source=TLDR%2520campaign%26utm_medium=media%26utm_campaign=newsletter%26utm_content=webinar/2/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/SpYpSTEkuw5KXCfPXZfx7QciiZjlJ1MOAOiwx6uyEJ8=452" rel="noopener noreferrer nofollow" target="_blank"><span>Register now→</span></a>
<br>
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.databricks.com%2Fblog%2Fintroducing-omnigent-meta-harness-combine-control-and-share-your-agents%3Futm_source=tldrdata/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/RKUoeXLGEjLhaSwT7HRhyKNvlHm5O6e774zMNQgrWJ8=452">
<span>
<strong>Introducing Omnigent: A Meta-Harness to Combine, Control, and Share Your Agents (7 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Omnigent is an open-source Databricks meta-harness that makes agents like Claude Code, Codex, Pi, and custom agents work together through one shared layer. It helps teams compose agents, add security and cost controls, share live sessions, and keep workflows portable as tools change.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fmotherduck.com%2Fblog%2Fflights-agent-native-ingest%2F%3Futm_source=tldrdata/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/snh4nsXQmupnHkx9pFxzz4yvMoI6SwIiWlFxjpU3v4o=452">
<span>
<strong>Introducing Flights: Agent-Native Ingest in MotherDuck (4 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Flights is MotherDuck's new agent-native data pipeline feature that lets AI agents easily build, run, and schedule ingestion and transformation workloads using a secure, general-purpose Python runtime. It has native support for dlt pipelines, direct DuckDB execution, logging, scheduling, and versioning. Agents can create Flights via MCP server, SQL table functions, or the UI.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fdatafusion.apache.org%2Fblog%2F2026%2F06%2F12%2Fdatafusion-54.0.0%3Futm_source=tldrdata/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/J4QnPkPD1Uy0LEe0NHvDeXOQdoUTFWzPPL3wC7U3fjY=452">
<span>
<strong>Apache DataFusion 54.0.0 Released (7 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Apache DataFusion 54.0.0 adds major SQL upgrades, including LATERAL joins, SQL lambda functions for arrays, a new Arrow-based Avro reader, and spill-to-disk for memory-heavy nested loop joins. Performance also jumps, with near-unique LEFT/FULL sort-merge joins up to 20–50× faster and repartition-heavy operations improving by up to 50%.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">🎁</span></div></div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><h1><strong>Miscellaneous</strong></h1></div>
</div>
</td></tr></tbody></table>
<table bgcolor="" style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fxebia.com%2Fblog%2Fhidden-cost-ai-parse-document-production-databricks%2F%3Futm_source=tldrdata/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/1azjDcTNtqjIUAuq2hUHFEkKH-jkIKdmZBe3kNNrG44=452">
<span>
<strong>The Hidden Cost of ai_parse_document in Production (10 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Databricks' ai_parse_document + ai_query can turn messy PDFs into structured JSON in a few SQL lines, but the challenge is reliability at scale. Every rerun reopens parsing and LLM costs, corrected documents can create duplicates, and even temperature 0 still produces non-deterministic outputs that undermine auditability. A pipeline design with checkpoints, versioned prompts, and deduplication reduces reprocessing cost and improves reproducibility. Deterministic parsers like OpenDataLoader PDF are more appropriate when document templates are consistent.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linuxfoundation.org%2Fpress%2Flinux-foundation-announces-opensharing-project-to-standardize-ai-asset-and-data-exchange%3Futm_source=tldrdata/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/hXXkiFlpU-9fPWWqKVrWmqAwzFH9DzFPWBncmcxPuJA=452">
<span>
<strong>Linux Foundation Announces OpenSharing Project to Standardize AI Asset and Data Exchange (4 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Databricks has handed the Delta Sharing protocol over to the Linux Foundation. OpenSharing extends Delta Sharing to AI models, agent skills, and unstructured data across clouds and platforms. It adds standard APIs for discovery, authorization, and access, with support for existing Delta Sharing recipients plus Apache Iceberg/REST Catalog clients. The project aims to replace proprietary marketplaces with a single standard for enterprise AI asset distribution.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;"><span style="font-size: 36px;">⚡</span></div></div>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding-top: 0px; padding-bottom: 0px;">
<div class="text-block">
<div style="text-align: center;">
<h1><strong>Quick Links</strong></h1>
</div>
</div>
</td></tr></tbody></table>
<table bgcolor="" style="table-layout: fixed; width: 100%;" width="100%"><tbody><tr><td style="padding:0;border-collapse:collapse;border-spacing:0;margin:0;" valign="top">
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fresearch.google%2Fblog%2Fnew-framework-for-auditing-machine-unlearning%2F%3Futm_source=tldrdata/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/NyCCxFZ0kRrZ7ogIbf9blaY1A9I6jp30gFywerhmmqI=452">
<span>
<strong>New framework for auditing machine unlearning (6 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
Google Research introduced Regularized f-Divergence Kernel Tests to audit machine unlearning and privacy leakage more reliably than standard two-sample tests.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.kdnuggets.com%2Ffeature-stores-from-scratch-a-minimal-working-implementation%3Futm_source=tldrdata/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/trFRxWmP6VBmrrwJSgxhZ2_Nv83hz0835Oi0dSa1bRw=452">
<span>
<strong>Feature Stores from Scratch: A Minimal Working Implementation (5 minute read)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
DuckDB + Redis deliver a five-component DIY feature store that avoids training-serving skew for real-time ML and RAG systems.
</span>
</span>
</div>
</td></tr></tbody></table>
<table align="center" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block">
<span>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fsqltoerdiagram.com%2F%3Futm_source=tldrdata/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/OW_Ko7GrSbhDGmf-iabnuYU_Ry4dPdX1rcBUV1QlQHs=452">
<span>
<strong>SQL to ER Diagram (Tool)</strong>
</span>
</a>
<br>
<br>
<span style="font-family: 'Helvetica Neue', Helvetica, Arial, Verdana, sans-serif;">
SQL to ER Diagram is a free, open source, browser-only tool that turns pasted SQL schemas into clean, interactive ER diagrams without uploading your data or requiring signup.
</span>
</span>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td align="left" style="word-break: break-word; vertical-align: top; padding: 5px 10px;">
<p style="padding: 0; margin: 0; font-size: 22px; color: #000000; line-height: 1.6; font-weight: bold;">
Want to advertise in TLDR? 📰
</p>
<div class="text-block" style="margin-top: 10px;">
If your company is interested in reaching an audience of data engineering professionals and decision makers, you may want to <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fadvertise.tldr.tech%2F%3Futm_source=tldrdata%26utm_medium=newsletter%26utm_campaign=advertisecta/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/KlxJi-25lC91bqNypyPQ91X5IUUYJwdAIp1FwH_GQdg=452"><strong><span>advertise with us</span></strong></a>.
</div>
<br>
<!-- New "Want to work at TLDR?" section -->
<p style="padding: 0; margin: 0; font-size: 22px; color: #000000; line-height: 1.6; font-weight: bold;">
Want to work at TLDR? 💼
</p>
<div class="text-block" style="margin-top: 10px;">
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fjobs.ashbyhq.com%2Ftldr.tech/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/aHf64cvgA3TDoPpWoiRrCMxnPu8dNVsr8OmEk8NjogA=452" rel="noopener noreferrer" style="color: #0000EE; text-decoration: underline;" target="_blank"><strong>Apply here</strong></a>,
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fjobs.ashbyhq.com%2Ftldr.tech%2Fc227b917-a6a4-40ce-8950-d3e165357871/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/2OefDmDMw770uYBzqhm3EFsoZaaEHNPVsTWgOEmK_sk=452" rel="noopener noreferrer" style="color: #0000EE; text-decoration: underline;" target="_blank"><strong>create your own role</strong></a> or send a friend's resume to <a href="mailto:jobs@tldr.tech" style="color: #0000EE; text-decoration: underline;">jobs@tldr.tech</a> and get $1k if we hire them! TLDR is one of <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linkedin.com%2Ffeed%2Fupdate%2Furn:li:activity:7401699691039830016%2F/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/5JVLKVF8ZflyEgkc94NzHofhLkwYU54OjbdynKt6ZwE=452" rel="noopener noreferrer" style="color: #0000EE; text-decoration: underline;" target="_blank"><strong>Inc.'s Best Bootstrapped businesses</strong></a> of 2025.
</div>
<br>
<div class="text-block">
If you have any comments or feedback, just respond to this email!
<br>
<br> Thanks for reading,
<br>
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linkedin.com%2Fin%2Fjoelvanveluwen%2F/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/2OTzBi2BaXCS3GzqNqiyxpFpCuQj1esh_Amugbwlg1E=452"><span>Joel Van Veluwen</span></a>, <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linkedin.com%2Fin%2Fjennytzurueyching%2F/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/y-224aIseO5Cop6QaLHrb7APS4MfyRQblZRtFEyKp2I=452"><span>Tzu-Ruey Ching</span></a> & <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fwww.linkedin.com%2Fin%2Fremi-turpaud%2F/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/oBrMhqF-l4DEad2SAmxHOx56Yrgy_2mrtYiJAge44j4=452"><span>Remi Turpaud</span></a>
<br>
<br>
</div>
<br>
</td></tr></tbody></table>
<table align="center" bgcolor="" border="0" cellpadding="0" cellspacing="0" width="100%"><tbody><tr><td class="container" style="padding: 15px 15px;">
<div class="text-block" id="testing-id">
<a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Ftldr.tech%2Fdata%2Fmanage%3Femail=silk.theater.56%2540fwdnl.com/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/WfUMzDeF7MklbZeu8fbsCdMaFkJWVnCQ56hS0dyV0do=452">Manage your subscriptions</a> to our other newsletters on tech, startups, and programming. Or if TLDR Data isn't for you, please <a href="https://tracking.tldrnewsletter.com/CL0/https:%2F%2Fa.tldrnewsletter.com%2Funsubscribe%3Fep=1%26l=037ede50-92cc-11ee-b0f2-b761aa2217ad%26lc=1670a604-84b7-11f0-bcf5-55fc1d40139c%26p=1a2815ca-6873-11f1-8df6-efa7c1aecb22%26pt=campaign%26pv=4%26spa=1781517623%26t=1781518078%26s=63480ac0e975be3eb790ec0e6bdb1d939ba620f16c5de8282a70305900cb638b/1/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/Eb55FZHI6j1raxMmINGXac20hxTr0P6BXml9eoVqhes=452">unsubscribe</a>.
<br>
</div>
</td></tr></tbody></table>
</td></tr></tbody></table>
</td></tr></tbody></table>
</td></tr></tbody></table>
</td></tr></tbody></table>
<img alt="" src="http://tracking.tldrnewsletter.com/CI0/0100019ecac091a5-45125e20-eaf4-4eef-9671-23cd85faccc2-000000/6U5bLS7I6HwT9GLEroOCngZmeuYxDf_bKef_FYRiTUo=452" style="display: none; width: 1px; height: 1px;">
</body></html>