<?xml version="1.0" encoding="UTF-8"?><rss xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:atom="http://www.w3.org/2005/Atom" version="2.0" xmlns:itunes="http://www.itunes.com/dtds/podcast-1.0.dtd" xmlns:googleplay="http://www.google.com/schemas/play-podcasts/1.0"><channel><title><![CDATA[Data Science Weekly Newsletter]]></title><description><![CDATA[In-depth look at the Data Science / Machine Learning / AI / Data Engineering world.]]></description><link>https://datascienceweekly.substack.com</link><image><url>https://substackcdn.com/image/fetch/$s_!I8ji!,w_256,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3294ef46-cb03-42ea-b7d6-9f8e8b0f41f6_253x253.png</url><title>Data Science Weekly Newsletter</title><link>https://datascienceweekly.substack.com</link></image><generator>Substack</generator><lastBuildDate>Sat, 20 Jun 2026 14:28:23 GMT</lastBuildDate><atom:link href="https://datascienceweekly.substack.com/feed" rel="self" type="application/rss+xml"/><copyright><![CDATA[datascienceweekly.org, a service of DATAYOU, LLC]]></copyright><language><![CDATA[en]]></language><webMaster><![CDATA[datascienceweekly@substack.com]]></webMaster><itunes:owner><itunes:email><![CDATA[datascienceweekly@substack.com]]></itunes:email><itunes:name><![CDATA[Data Science Weekly]]></itunes:name></itunes:owner><itunes:author><![CDATA[Data Science Weekly]]></itunes:author><googleplay:owner><![CDATA[datascienceweekly@substack.com]]></googleplay:owner><googleplay:email><![CDATA[datascienceweekly@substack.com]]></googleplay:email><googleplay:author><![CDATA[Data Science Weekly]]></googleplay:author><itunes:block><![CDATA[Yes]]></itunes:block><item><title><![CDATA[Data Science Weekly - Issue 656]]></title><description><![CDATA[Curated news, articles and jobs related to Data Science, AI, & Machine Learning]]></description><link>https://datascienceweekly.substack.com/p/data-science-weekly-issue-656</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/data-science-weekly-issue-656</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Thu, 18 Jun 2026 23:25:29 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!eFK_!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bfa9a21-0ac9-4482-a3b4-0c9c507fe6f4_1148x716.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!byfl!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" width="319" height="253" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/17becea5-db12-4465-be92-858de78b9137_319x253.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:253,&quot;width&quot;:319,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;Data Science Weekly&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="Data Science Weekly" title="Data Science Weekly" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2><strong>Issue #656<br>June 18, 2026<br></strong></h2><div><hr></div><p>Hello!</p><p><strong>Once a week, we write this email to share the links we thought were worth sharing in the Data Science, ML, AI, Data Visualization, and ML/Data Engineering worlds.</strong></p><div><hr></div><p><em><strong>And now&#8230;let&#8217;s dive into some interesting links from this week.</strong></em></p><div><hr></div><h2><strong>Editor's Picks<br></strong></h2><ul><li><p><strong><a href="https://sqltoerdiagram.com/">Free SQL&#8594;ER diagram tool, runs in the browser, nothing uploaded</a><br></strong>Paste a SQL schema (CREATE TABLE statements) &#8594; get a clean, interactive ER diagram. Open source and 100% local &#8212; it runs entirely in your browser, so your schema never leaves your machine. No server, no signup, no upload&#8230;</p></li></ul><ul><li><p><strong><a href="https://osf.io/preprints/psyarxiv/qpj6n_v2">Preschoolers search semantic networks in a broader and more variable way than adults: Implications for hypothesis generation</a></strong><br>We find that adults show greater dependencies between sequential guesses than preschoolers, and generate a less diverse set of options. These findings may support the idea that development can be viewed as analogous to simulated annealing strategies in machine learning that start &#8220;hot&#8221; (in early childhood), generating wider and more variable searches, and eventually cool (in adulthood) to generate narrower searches&#8230;</p><p></p></li><li><p><strong><a href="https://rworks.dev/posts/too-many-R-packages/">New CRAN Packages: signal or noise?</a></strong><br>CRAN continues to be the most accessible repository for statistical knowledge on the planet, and the number of new packages being accepted by CRAN is growing faster than ever. But, is the R community really benefiting from this new growth?&#8230;</p></li></ul><div><hr></div><h1><strong>What&#8217;s on your mind</strong></h1><h2>This Week&#8217;s Poll:</h2><div class="poll-embed" data-attrs="{&quot;id&quot;:612414}" data-component-name="PollToDOM"></div><p>.</p><h2>Last Week&#8217;s Poll:</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!eFK_!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bfa9a21-0ac9-4482-a3b4-0c9c507fe6f4_1148x716.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!eFK_!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bfa9a21-0ac9-4482-a3b4-0c9c507fe6f4_1148x716.png 424w, https://substackcdn.com/image/fetch/$s_!eFK_!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bfa9a21-0ac9-4482-a3b4-0c9c507fe6f4_1148x716.png 848w, https://substackcdn.com/image/fetch/$s_!eFK_!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bfa9a21-0ac9-4482-a3b4-0c9c507fe6f4_1148x716.png 1272w, https://substackcdn.com/image/fetch/$s_!eFK_!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bfa9a21-0ac9-4482-a3b4-0c9c507fe6f4_1148x716.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!eFK_!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bfa9a21-0ac9-4482-a3b4-0c9c507fe6f4_1148x716.png" width="633" height="394.7979094076655" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/6bfa9a21-0ac9-4482-a3b4-0c9c507fe6f4_1148x716.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:716,&quot;width&quot;:1148,&quot;resizeWidth&quot;:633,&quot;bytes&quot;:81496,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://datascienceweekly.substack.com/i/202651355?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bfa9a21-0ac9-4482-a3b4-0c9c507fe6f4_1148x716.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!eFK_!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bfa9a21-0ac9-4482-a3b4-0c9c507fe6f4_1148x716.png 424w, https://substackcdn.com/image/fetch/$s_!eFK_!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bfa9a21-0ac9-4482-a3b4-0c9c507fe6f4_1148x716.png 848w, https://substackcdn.com/image/fetch/$s_!eFK_!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bfa9a21-0ac9-4482-a3b4-0c9c507fe6f4_1148x716.png 1272w, https://substackcdn.com/image/fetch/$s_!eFK_!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bfa9a21-0ac9-4482-a3b4-0c9c507fe6f4_1148x716.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>.</p><div><hr></div><h2>Data Science Articles &amp; Videos</h2><p></p><ul><li><p><strong><a href="https://shonczinner.github.io/posts/embedding-prediction/">The 90-year-old idea behind JEPA models: Canonical Correlation Analysis (CCA)</a></strong><br>Harold Hotelling&#8217;s 1936 Canonical Correlation Analysis (CCA) [modern terminology, &#8220;CCA is used to find a common signal among two large matrices&#8221;] forms the theoretical and intuitive foundation for modern embedding prediction techniques, including JEPA models&#8230;<br></p></li><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1u7upnm/2026_tech_stack_at_your_job/">2026 Data Science Tech Stack at your Job [Reddit]</a></strong></p><p>What is your current tech stack at your job?</p><p></p></li><li><p><strong><a href="https://interlatent.com/blog/interlatent-robotics-hardware-guide">A Beginner&#8217;s Guide to Robotics Hardware</a><br></strong>Building an open-source robot begins in a way that is familiar to assembling IKEA furniture&#8230;The similarity ends once the robot is powered on. A bookshelf is designed to stay exactly as assembled, whereas a robot has to move while remaining correct about its own position and the state of its surroundings&#8230;When designing and building robots, this need for correctness both numerically and temporally is a key consideration&#8230;The rest of this post looks at how that difference manifests, using a common framing in robotics that divides the hardware into three parts: the movement, the body, and the sensor&#8230;<br></p></li><li><p><strong><a href="https://www.youtube.com/playlist?list=PLGVZCDnMOq0rFQykYJg7t441AEpN4SszE">PyData London 2026 Talks</a><br></strong>All the talks from the PyData London 2026 are now available&#8230;<br></p></li><li><p><strong><a href="https://www.ssp.sh/brain/data-engineering-acquisitions/">Data Engineering Acquisitions (2022-2026)</a></strong></p><p>Consolidation in the Data Engineering market is happening quickly. Tools from the Modern Data Stack get unified into bigger Data Platforms. This note highlights the latest acquisitions across data engineering. It serves as an overview of the latest consolidations. Find attached the acquisition overview from 2022 to today&#8230;<br></p></li><li><p><strong><a href="https://apenwarr.ca/log/20260531">The software industry: annealing, but wrong</a></strong><br>In recent months I&#8217;ve heard of several teams with an interesting policy: each pull request should be no more than a few files, and no more than a certain number of lines (say 500). And do just one thing and do it well. And be easy for a human to review. And be fully tested by the test suite&#8230;And often, the results are good. Sure, splitting a single 6000-line feature or fix into twelve 500-line PRs is more work, but each of those PRs is surely easier to review. And you can git bisect them when there&#8217;s a bug! And maybe revert the individual change that broke something. ...and also cause 12x as many context switches for your reviewers as they review each one sequentially. But that&#8217;s just the cost of software quality! Right?&#8230;<code><br></code></p></li><li><p><strong><a href="https://www.sharonlohr.com/blog/2026/6/10/ai-and-sampling-problems">AI and Survey Sampling Problems</a><br></strong>My previous post discussed the performance of the artificial intelligence (AI) interface Gemini on undergraduate statistics problems. Now let&#8217;s look at how Gemini answers some of the problems in my sampling textbook (Lohr, 2022), and talk about how Gemini could help students learn sampling&#8230;<br></p></li><li><p><strong><a href="https://jakubsobolewski.com/blog/test-doubles-taxonomy/">Test Doubles Taxonomy for R: Dummy, Stub, Spy, Mock, Fake</a><br></strong>You might call them all &#8220;mock&#8221;&#8230;Mock the database. Mock the API. Mock the function. The word becomes a catch-all for any test double, any object you substitute for a real dependency in a test. Lumping them together makes it harder to choose the right tool, and the wrong choice leads to brittle, misleading tests. There are five distinct types, each with a specific job. Knowing which is which is how you stop writing tests that do the wrong thing&#8230;<br></p></li><li><p><strong><a href="https://iquilezles.org/articles/fbm/">Fractional Brownian Motion</a></strong></p><p>A Brownian Motion (BM), without the &#8220;fractional&#8221; part, is a motion where the position of a given object over time changes in random increments&#8230;A Fractional Brownian Motion is a similar process in which the increments are not completely independent from each other, but there&#8217;s some sort of memory to the process&#8230;I believe fBM is not necessarily a well understood mechanism. So this article describes how it functions and their different spectral and visual characteristics for various values of their main parameter H, backed with some experiments and measurements&#8230;<br></p></li><li><p><strong><a href="https://vickiboykis.com/2026/06/15/running-local-models-is-good-now/">Running local models is good now</a></strong><br>I&#8217;ve been working with local models since they came out, and finally, they&#8217;re surprisingly good now&#8230;<br></p></li><li><p><strong><a href="https://jakubsobolewski.com/blog/snapshot-testing-beyond-screenshots/">Snapshot Testing in R: Beyond Screenshots</a></strong></p><p>In this post I want to walk through using snapshot testing for what it is good for, and the practices that make it efficient&#8230;<br></p></li><li><p><strong><a href="https://www.reddit.com/r/AskProgramming/comments/1u5lbig/what_algorithm_is_surprisingly_new/">What algorithm is surprisingly new? [Reddit]</a><br></strong>Other than any AI stuff, I&#8217;m talking about the types of algorithms you learn about in any standard Data Structures and Algorithms University course&#8230;I&#8217;m surprised that alot of these algorithms were actually invented HUNDREDS of years ago&#8230;<br></p></li><li><p><strong><a href="https://arxiv.org/abs/2606.02184">The Ghost Couple: Correlated LLM Name Priors and Their Haunting of the Web and Academic Publishing</a><br></strong>These names do not exist. Elena Vasquez and Marcus Chen have appeared as volcano experts, astronauts, thriller protagonists, podcast hosts, and academic co-authors across hundreds of independently produced AI-generated documents, never having lived. We show that llms do not merely default to high-probability individual names when generating fictional experts: they produce correlated character ensembles, pairs and trios whose co-occurrence rates far exceed chance and are consistent across independent generations. These priors are model-family-specific (Claude: Elena Vasquez + Marcus Chen + Amara Okafor; Gemini: Aris Thorne + Lena Petrova; GPT: Elara Voss with no fixed partner)&#8230;</p></li></ul><p>.</p><div><hr></div><h2>Last Week's Newsletter's 3 Most Clicked Links</h2><ul><li><p><strong><a href="https://otexts.com/fpppy/">Forecasting: Principles and Practice, the Pythonic Way</a></strong></p></li><li><p><strong><a href="https://maxhalford.github.io/blog/solution-engineering-advice/">My unvarnished guide to solution engineering</a></strong></p></li><li><p><strong><a href="https://interlatent.com/blog/interlatent-modern-ai-robotics-first-principles">An Overview of Modern AI Robotics from First Principles</a></strong></p></li></ul><p>.<br>* Based on unique clicks.<br>** Please take a look at last week's issue #655 <a href="https://datascienceweekly.substack.com/p/data-science-weekly-issue-655">here</a>.</p><div><hr></div><h2>Cutting Room Floor</h2><ul><li><p><strong><a href="https://r-posts.com/2026-rousseeuw-prize-for-statistics-awarded-to-r-core-team-for-transforming-statistics-computing-worldwide/">2026 Rousseeuw Prize for Statistics Awarded to R Core Team for Transforming Statistics Computing Worldwide</a></strong></p></li><li><p><strong><a href="https://www.kenkoonwong.com/blog/aa1/">Learning Amino Acids Part 1: Non-Polar Amino Acids, Rodrigues Rotation, and Lennard-Jones Potential</a></strong></p></li><li><p><strong><a href="https://statmodeling.stat.columbia.edu/2026/06/18/gambling-provides-a-gentle-rocking-of-the-emotions-to-put-you-in-a-pleasant-baby-like-state/">Gambling provides a gentle rocking of the emotions to put you in a pleasant baby-like state</a></strong></p></li><li><p><strong><a href="https://statswithcats.net/2026/06/12/the-caitlin-clark-effect/">The Caitlin Clark Effect</a></strong></p></li><li><p><strong><a href="https://blog.janestreet.com/formal-methods-at-jane-street-index/">Formal methods and the future of programming</a></strong></p></li><li><p><strong><a href="https://john.soban.ski/polars2.html">Crunch Big Data on Your Laptop With Polars Streaming</a></strong></p></li></ul><p>.</p><div><hr></div><p>Thank you for joining us this week! :)</p><p>Stay Data Science-y!</p><p>All our best,<br>Hannah &amp; Sebastian</p><div><hr></div><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://datascienceweekly.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Data Science Weekly Newsletter is a reader-supported publication. To receive new posts and support our work, consider becoming a free or paid subscriber.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div>]]></content:encoded></item><item><title><![CDATA[Data Science Weekly - Issue 655]]></title><description><![CDATA[Curated news, articles and jobs related to Data Science, AI, & Machine Learning]]></description><link>https://datascienceweekly.substack.com/p/data-science-weekly-issue-655</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/data-science-weekly-issue-655</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Thu, 11 Jun 2026 22:25:19 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!FVg8!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a27a4d4-65ab-4318-8de5-ec2de8e962f7_1144x706.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!byfl!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" width="319" height="253" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/17becea5-db12-4465-be92-858de78b9137_319x253.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:253,&quot;width&quot;:319,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;Data Science Weekly&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="Data Science Weekly" title="Data Science Weekly" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2><strong>Issue #655<br>June 11, 2026<br></strong></h2><div><hr></div><p>Hello!</p><p><strong>Once a week, we write this email to share the links we thought were worth sharing in the Data Science, ML, AI, Data Visualization, and ML/Data Engineering worlds.</strong></p><div><hr></div><p><em><strong>And now&#8230;let&#8217;s dive into some interesting links from this week.</strong></em></p><div><hr></div><h2><strong>Editor's Picks<br></strong></h2><ul><li><p><strong><a href="https://interlatent.com/blog/interlatent-modern-ai-robotics-first-principles">An Overview of Modern AI Robotics from First Principles</a><br></strong>There is a deceptively simple way to describe what physical AI is all about, a way in which anyone with a STEM background will intuitively understand. Like all other AI models, a model which controls a robot is also a function. It takes in observations (camera pixels, joint angles, the felt resistance of a gripper, etc) and it outputs actions, the next set of positions and torques for its motors&#8230;If you&#8217;ve ever trained a model that maps inputs to outputs, you can already grasp the shape of the problem. The interesting part is what happens when you take this familiar shape and drop it into a moving, active world&#8230;This sounds like ordinary machine learning, and for a while you can pretend it is. But robotics introduces a third axis that classic ML never had to respect: inference time&#8230;</p></li></ul><ul><li><p><strong><a href="https://maxhalford.github.io/blog/solution-engineering-advice/">My unvarnished guide to solution engineering</a></strong><br>Nowadays I feel more or less comfortable interacting with customers. But I was awful at first. I know because one of the cofounders gave me harsh feedback after a call with our first serious customer. I still remember slamming the lid of my computer when we debriefed. What I perceived as harsh feedback at the time turned out to help me grow quickly&#8230;I used to be a regular data scientist assigned to internal projects. Talking to prospects and customers got me out of my comfort zone. You owe them a service, and they expect you to deliver something. If something goes wrong they&#8217;ll go above your head to your founders, at which point you start feeling the heat. It can be quite harsh. But it can also be rewarding when things go well&#8230;</p><p></p></li><li><p><strong><a href="https://myzopotamia.dev/navier-stokes-fluid-simulation-explained-with-godot">Navier-Stokes fluid simulation explained with Godot game engine</a></strong><br>Let me start with the mathematical description of what we will do in this blog post. This description might sound daunting, but don&#8217;t worry - we&#8217;ll explain everything as we go. Here goes: we will simulate fluid flow by moving a scalar density field through a vector velocity field. We&#8217;ll simulate velocity diffusion and advection as well as density diffusion and advection. Then we will add velocity projection with the goal of making the fluid obey the law of mass conservation - which will happen by balancing divergence with a pressure field. We will use bilinear interpolation and Gauss-Seidel relaxation for approximating values where needed&#8230;</p></li></ul><div><hr></div><h1><strong>What&#8217;s on your mind</strong></h1><h2>This Week&#8217;s Poll:</h2><div class="poll-embed" data-attrs="{&quot;id&quot;:572144}" data-component-name="PollToDOM"></div><p></p><p>.</p><h2>Last Week&#8217;s Poll:</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!FVg8!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a27a4d4-65ab-4318-8de5-ec2de8e962f7_1144x706.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!FVg8!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a27a4d4-65ab-4318-8de5-ec2de8e962f7_1144x706.png 424w, https://substackcdn.com/image/fetch/$s_!FVg8!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a27a4d4-65ab-4318-8de5-ec2de8e962f7_1144x706.png 848w, https://substackcdn.com/image/fetch/$s_!FVg8!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a27a4d4-65ab-4318-8de5-ec2de8e962f7_1144x706.png 1272w, https://substackcdn.com/image/fetch/$s_!FVg8!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a27a4d4-65ab-4318-8de5-ec2de8e962f7_1144x706.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!FVg8!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a27a4d4-65ab-4318-8de5-ec2de8e962f7_1144x706.png" width="596" height="367.8111888111888" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/1a27a4d4-65ab-4318-8de5-ec2de8e962f7_1144x706.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:706,&quot;width&quot;:1144,&quot;resizeWidth&quot;:596,&quot;bytes&quot;:69118,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://datascienceweekly.substack.com/i/201616122?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a27a4d4-65ab-4318-8de5-ec2de8e962f7_1144x706.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!FVg8!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a27a4d4-65ab-4318-8de5-ec2de8e962f7_1144x706.png 424w, https://substackcdn.com/image/fetch/$s_!FVg8!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a27a4d4-65ab-4318-8de5-ec2de8e962f7_1144x706.png 848w, https://substackcdn.com/image/fetch/$s_!FVg8!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a27a4d4-65ab-4318-8de5-ec2de8e962f7_1144x706.png 1272w, https://substackcdn.com/image/fetch/$s_!FVg8!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a27a4d4-65ab-4318-8de5-ec2de8e962f7_1144x706.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>.</p><div><hr></div><h2>Data Science Articles &amp; Videos</h2><p></p><ul><li><p><strong><a href="https://liangchang.substack.com/p/the-anti-scaling-law-in-biology-and">The Anti-Scaling Law in Biology, and Why AI Could Make Crowding Worse Before Making Drug Development Better</a></strong><br>One of the main reasons for the tech community&#8217;s optimism is the scaling-law. Once you demonstrated 0-1, you can do 1-100 much quicker. The internet, social media, and so on&#8230;In biology and drug development, I think there is a mirror image, the anti-scaling law. Because of that, here&#8217;s my contrarian view: AI could make crowding in drug development worse, before making it better. And that&#8217;s my perspective as a genuine believer in the transformative power of AI, and an AI practitioner who used $14,000 worths of AI tokens in the past 2 months&#8230;<br></p></li><li><p><strong><a href="https://www.reddit.com/r/statistics/comments/1u1xnl1/what_is_there_besides_frequentist_and_bayesian/">What is there besides Frequentist and Bayesian stats? [Reddit]</a></strong></p><p>I am wondering whether there are lesser known statistical paradigms. like most people, I was first acquainted with the Frequentist framework, and later got introduced to Bayesian stats. I really like the way this made me reconsider some of what I thought were basic assumptions, so now I&#8217;m wondering what the next thing could be? Are there any other branches/frameworks which are not as well known?&#8230;</p><p></p></li><li><p><strong><a href="https://otexts.com/fpppy/">Forecasting: Principles and Practice, the Pythonic Way</a><br></strong>This textbook is based on Forecasting: Principles and Practice (3rd ed) and is intended to provide a comprehensive introduction to forecasting methods and to present just enough information about each method for readers to be able to use them sensibly. We don&#8217;t attempt to give a thorough discussion of the theoretical details behind each method, although the references at the end of each chapter will hopefully fill in many of those details&#8230;<br></p></li><li><p><strong><a href="https://medium.com/@VictorBanev/the-simplest-learning-machine-pt-2-e735367f546">The Simplest Learning Machine, Pt.2</a><br></strong>In the previous article I outlined the concept of the Simplest Learning Machine. It&#8217;s an imaginary algorithm that uses one byte of persistent memory and learns to predict something about a stream of binary events&#8230;Can we actually write something like that? How would it work?&#8230;One semi-obvious thing we can learn is the rate of positive events in the stream. This would give us some predictive power, as long as that rate is different from 50%. A bit of a stretch to call this &#8220;machine learning&#8221;, sure, but I&#8217;ll get to the questions of usefulness later&#8230;<br></p></li><li><p><strong><a href="https://research.dimensioncap.com/p/on-training-data-for-bio-ai-models">On Training Data for Bio AI Models</a></strong></p><p>As we advance biological foundation models, which lessons from LLM data curation transfer, and which need rethinking?&#8230;<br></p></li><li><p><strong><a href="https://ropensci.org/blog/2026/06/01/goodpractice/">Our goodpractice Package Has New Superpowers</a></strong><br>The goodpractice package has been recommended by rOpenSci since it was first started just over 10 years ago by G&#225;bor Cs&#225;rdi. We used to ask our editors to manually run goodpractice on all packages submitted to software peer-review, and then to ask authors to fix any notable issues flagged by the package&#8230;We&#8217;re really pleased to share that we&#8217;ve recently rolled out a host of updates and extensions to the package. These make it both easier to use, and more powerful&#8230;I think that is the aspect that I found most surprising: That the use of Claude made our collaboration feel less technical, and therefore somehow even more human. And that gave us the ability to work though 70 pull requests representing over 100 new checks, all ready for everybody to use&#8230;<code><br></code></p></li><li><p><strong><a href="https://rwarehouse.netlify.app/">The Warehouse</a><br>The Problem</strong></p><p>With over 23,000 packages on CRAN alone, finding the right package for your task is overwhelming:</p><ul><li><p>Searching by keywords often misses relevant packages</p></li><li><p>No easy way to compare similar packages</p></li><li><p>Quality indicators are scattered or missing</p></li><li><p>GitHub-only packages are hard to discover</p></li></ul><p></p><p><strong>The Warehouse Solution provides:</strong></p><ul><li><p><strong>Function-first search</strong>: &#8220;estimate serial interval&#8221; &#8594; find all relevant packages</p></li><li><p><strong>Quality scores</strong>: Automated assessment of tests, documentation, and maintenance</p></li><li><p><strong>All sources</strong>: CRAN, GitHub, Bioconductor in one place</p></li><li><p><strong>Community reviews</strong>: Real user experiences and recommendations</p></li><li><p><strong>Smart categorization</strong>: Browse by what packages actually do&#8230;<br></p></li></ul></li><li><p><strong><a href="https://cvg.ethz.ch/lectures/Robot-Learning/">Robot Learning: From Fundamentals to Foundation Models</a><br></strong>This course provides a comprehensive introduction to modern robot learning, combining classical techniques with the latest advances in large-scale models: Students will start by learning the fundamentals of imitation learning, reinforcement learning, and policy optimization, and gradually progress to advanced topics including Vision-Language-Action (VLA) models and foundation models for robotics The objectives of this course are:</p><ul><li><p>Understand the core principles of imitation learning, reinforcement learning, and policy learning.</p></li><li><p>Implement basic robot learning systems in simulation and on real robots.</p></li><li><p>Explore state-of-the-art Vision-Language Action and foundation models for robotics.</p></li><li><p>Design and evaluate scalable robot learning pipelines integrating perception, control, and multi-modal reasoning&#8230;<br></p></li></ul></li><li><p><strong><a href="https://silviasapora.github.io/blog/ml-interviews.html">ML Job Interviews: The Ultimate Guide</a></strong></p><p>How I found a Research Scientist role after a PhD in Machine Learning&#8230;My process was, overall, successful: I received offers from every company I completed interviews with including: DeepMind (which I accepted), Isomorphic Labs, Cohere, Meta, and a startup in stealth. A few caveats to the first claim: Anthropic, Mistral, and TeslaAI got back to me too late and I didn&#8217;t complete those processes. ReflectionAI, the one genuine rejection: they didn&#8217;t like me for the RS role but switched me to their Engineering track instead&#8230;<br></p></li><li><p><strong><a href="https://github.com/lucasduthu/stata-mpl">stata-mpl - Give your matplotlib and seaborn charts the Stata 19 look</a></strong><br>Give your matplotlib and seaborn charts the look of Stata 19 (the stcolor scheme, Stata&#8217;s colorblind-friendly default). Calibrated against the official SVG files exported by Stata 18/19&#8230;<br></p></li><li><p><strong><a href="https://theodore.net/projects/AvianVisitors/">Avian Visitors</a></strong></p><p>I mounted a tiny microphone on my apartment balcony to listen for any birds passing by and built a site to collage them as they&#8217;re heard&#8230;so I&#8217;ve thrown together this short writeup for any of you who want to monitor any avian visitors that may be passing by your own place. It&#8217;s short and sweet for now in an attempt to get something out quickly, but this work is part of a longer chain of bird-tangent projects i&#8217;ll write something up about soon!&#8230;<br></p></li><li><p><strong><a href="https://news.ycombinator.com/item?id=48449187">Ask HN: What are tools you have made for yourself since the advent of AI?</a><br></strong>Ask HN: What are tools you have made for yourself since the advent of AI?&#8230;<br></p></li><li><p><strong><a href="https://www.bayesianspectacles.org/why-academics-should-use-ai-for-writing-a-case-study/">Why Academics Should Use AI for Writing: A Case Study</a><br></strong>I violently dislike the idea of AI taking over my writing. My writing is my own, and having it done by AI makes the final product lose its soul. Also, whenever I have used AI to write several paragraphs independently (which I admit to doing for bureaucratic tasks) I ended up rewriting most of it anyway. However, over the past year or so I have become increasingly impressed with what AI can do, and rather than talk about this in abstract terms I would like to present you with a concrete demonstration that shifted my opinion a great deal&#8230;</p></li></ul><p>.</p><div><hr></div><h2>Last Week's Newsletter's 3 Most Clicked Links</h2><ul><li><p><strong><a href="https://practicaldatacommunity.substack.com/p/how-to-build-a-simple-bulletproof">How to Build a Simple, Bulletproof Data Pipeline</a></strong></p></li><li><p><strong><a href="https://github.com/mljar/supertree">supertree - Interactive Decision Tree Visualization</a></strong></p></li><li><p><strong><a href="https://www.kaelio.com/blog/building-a-context-layer-for-the-agentic-era">Beyond the Semantic Layer: Building a Context Layer for the Agentic Era</a></strong></p></li></ul><p>.<br>* Based on unique clicks.<br>** Please take a look at last week's issue #654 <a href="https://datascienceweekly.substack.com/p/data-science-weekly-issue-654">here</a>.</p><div><hr></div><h2>Cutting Room Floor</h2><ul><li><p><strong><a href="https://statswithcats.net/2026/06/06/discover-stats-with-kittens-and-stats-with-cats/">When is detecting AI-generated text worthwhile?</a></strong></p></li><li><p><strong><a href="https://curlewis.co.nz/posts/lines-of-code-got-a-better-publicist/">Lines of Code Got a Better Publicist</a></strong></p></li><li><p><strong><a href="https://www.jstatsoft.org/article/view/v116i03">BayesMultiMode: Bayesian Mode Inference in R</a></strong></p></li><li><p><strong><a href="https://academic.oup.com/qje/article/140/2/943/7925870">Cognitive Endurance as Human Capital</a></strong></p></li><li><p><strong><a href="https://pub.sakana.ai/diffusionblocks/">DiffusionBlocks: Training Neural Networks One Block at a Time</a></strong></p></li><li><p><strong><a href="https://old.reddit.com/r/piano/comments/1u0lyhe/data_from_66000_practice_sessions_how_much_does/">Data from 66,000+ practice sessions. How much does the typical musician actually practice? [Reddit]</a></strong></p></li><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1txc9vv/what_is_the_most_common_reason_data_science/?utm_source=share&amp;utm_medium=mweb3x&amp;utm_name=mweb3xcss&amp;utm_term=1&amp;utm_content=share_button">What is the most common reason data science projects fail to deliver business value? [Reddit]</a></strong></p></li></ul><p>.</p><div><hr></div><h2><strong>Whenever you're ready, 3 ways we can help:</strong><br></h2><ol><li><p><strong>Go deeper each week (paid subscription)</strong><br>Get 3 additional posts per week designed to help you:</p><ul><li><p>Statistics &#8594; understand the math behind ML</p></li><li><p>AI Agents &#8594; build with modern AI tools</p></li><li><p>Career &#8594; become more valuable at your job</p></li></ul><p><strong>&#128073; <a href="https://datascienceweekly.substack.com/subscribe">Upgrade for $10/month &#8212; cancel anytime</a><br></strong></p></li><li><p><strong>Looking to get a job?</strong><br>A practical guide to landing your first (or next) data science role, based on thousands of reader questions.<br><strong>&#128073; <a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">Check out our </a></strong><em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">&#8220;Get A Data Science Job&#8221;</a></strong></em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide"> Course</a></strong><br></p></li><li><p><strong>Promote your organization/project/event to ~68,500 subscribers<br></strong>Sponsor this newsletter and reach a highly engaged data science audience (30&#8211;35% open rate).<br><strong>&#128073; Reply to this email to learn more</strong></p></li></ol><div><hr></div><p>Thank you for joining us this week! :)</p><p>Stay Data Science-y!</p><p>All our best,<br>Hannah &amp; Sebastian</p><div><hr></div><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://datascienceweekly.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Data Science Weekly Newsletter is a reader-supported publication. To receive new posts and support our work, consider becoming a free or paid subscriber.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div>]]></content:encoded></item><item><title><![CDATA[Data Science Weekly - Issue 654]]></title><description><![CDATA[Curated news, articles and jobs related to Data Science, AI, & Machine Learning]]></description><link>https://datascienceweekly.substack.com/p/data-science-weekly-issue-654</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/data-science-weekly-issue-654</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Thu, 04 Jun 2026 13:02:35 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!rM6T!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87268243-9c0b-410e-802b-a4d529bbb84a_1148x700.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!byfl!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" width="319" height="253" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/17becea5-db12-4465-be92-858de78b9137_319x253.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:253,&quot;width&quot;:319,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;Data Science Weekly&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="Data Science Weekly" title="Data Science Weekly" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2><strong>Issue #654<br>June 04, 2026<br></strong></h2><div><hr></div><p>Hello!</p><p><strong>Once a week, we write this email to share the links we thought were worth sharing in the Data Science, ML, AI, Data Visualization, and ML/Data Engineering worlds.</strong></p><div><hr></div><p><em><strong>And now&#8230;let&#8217;s dive into some interesting links from this week.</strong></em></p><div><hr></div><h2><strong>Editor's Picks<br></strong></h2><ul><li><p><strong><a href="https://practicaldatacommunity.substack.com/p/how-to-build-a-simple-bulletproof">How to Build a Simple, Bulletproof Data Pipeline</a><br></strong>In most organizations, a lot of value can be delivered with a setup that avoids high costs and unnecessary complexity. The most common scenario is not real-time streaming or exotic architectures. It is daily extraction from one or more transactional systems backed by a relational database&#8230;In this article, I want to walk through a simple but realistic example and show how a few design decisions, even when they look basic, can make a meaningful difference in robustness, operability, and long-term maintainability&#8230;</p></li></ul><ul><li><p><strong><a href="https://ankitg.me/blog/2026/05/04/fuzzy_api.html">AI for Bio has a Fuzzy API problem</a></strong><br>&#8220;AI for bio&#8221; is getting hot again. Given the excitement in the current moment, I thought I&#8217;d share a bit about what actually makes biology uniquely hard as an application domain for machine learning. The reason is not simply that biology is complicated, though it obviously is. ML is good at many things that are complicated. The deeper reason is that drug discovery does not have the kind of clean feedback loops and clean interfaces that made modern ML so powerful elsewhere&#8230;</p><p></p></li><li><p><strong><a href="https://momentsingraphics.de/Siggraph2026.html">Gaussian Point Splatting</a></strong><br>We propose Gaussian point splatting, a stochastic method to render Gaussian splats that scales extremely well to scenes with many Gaussians. Our core idea is to sample pixel-sized, opaque points from the Gaussians and to splat them to a framebuffer using 64-bit atomics. Through parallel programming primitives, we achieve an even distribution of the workload across millions of threads&#8230;</p></li></ul><div><hr></div><h1><strong>What&#8217;s on your mind</strong></h1><h2>This Week&#8217;s Poll:</h2><div class="poll-embed" data-attrs="{&quot;id&quot;:529508}" data-component-name="PollToDOM"></div><p>.</p><h2>Last Week&#8217;s Poll:</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!rM6T!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87268243-9c0b-410e-802b-a4d529bbb84a_1148x700.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!rM6T!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87268243-9c0b-410e-802b-a4d529bbb84a_1148x700.png 424w, https://substackcdn.com/image/fetch/$s_!rM6T!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87268243-9c0b-410e-802b-a4d529bbb84a_1148x700.png 848w, https://substackcdn.com/image/fetch/$s_!rM6T!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87268243-9c0b-410e-802b-a4d529bbb84a_1148x700.png 1272w, https://substackcdn.com/image/fetch/$s_!rM6T!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87268243-9c0b-410e-802b-a4d529bbb84a_1148x700.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!rM6T!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87268243-9c0b-410e-802b-a4d529bbb84a_1148x700.png" width="1148" height="700" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/87268243-9c0b-410e-802b-a4d529bbb84a_1148x700.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:700,&quot;width&quot;:1148,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:65745,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://datascienceweekly.substack.com/i/200601401?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87268243-9c0b-410e-802b-a4d529bbb84a_1148x700.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!rM6T!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87268243-9c0b-410e-802b-a4d529bbb84a_1148x700.png 424w, https://substackcdn.com/image/fetch/$s_!rM6T!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87268243-9c0b-410e-802b-a4d529bbb84a_1148x700.png 848w, https://substackcdn.com/image/fetch/$s_!rM6T!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87268243-9c0b-410e-802b-a4d529bbb84a_1148x700.png 1272w, https://substackcdn.com/image/fetch/$s_!rM6T!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87268243-9c0b-410e-802b-a4d529bbb84a_1148x700.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>.</p><div><hr></div><h2>Data Science Articles &amp; Videos</h2><p></p><ul><li><p><strong><a href="https://apps.london.gov.uk/state-of-london/">State of London Report, 2026</a></strong><br>The State of London report brings together an array of data about how London is performing across its economy, society and environment. Published annually by the GLA&#8217;s City Intelligence unit, it provides an up&#8209;to&#8209;date, data&#8209;led picture of life in the capital, drawing on a wide range of official and administrative sources. The report highlights trends and patterns and offers a shared evidence base to support debate and decision making&#8230;<br></p></li><li><p><strong><a href="https://www.reddit.com/r/rstats/comments/1tqi2e3/what_is_considered_basic_r/">What is considered basic R? [Reddit]</a></strong></p><p>I have a job interview coming up and they want someone who knows basic R, I think I do have it, but what is your opinion on what it entails?&#8230;</p><p></p></li><li><p><strong><a href="https://humynlabs.ai/bridge">BRIDGE (Benchmark of Regional &amp; International Data for Global Evaluation) is the first independent Global South ASR benchmark</a><br></strong>BRIDGE (Benchmark of Regional &amp; International Data for Global Evaluation) is the first independent Global South ASR benchmark evaluating 15 global models across 22 languages on a first-of-its-kind 7 metric stack&#8230;<br></p></li><li><p><strong><a href="https://github.com/mljar/supertree">supertree - Interactive Decision Tree Visualization</a><br></strong><code>supertree</code> is a Python package designed to visualize decision trees in an interactive and user-friendly way within Jupyter Notebooks, Jupyter Lab, Google Colab, and any other notebooks that support HTML rendering. With this tool, you can not only display decision trees, but also interact with them directly within your notebook environment. Key features include:</p><ul><li><p>ability to zoom and pan through large trees,</p></li><li><p>collapse and expand selected nodes,</p></li><li><p>explore the structure of the tree in an intuitive and visually appealing manner&#8230;<br></p></li></ul></li><li><p><strong><a href="https://arxiv.org/abs/2606.02113">A Primer in Post-Training Reasoning Data: What We Know About How It Works</a></strong></p><p>Work on post-training reasoning data has grown rapidly, yet this literature remains scattered across dataset papers, reinforcement-learning recipes, reward-model studies, benchmarks, and frontier system reports. This paper is the first primer to synthesize over 150 key public studies and system reports on post-training reasoning data. We organize the field around four questions: what data objects exist, what makes them useful, how they are constructed, and how they scale. Together, this organization provides an attribution framework for future reasoning-data releases and post-training recipes&#8230;<br></p></li><li><p><strong><a href="https://christopherkrapu.com/blog/2026/dont-know-where-your-data-is-from/">Don&#8217;t know where your data is from? Bayesian modeling for unknown coordinates</a></strong><br>An especially strong motivating case for the usage of spatial probability models comes from the mining industry. During exploration for mineral resources, prospectors will take geologic samples by drilling holes and examining the resulting material for presence or concentration of valuable ores. These data typically show strong spatial correlation, but constructing a fully-detailed geophysical model is at times infeasible as we are able to observe very little of the underground conditions, though the advent of remote sensing techniques like ground-penetrating radar and gravimetry has dramatically improved our ability to characterize Earth&#8217;s subsurface. To address this challenge, we would like to construct a probability model which uses nearby data to predict a variable of interest at a new location&#8230;<code><br></code></p></li><li><p><strong><a href="https://blog.andymasley.com/p/why-i-think-panic-about-local-impacts?hide_intro_popup=true">Why I think panic about local impacts of data centers is just a panic</a><br></strong>In the last year of following increased local resistance to data centers being built, I&#8217;ve listened to lots of recorded testimony at town halls, read through countless comments and articles where people argue for why data centers are so uniquely evil and shut down anyone defending them as shills for AI companies&#8230;whenever I look into where people are actually getting their ideas about the hundreds of other data centers being built, the source always leads back to some confused misreading of local reporting, a wild calculation error, a bad game of telephone, or a wildly misleading article&#8230;<br></p></li><li><p><strong><a href="https://www.kaelio.com/blog/building-a-context-layer-for-the-agentic-era">Beyond the Semantic Layer: Building a Context Layer for the Agentic Era</a><br></strong>A context layer puts your warehouse schema, joins, metric definitions, and business knowledge in one reviewable place so data agents query governed context instead of guessing field names. A look at how it works, and at ktx, the open-source context layer&#8230;<br></p></li><li><p><strong><a href="https://lospino.so/statistics/jensen-shannon-divergence/">Jensen-Shannon Divergence</a></strong></p><p>How different are two discrete or binned probability distributions on the same support?&#8230;<br></p></li><li><p><strong><a href="https://www.mikeash.com/pyblog/fluid-simulation-for-dummies.html">Fluid Simulation for Dummies</a></strong><br>I wrote my Master&#8217;s thesis on high-performance real-time 3D fluid simulation and volumetric rendering. The basics of the fluid simulation that I used are straightforward, but I had a very difficult time understanding it. The available reference materials were all very good, but they were a bit too physics-y and math-y for me. Unable to find something geared towards somebody of my mindset, I&#8217;d like to write the page I wish I&#8217;d had a year ago. With that goal in mind, I&#8217;m going to show you how to do simple 3D fluid simulation, step-by-step, with as much emphasis on the actual programming as possible&#8230;.<br></p></li><li><p><strong><a href="https://www.sei.cmu.edu/blog/a-hitchhikers-guide-to-ml-training-infrastructure/">A Hitchhiker&#8217;s Guide to ML Training Infrastructure</a></strong></p><p>Hardware has made a huge impact on the field of machine learning (ML). Many of the ideas we use today were published decades ago, but the cost to run them and the data necessary were too expensive, making them impractical. Recent advances, including the introduction of graphics processing units (GPUs), are making some of those ideas a reality. In this post we&#8217;ll look at some of the hardware factors that impact training artificial intelligence (AI) systems, and we&#8217;ll walk through an example ML workflow&#8230;.<br></p></li><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1tqbfmq/weaponized_phrases_in_data_science_teams/">Weaponized phrases in Data science Teams [Reddit]</a><br></strong>&#8220;No free cycles&#8221; / &#8220;Empty plates&#8221;&#8230;&#8220;We need to focus on the low-hanging fruit&#8221;&#8230;"Be a go-getter, don't get stuck"&#8230;"Let's optimize our sprint velocity"&#8230;&#8220;You&#8217;re making this more complicated than it is&#8221;&#8230;"We need to relentlessly prioritize"&#8230;"I need you to own this initiative"&#8230;"Let's take this offline" / "Parking lot this"&#8230;"We need to leverage AI to unlock enterprise value"&#8230;"We're like a family here"&#8230;<br></p></li><li><p><strong><a href="https://taylorgeospatial.org/agricultural-field-boundaries-mapped-globally-for-the-first-time/">Agricultural Field Boundaries, Mapped Globally for the First Time</a><br></strong>For the first time, every agricultural field on Earth has a boundary on the map. Taylor Geospatial funded and co-developed this work with Microsoft AI for Good Lab because we believe GeoAI should work everywhere, not just in the data-rich regions where labeled training data is abundant. Today, it&#8217;s publicly available for everyone to benefit from&#8230;</p></li></ul><p>.</p><div><hr></div><h2>Last Week's Newsletter's 3 Most Clicked Links</h2><ul><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1tknjuv/what_ds_job_market_trends_are_you_seeing/">What DS job market trends are you seeing? [Reddit]</a></strong></p></li><li><p><strong><a href="https://aiweekender.substack.com/p/6-llm-prompting-techniques-for-data">6 LLM Prompting Techniques for Data Scientists and Engineers in 2026</a></strong></p></li><li><p><strong><a href="https://www.reddit.com/r/selfimprovement/comments/1tjef6k/i_am_faking_my_way_through_a_data_analyst_role/">I am faking my way through a Data Analyst role with AI, how do I actually learn before I get caught? [Reddit]</a></strong></p></li></ul><p>.<br>* Based on unique clicks.<br>** Please take a look at last week's issue #653 <a href="https://datascienceweekly.substack.com/p/data-science-weekly-issue-653">here</a>.</p><div><hr></div><h2>Cutting Room Floor</h2><ul><li><p><strong><a href="https://www.moderndescartes.com/essays/ai_and_expertise/">Expertise in the Age of AI</a></strong></p></li><li><p><strong><a href="https://vickiboykis.com/2026/05/28/we-should-be-more-tired-than-the-model/">We should be more tired than the model</a></strong></p></li><li><p><strong><a href="https://www.brethorsting.com/blog/2026/05/domain-expertise-has-always-been-the-real-moat/">Domain Expertise Has Always Been the Real Moat</a></strong></p></li><li><p><strong><a href="https://obeli.sk/blog/sqlite-is-all-you-need-for-durable-workflows/">SQLite is All You Need for Durable Workflows</a></strong></p></li><li><p><strong><a href="https://www.fharrell.com/talk/bguide/">Implications of the Draft FDA Bayesian Guidance</a></strong></p></li></ul><p>.</p><div><hr></div><h2><strong>Whenever you're ready, 3 ways we can help:</strong><br></h2><ol><li><p><strong>Go deeper each week (paid subscription)</strong><br>Get 3 additional posts per week designed to help you:</p><ul><li><p>Statistics &#8594; understand the math behind ML</p></li><li><p>AI Agents &#8594; build with modern AI tools</p></li><li><p>Career &#8594; become more valuable at your job</p></li></ul><p><strong>&#128073; <a href="https://datascienceweekly.substack.com/subscribe">Upgrade for $10/month &#8212; cancel anytime</a><br></strong></p></li><li><p><strong>Looking to get a job?</strong><br>A practical guide to landing your first (or next) data science role, based on thousands of reader questions.<br><strong>&#128073; <a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">Check out our </a></strong><em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">&#8220;Get A Data Science Job&#8221;</a></strong></em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide"> Course</a></strong><br></p></li><li><p><strong>Promote your organization/project/event to ~68,500 subscribers<br></strong>Sponsor this newsletter and reach a highly engaged data science audience (30&#8211;35% open rate).<br><strong>&#128073; Reply to this email to learn more</strong></p></li></ol><div><hr></div><p>Thank you for joining us this week! :)</p><p>Stay Data Science-y!</p><p>All our best,<br>Hannah &amp; Sebastian</p><div><hr></div><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://datascienceweekly.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Data Science Weekly Newsletter is a reader-supported publication. To receive new posts and support our work, consider becoming a free or paid subscriber.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div>]]></content:encoded></item><item><title><![CDATA[Data Science Weekly - Issue 653]]></title><description><![CDATA[Curated news, articles and jobs related to Data Science, AI, & Machine Learning]]></description><link>https://datascienceweekly.substack.com/p/data-science-weekly-issue-653</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/data-science-weekly-issue-653</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Thu, 28 May 2026 19:41:05 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!aks6!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b83afc3-9536-455b-9f00-9275c0f64179_575x352.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!byfl!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" width="319" height="253" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/17becea5-db12-4465-be92-858de78b9137_319x253.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:253,&quot;width&quot;:319,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;Data Science Weekly&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="Data Science Weekly" title="Data Science Weekly" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2><strong>Issue #653<br>May 28, 2026<br></strong></h2><div><hr></div><p>Hello!</p><p><strong>Once a week, we write this email to share the links we thought were worth sharing in the Data Science, ML, AI, Data Visualization, and ML/Data Engineering worlds.</strong></p><div><hr></div><p><em><strong>And now&#8230;let&#8217;s dive into some interesting links from this week.</strong></em></p><div><hr></div><h2><strong>Editor's Picks<br></strong></h2><ul><li><p><strong><a href="https://fedemagnani.github.io/math/2026/04/08/the-quadratic-sandwich.html">The quadratic sandwich</a><br></strong>If you have ever tried to minimize a function with gradient descent, you probably noticed that some functions are a joy to optimize and others are a nightmare. The difference often boils down to two properties: strong convexity and L-smoothness. These two concepts define a &#8220;sandwich&#8221; of quadratic bounds around your function that tells you exactly how well-behaved it is. If the sandwich is tight, life is good. If one slice of bread is missing, things get ugly fast&#8230;In this post we&#8217;ll build up both concepts from scratch, see how they combine into the quadratic sandwich, understand what happens at the level of the Hessian&#8217;s eigenvalues, and pick up a neat trick to verify L-smoothness without ever computing an eigenvalue&#8230;</p></li></ul><ul><li><p><strong><a href="https://gudok.xyz/transpose/">What it takes to transpose a matrix</a></strong><br>In this article we are going to gradually build a sequence of progressively more efficient implementations of matrix transpose, with the most sophisticated implementation being up to x25 times faster than the naive one. During each step we will locate the bottleneck, figure out what has caused it, and think of a solution to overcome it. This article is intended to serve as an introduction to optimizing matrix algorithms for x86_64, presented from the perspective of a real-world problem&#8230;</p><p></p></li><li><p><strong><a href="https://www.johndcook.com/blog/2017/11/08/why-is-kullback-leibler-divergence-not-a-distance/">Why is Kullback-Leibler divergence not a distance?</a></strong><br>The Kullback-Leibler divergence between two probability distributions is a measure of how different the two distributions are. It is sometimes called a distance, but it&#8217;s not a distance in the usual sense because it&#8217;s not symmetric. At first this asymmetry may seem like a bug, but it&#8217;s a feature. We&#8217;ll explain why it&#8217;s useful to measure the difference between two probability distributions in an asymmetric way. The Kullback-Leibler divergence between two random variables X and Y is defined as&#8230;</p></li></ul><div><hr></div><h1><strong>What&#8217;s on your mind</strong></h1><h2>This Week&#8217;s Poll:</h2><div class="poll-embed" data-attrs="{&quot;id&quot;:520345}" data-component-name="PollToDOM"></div><p>.</p><h2>Last Week&#8217;s Poll:</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!aks6!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b83afc3-9536-455b-9f00-9275c0f64179_575x352.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!aks6!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b83afc3-9536-455b-9f00-9275c0f64179_575x352.png 424w, https://substackcdn.com/image/fetch/$s_!aks6!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b83afc3-9536-455b-9f00-9275c0f64179_575x352.png 848w, https://substackcdn.com/image/fetch/$s_!aks6!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b83afc3-9536-455b-9f00-9275c0f64179_575x352.png 1272w, https://substackcdn.com/image/fetch/$s_!aks6!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b83afc3-9536-455b-9f00-9275c0f64179_575x352.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!aks6!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b83afc3-9536-455b-9f00-9275c0f64179_575x352.png" width="575" height="352" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/2b83afc3-9536-455b-9f00-9275c0f64179_575x352.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:352,&quot;width&quot;:575,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:26143,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://datascienceweekly.substack.com/i/199621460?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b83afc3-9536-455b-9f00-9275c0f64179_575x352.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!aks6!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b83afc3-9536-455b-9f00-9275c0f64179_575x352.png 424w, https://substackcdn.com/image/fetch/$s_!aks6!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b83afc3-9536-455b-9f00-9275c0f64179_575x352.png 848w, https://substackcdn.com/image/fetch/$s_!aks6!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b83afc3-9536-455b-9f00-9275c0f64179_575x352.png 1272w, https://substackcdn.com/image/fetch/$s_!aks6!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b83afc3-9536-455b-9f00-9275c0f64179_575x352.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>.</p><div><hr></div><h2>Data Science Articles &amp; Videos</h2><p></p><ul><li><p><strong><a href="https://golfcoursewiki.substack.com/p/friday-pins-vs-sunday-pins-or-how">Friday Pins vs Sunday Pins or: How to Illustrate Something Completely Obvious</a></strong><br>In my previous article, I Spent the Last Month and a Half Building a Model that Visualizes Strategic Golf, I laid out the very basics of the golf model I built, the underlying reason that compelled me to work on it, and novel maps it could create. However, I barely scratched the surface of what this model can illustrate about golf course architecture. Here, I want to talk about how we can specifically look at one kind of dynamic architectural interest. That is, features of golf architecture that appear as we change the course setup. Specifically, I want to look at how different hole locations change the architectural interest for players, how we can show that, and what it looks like&#8230;<br></p></li><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1tknjuv/what_ds_job_market_trends_are_you_seeing/">What DS job market trends are you seeing? [Reddit]</a></strong></p><p>I have 20 YOE, but I do a generic &#8220;data science&#8221; search on LinkedIn every 3 months to see how the job market is trending. Here are my latest observations. I would love to hear what others think.</p><ol><li><p>The number of AI postings is going down. ML and DE skills are back in fashion.</p></li><li><p>Salaries are down across the board.</p></li><li><p>Non-technical responsibility is up. I see &#8220;Data Scientist&#8221; roles being asked to create a roadmap and drive organizational change. That used to be the responsibility of the manager or maybe the lead.</p></li></ol><p>I haven&#8217;t applied for any of these jobs, so I don&#8217;t know what&#8217;s actually real. I wonder if Data Science is no longer the hot keyword and I should be searching for something else&#8230;</p><p></p></li><li><p><strong><a href="https://www.fharrell.com/talk/ai/">Thoughts About the Roles of AI for Statistics</a><br></strong>This talk covers what I&#8217;ve learned from using large language models in my work for the past two years. For statistical programming, success has come when I play the role of specification writer and comprehensive tester. For statistical methodology, AI has been successful serving me as a mathematical statistical assistant and a critic. Instead of avoiding AI we should embrace it, but we should always set a higher bar for the quality of our work as a result&#8230;<br></p></li><li><p><strong><a href="https://stats.stackexchange.com/questions/676087/evaluating-detection-classifier-algorithm-accuracy">Evaluating detection &amp; classifier algorithm accuracy</a><br></strong>Let&#8217;s say i have images with a mixture of normal cells and sick cells on each image. Humans can reliably distinguish normal cells from sick cells, however it takes a lot of time to mark up the images as there are hundreds of cells in one field of view. I have an algorithm that can also distinguish normal and sick cells. The outputs from both manual markup and my algorithm is 2 lists of (x, y) coordinates -- one list for sick cells, one for healthy. What are the best practices for comparing and reporting the accuracy of my algorithm against manual markup?&#8230;<br></p></li><li><p><strong><a href="https://www.statsignificant.com/p/do-most-tv-shows-stick-the-landing">Do Most TV Shows Stick the Landing?</a></strong></p><p>Four decades later, television has changed dramatically, reshaped by streaming and a clearer understanding of what makes for a satisfying conclusion. But has this institutional knowledge led to better endings? Have showrunners learned from the mistakes of St. Elsewhere, Game of Thrones, and other finale fiascos? So today, we&#8217;ll investigate whether omniscient showrunner Tommy Westphall has gotten any better at sticking the landing, how finale quality has changed in recent decades, and whether finality is simply a structural weakness of television itself&#8230;<br></p></li><li><p><strong><a href="https://redwallanalytics.com/posts/2023-02-22-nyed-data-explorer-shows-15-years-of-charter-school-success/">NYED Data Explorer Shows 15 Years of Charter School Success</a></strong><br>When I discovered 15 years of NYED assessment data, the interest to clean and free this data for others to discover in a Shiny app, was immediate. The opportunity to also feature Classical&#8217;s stand-out performance didn&#8217;t hurt my motivation, although this post and the app were built in my spare time, and do not represent the opinions of South Bronx Classical Charter Schools. Unlike many past Redwall posts, this one will not have code, and will be primarily to explain the data and show how to use the app&#8230;<code><br></code></p></li><li><p><strong><a href="https://statmodeling.stat.columbia.edu/2014/08/14/luck-vs-skill-poker/">Luck vs. skill in poker</a><br></strong>The thread of our recent discussion of quantifying luck vs. skill in sports turned to poker, motivating the present post&#8230;Can good poker players really &#8220;read&#8221; my cards and figure out what&#8217;s in my hand?&#8230;<br></p></li><li><p><strong><a href="https://remlapmot.github.io/post/2026/stan-compile-speedup/">Speeding up Stan model builds for R package developers</a><br></strong>My PhD student was interested in Bayesian methods and we put together an R package which included some Stan models. I was always frustrated by how slowly these compiled on our Windows machines&#8230;A few years later, when I got a MacBook Air I was shocked how much faster they compiled. On my Windows machine our mrbayes package takes 3 minutes 55 seconds to compile and install. On my M4 MacBook Air it takes 1 minute 16 seconds. The following tips show how to improve those timings&#8230;<br></p></li><li><p><strong><a href="https://ankitg.me/blog/2025/01/06/unfair-coins.html">How unfair is the coin?</a></strong></p><p>In February 2024, Reverie Labs, the startup I co-founded in 2017, was acquired by Ginkgo Bioworks. I&#8217;m now on leave from Ginkgo and I&#8217;ve joined Y Combinator as a Visiting Partner, giving me the chance to work with the next generation of companies. Especially in this new role, I&#8217;ve been thinking a bit about what worked, what didn&#8217;t work, and what lessons I can take forward&#8230;We had quite the journey &#8211; 6+ years of building at the intersection of AI and drug discovery. We began as a machine learning driven software company selling SaaS tools and consulting services to pharma companies, and at acquisition we were a pharmaceutical company, developing our own in-house pipeline of drug assets and advancing them rapidly using our machine learning technology&#8230;<br></p></li><li><p><strong><a href="https://jcarroll.com.au/2026/05/22/functions-over-idioms-rfuns/">Functions over Idioms - Writing R in Python with rfuns</a></strong><br>Sometimes a problem calls for a particular language to be used, and with that comes adjusting one&#8217;s brain to thinking in that language and using the appropriate idioms to leverage that language&#8217;s features&#8230;But what if I don&#8217;t want to?&#8230;The line between R and Python has been heavily blurred the last few years, particularly with {reticulate} (rstudio.github.io) enabling us to use Python within R code, RStudio rebranding as Posit (posit.co) and taking on a strong Python development effort, releasing Positron (posit.co) as a multi-language IDE, and Quarto (quarto.org) being a multi-language rethink of Rmarkdown&#8230;<br></p></li><li><p><strong><a href="https://aiweekender.substack.com/p/6-llm-prompting-techniques-for-data">LLM Prompting Techniques for Data Scientists and Engineers in 2026</a></strong></p><p>Six techniques matched to six failure modes, including inconsistent output formats, shallow reasoning, instruction drift, and more&#8230;<br></p></li><li><p><strong><a href="https://www.reddit.com/r/selfimprovement/comments/1tjef6k/i_am_faking_my_way_through_a_data_analyst_role/">I am faking my way through a Data Analyst role with AI, how do I actually learn before I get caught? [Reddit]</a><br></strong>I graduated with a CS degree, but I spent my undergrad years grinding part-time jobs instead of actually studying. Now I am a Data Analyst at a small business, and the job is nothing like the theory I slept through in school. I am just winging it every day tbh. I rely heavily on openclaw for data scraping and acciowork to handle the processing and archiving. If these AI tools ever went down, I would be fired within an hour. I am terrified of being exposed as a fraud. Where do I even start fixing this? Should I grind python, or is mastering excel still the first step for survival?&#8230;<br></p></li><li><p><strong><a href="https://www.dougmacdowell.com/50-hours-to-draw-some-lines.html">50 Hours to Draw Some Lines</a><br></strong>"What are you working on these days?"<br>"Data visualizations." I told him.<br>"Ah, you using algorithms, machine learning, cloud computing, things like that?"<br>"No." I said. "I'm just trying to draw a line graph."&#8230;.What do I mean by drawing data by hand? I made this data visualization (data viz) about a coffee maker computer by hand, using rulers, pencils, ink, and a lettering kit. Along with my flubs, flukes, and acclimation with tools - it took me 50 hours to make. It&#8217;s statistically accurate, carefully crafted, and like Hackaday said &#8220;right out of a 1970&#8217;s college textbook&#8221;. It&#8217;s how professionals might visualize data before computers could do it for them&#8230;.</p></li></ul><p>.</p><div><hr></div><h2>Last Week's Newsletter's 3 Most Clicked Links</h2><ul><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1th87u4/are_there_any_small_quick_things_i_can_do/">Are there any small, quick things I can do everyday to keep my skills sharp? [Reddit]</a></strong></p></li><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1tjbn57/after_5_years_in_data_science_im_starting_to/">After 5 years in data science, I&#8217;m starting to realize most &#8220;insights&#8221; we deliver are completely ignored. Is this normal? [Reddit]</a></strong></p></li><li><p><strong><a href="https://datascienceconfidential.github.io/r/predictive-models/2026/05/14/is-logistic-regression-regression.html">Is logistic regression regression?</a></strong></p></li></ul><p>.<br>* Based on unique clicks.<br>** Please take a look at last week's issue #652 <a href="https://datascienceweekly.substack.com/p/data-science-weekly-issue-652">here</a>.</p><div><hr></div><h2>Cutting Room Floor</h2><ul><li><p><strong><a href="https://sabr.org/lahman-database/">Lahman Baseball Database, created by SABR member Sean Lahman, contains complete major league batting and pitching statistics back to 1871</a></strong></p></li><li><p><strong><a href="https://mlbfranchiseanalysis.netlify.app/">A Data-Driven Survey of MLB Franchise Management</a></strong></p></li><li><p><strong><a href="https://jakubsobolewski.com/blog/bdd-shiny-when/">Behavior-Driven Development in R Shiny: Modeling User Behavior with When Steps</a></strong></p></li><li><p><strong><a href="https://www.reddit.com/r/learnmath/comments/1t2mevm/i_dont_understand_standard_deviation/">I dont understand Standard Deviation [Reddit]</a></strong></p></li><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1tmfjlw/good_practices_in_data_scripts/">Good practices in data scripts [Reddit]</a></strong></p></li></ul><p>.</p><div><hr></div><h2><strong>Whenever you're ready, 3 ways we can help:</strong><br></h2><ol><li><p><strong>Go deeper each week (paid subscription)</strong><br>Get 3 additional posts per week designed to help you:</p><ul><li><p>Statistics &#8594; understand the math behind ML</p></li><li><p>AI Agents &#8594; build with modern AI tools</p></li><li><p>Career &#8594; become more valuable at your job</p></li></ul><p><strong>&#128073; <a href="https://datascienceweekly.substack.com/subscribe">Upgrade for $10/month &#8212; cancel anytime</a><br></strong></p></li><li><p><strong>Looking to get a job?</strong><br>A practical guide to landing your first (or next) data science role, based on thousands of reader questions.<br><strong>&#128073; <a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">Check out our </a></strong><em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">&#8220;Get A Data Science Job&#8221;</a></strong></em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide"> Course</a></strong><br></p></li><li><p><strong>Promote your organization/project/event to ~68,500 subscribers<br></strong>Sponsor this newsletter and reach a highly engaged data science audience (30&#8211;35% open rate).<br><strong>&#128073; Reply to this email to learn more</strong></p></li></ol><div><hr></div><p>Thank you for joining us this week! :)</p><p>Stay Data Science-y!</p><p>All our best,<br>Hannah &amp; Sebastian</p><div><hr></div><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://datascienceweekly.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Data Science Weekly Newsletter is a reader-supported publication. To receive new posts and support our work, consider becoming a free or paid subscriber.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div>]]></content:encoded></item><item><title><![CDATA[Who is going to save you?]]></title><description><![CDATA[On the importance of having a corporate sponsor and not putting all of your political eggs in one basket.]]></description><link>https://datascienceweekly.substack.com/p/who-is-going-to-save-you</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/who-is-going-to-save-you</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Fri, 22 May 2026 22:06:43 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1573164574048-f968d7ee9f20?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1573164574048-f968d7ee9f20?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1573164574048-f968d7ee9f20?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 424w, https://images.unsplash.com/photo-1573164574048-f968d7ee9f20?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 848w, https://images.unsplash.com/photo-1573164574048-f968d7ee9f20?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1272w, https://images.unsplash.com/photo-1573164574048-f968d7ee9f20?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1573164574048-f968d7ee9f20?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" width="3000" height="2003" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1573164574048-f968d7ee9f20?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:2003,&quot;width&quot;:3000,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;two women sits of padded chairs while using laptop computers&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="two women sits of padded chairs while using laptop computers" title="two women sits of padded chairs while using laptop computers" srcset="https://images.unsplash.com/photo-1573164574048-f968d7ee9f20?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 424w, https://images.unsplash.com/photo-1573164574048-f968d7ee9f20?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 848w, https://images.unsplash.com/photo-1573164574048-f968d7ee9f20?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1272w, https://images.unsplash.com/photo-1573164574048-f968d7ee9f20?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption"><em>Image Caption: <a href="https://unsplash.com/photos/two-women-sits-of-padded-chairs-while-using-laptop-computers-HocFQHhGjDE">Christina @ wocintechchat.com M</a></em></figcaption></figure></div>
      <p>
          <a href="https://datascienceweekly.substack.com/p/who-is-going-to-save-you">
              Read more
          </a>
      </p>
   ]]></content:encoded></item><item><title><![CDATA[Data Science Weekly - Issue 652]]></title><description><![CDATA[Curated news, articles and jobs related to Data Science, AI, & Machine Learning]]></description><link>https://datascienceweekly.substack.com/p/data-science-weekly-issue-652</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/data-science-weekly-issue-652</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Thu, 21 May 2026 22:52:26 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!I8ji!,w_256,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3294ef46-cb03-42ea-b7d6-9f8e8b0f41f6_253x253.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!byfl!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" width="319" height="253" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/17becea5-db12-4465-be92-858de78b9137_319x253.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:253,&quot;width&quot;:319,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;Data Science Weekly&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="Data Science Weekly" title="Data Science Weekly" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2><strong>Issue #652<br>May 21, 2026<br></strong></h2><div><hr></div><p>Hello!</p><p><strong>Once a week, we write this email to share the links we thought were worth sharing in the Data Science, ML, AI, Data Visualization, and ML/Data Engineering worlds.</strong></p><div><hr></div><p><em><strong>And now&#8230;let&#8217;s dive into some interesting links from this week.</strong></em></p><div><hr></div><h2><strong>Editor's Picks<br></strong></h2><ul><li><p><strong><a href="https://ccli.substack.com/p/whats-going-on-in-computational-neuroscience">What&#8217;s going on in computational neuroscience nowadays? (part 1)</a><br></strong>A month ago I came back from Cosyne, the annual Computational and Systems Neuroscience conference&#8230;The days are a haze of tutorials, talks, poster sessions, and workshops, usually appended by dinners and drinks past midnight&#8230;I seem to have a hard time writing one-off pieces, so I&#8217;m leaning into that and writing this as a series. I&#8217;ll only be able to write a very narrow perspective of Cosyne, of course, but most of the talks are on YouTube on the official channel if you want to see for yourself. (That also means this will be more personal thoughts than report)&#8230;</p></li></ul><ul><li><p><strong><a href="https://datascienceconfidential.github.io/r/predictive-models/2026/05/14/is-logistic-regression-regression.html">Is logistic regression regression?</a></strong><br>I came across a post recently by a machine learning engineer who made the bold claim that logistic regression is the worst name for an algorithm ever, or something along those lines&#8230;Many statisticians of the more old-school type seemed to disagree. This led me to think a bit more deeply about the subject. I&#8217;ve already written several posts on bad terminology in statistics (see confidence level, line of best fit, r squared) so I might have been expected to agree with the machine learning view, but in this case I agree with the statisticians, and I would like to explain why&#8230;</p><p></p></li><li><p><strong><a href="https://spawn-queue.acm.org/doi/pdf/10.1145/3778029">What Every Experimenter Must Know About Randomization</a></strong><br>Randomized controlled experiments offer gold-standard insight into cause and effect. The knowledge that informs our most important decisions. Unfortunately, randomization in such experiments is often botched. Randomization errors silently invalidate the interpretation of experimental results, turning a fruitful quest for knowledge into a waste of time and money, or, worse, a wellspring of misinformation. Fortunately, these fatal errors are easy to spot and fix. So whether you&#8217;re a webmaster using A/B testing to increase engagement, a medical researcher evaluating vaccines, a factory manager exploring productivity improvements, or a scientist seeking the laws that govern nature or human affairs, read on&#8230;</p></li></ul><div><hr></div><h1><strong>What&#8217;s on your mind</strong></h1><h2>This Week&#8217;s Poll:</h2><div class="poll-embed" data-attrs="{&quot;id&quot;:516379}" data-component-name="PollToDOM"></div><p>.</p><h2>Last Week&#8217;s Poll:</h2><p>.</p><div><hr></div><h2>Data Science Articles &amp; Videos</h2><p></p><ul><li><p><strong><a href="https://yihui.org/en/2026/05/testthat-to-testit/">Converting testthat Tests to testit</a></strong><br>Back in 2013, I wrote about testing R packages when I first released testit. Thirteen years later, I still believe that unit testing should be nothing more than &#8220;tell me if something unexpected happened.&#8221; Recently I converted a large testthat test suite to testit, and I thought I&#8217;d share a practical guide for anyone considering the same move&#8230;<br></p></li><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1tjbn57/after_5_years_in_data_science_im_starting_to/">After 5 years in data science, I&#8217;m starting to realize most &#8220;insights&#8221; we deliver are completely ignored. Is this normal? [Reddit]</a></strong></p><p>I&#8217;ve been in data science roles (both analytics and ML) for about 5 years now across a couple of companies. Lately I&#8217;ve been feeling a bit burned out because I keep seeing the same pattern&#8230;We spend weeks cleaning data, building dashboards, running statistical analysis, or training models&#8230; and then the stakeholders either:</p><ul><li><p>Say &#8220;thanks&#8221; and never use it</p></li><li><p>Cherry-pick the numbers that support their existing opinion</p></li><li><p>Or just completely ignore the findings and go with gut feel anyway</p></li></ul><p>The worst part is when leadership asks for a &#8220;data-driven decision&#8221; but they&#8217;ve already decided what they want to do&#8230;Am I alone in this? Or is this just the reality of data science in most companies?&#8230;</p><p></p></li><li><p><strong><a href="https://vickiboykis.com/2026/05/18/tagging-my-blog-posts-with-bertopic-and-llms/">Tagging my blog posts with BERTopic and LLMs</a><br></strong>I recently added tags to my blog using BERTopic and a mix of LLMs. You can see the tags in the sidebar to the right (or in the footer on mobile). I&#8217;ve done this before in 2023, with GGUF Mistral using llama-cpp, but never finished the project. Now, because the models have been getting so good, and my project was small, relatively well-defined, and easy to evaluate, the project took me about 6-10 hours over a month, using BERTopic, Claude Code, and Pi with Deepseek&#8230;<br></p></li><li><p><strong><a href="https://ericmjl.github.io/blog/2026/5/20/what-data-science-is-actually-about-in-the-age-of-ai/">What data science is actually about in the age of AI</a><br></strong>I reflect on the evolving role of data scientists in the age of AI and LLMs. I argue that our core mission remains rigorous measurement, not full-stack development. While AI tools make building easier, the real value comes from defining and evaluating what truly matters. I share why measurement should be led by those closest to the problem and how data scientists can best contribute. Are we losing sight of what makes data science essential in the rush to build with AI?&#8230;<br></p></li><li><p><strong><a href="https://emma-x1.github.io/writing/transformer-from-scratch">Transformer From Scratch</a></strong></p><p>I&#8217;ve wanted to dive deeper into the fundamentals of AI for a while now - it feels a little bit magical, and a little bit wrong, to operate alongside AI without a strong understanding of how the underlying mechanisms work. Naturally, I had to write a transformer, and Neel Nanda&#8217;s &#8221;GPT-2 From Scratch&#8221; was my resource of choice&#8230;This post is meant to document my process of learning and to address some of the questions I was curious about when implementing the transformer for the first time. It includes an overview of transformer basics and some of my intuitions, followed by some of the points of interest (transformer secrets, if you will) and challenges I ran into&#8230;<br></p></li><li><p><strong><a href="https://simonwillison.net/2026/May/19/5-minute-llms/">The last six months in LLMs in five minutes</a></strong><br>I presented this lightning talk at PyCon US 2026, attempting to summarize the last six months of developments in LLMs in five minutes&#8230;.<code><br></code></p></li><li><p><strong><a href="https://remlapmot.github.io/post/2026/runiverse-tips/">Five tips for managing your R-universe</a><br></strong>rOpenSci&#8217;s R-universe system is an open source platform allowing users to create their own CRAN-like universe of R packages&#8230;This post gives five tips I have developed to help manage my R-universe&#8230;<br></p></li><li><p><strong><a href="https://blog.skypilot.co/research-driven-agents/">Research-Driven Agents: What Happens When Your Agent Reads Before It Codes</a><br></strong>Coding agents working from code alone generate shallow hypotheses. Adding a research phase &#8212; arxiv papers, competing forks, other backends &#8212; produced 5 kernel fusions that made llama.cpp CPU inference 15% faster.<br></p></li><li><p><strong><a href="https://people.duke.edu/~hpgavin/SystemID/References/Ribeiro-KalmanFilter-2004.pdf">Kalman and Extended Kalman Filters: Concept, Derivation and Properties</a></strong></p><p>This report presents and derives the Kalman filter and the Extended Kalman filter dynamics. The general filtering problem is formulated and it is shown that, under linearity and Gaussian conditions on the systems dynamics, the general filter particularizes to the Kalman filter. It is shown that the Kalman filter is a linear, discrete time, finite dimensional time-varying system that evaluates the state estimate that minimizes the mean-square error&#8230;<br></p></li><li><p><strong><a href="https://errorstatistics.com/2026/05/11/39531/">How not to turn power on its head</a></strong><br>In giving some informal remarks about power at a seminar a couple of weeks ago, I proposed that the tendency to turn the notion of power on its head might be avoided by imagining we need to define a test&#8217;s error probabilities in terms of its power alone. We can refer to the power against the null hypothesis, rather than alluding to a type 1 error probability, for example&#8230;What do I mean by turning power on its head? I mean, at least here, supposing that a test provides poor evidence of discrepancies that the test has low power to detect&#8230;<br></p></li><li><p><strong><a href="https://rworks.dev/posts/atlas-learn-sphere/">The Atlas-Learn Approach to the Manifold Hypothesis</a></strong></p><p>The 2025 paper by Robinett et al., &#8216;Atlas-based Manifold Representations for Interpretable Riemannian Machine Learning&#8217;, provides an algorithm for fitting a low dimensional manifold from a point cloud by means of a novel algorithm for approximating an atlas of charts. This post illustrates the Atlas-Learn method by reconstructing a sphere from a 3D point cloud of naive random samples and works through some checks on accuracy&#8230;<br></p></li><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1th87u4/are_there_any_small_quick_things_i_can_do/">Are there any small, quick things I can do everyday to keep my skills sharp? [Reddit]</a><br></strong>I&#8217;m sure everyone knows about the dilemma of AI at this point. We want to work faster but our skills are atrophying yada yada&#8230;as a junior data scientist, I feel like I barely had any skills to begin with. Now with my company forcing us to use AI, I feel like I&#8217;m not learning much. Now I&#8217;ve been doing leetcode, but I just don&#8217;t think it&#8217;s that applicable to my real job. I don&#8217;t have the bandwidth outside of work to do a project yet, since my company is working us to the bone. What are some quick habits/tools/websites/apps you recommend to keep your skills sharp?..<br></p></li><li><p><strong><a href="https://www.counting-stuff.com/the-measurement-of-loudness/">The Measurement of Loudness</a><br></strong>I&#8217;m not a sound engineer of any sort, but I enjoy music and have been blessed with decent hearing acuity, so I tend to pay attention to noises going on around me. Now, I know what you&#8217;re thinking! Surely, a measurement nerd interested in sound would have bought a cheap SPL meter off the internet and this is what this post is about. And you&#8217;d be wrong! Hah! Because this post goes a bit further off the deep end because SPL and the dB(a) scales that we commonly associate with &#8220;sound volume&#8221; always confused me when I tried to understand them. Like with how measuring color is really difficult because it&#8217;s at the intersection of a physical measurement and human perception (see: How the heck does one measure color?), sound is just as messy because it&#8217;s again physical measurements (sound pressure) mediated by the human auditory system. To measure loudness, we&#8217;re going to have to go back a bit in history&#8230;</p></li></ul><p>.</p><div><hr></div><h2>Last Week's Newsletter's 3 Most Clicked Links</h2><ul><li><p><strong><a href="https://idlemachines.co.uk/essays/softmax">Softmax, can you really derive the Jacobian? And should you care?</a></strong></p></li><li><p><strong><a href="https://kyunghyuncho.me/teaching-fundamentals-of-machine-learning/">Teaching &lt;Fundamentals of Machine Learning&gt;</a></strong></p></li><li><p><strong><a href="https://link.springer.com/article/10.1007/s42113-026-00271-1">Illusions of Understanding in the Sciences</a></strong></p></li></ul><p>.<br>* Based on unique clicks.<br>** Please take a look at last week's issue #651 <a href="https://datascienceweekly.substack.com/p/data-science-weekly-issue-651">here</a>.</p><div><hr></div><h2>Cutting Room Floor</h2><ul><li><p><strong><a href="https://xianblog.wordpress.com/2026/05/13/the-vexing-hausdorff-measure/">the vexing Hausdorff measure</a></strong></p></li><li><p><strong><a href="https://robjhyndman.com/publications/mvhts.html">Multivariate reconciliation for hierarchical time series</a></strong></p></li><li><p><strong><a href="https://possiblywrong.wordpress.com/2026/05/18/comments-on-what-every-experimenter-must-know-about-randomization/">Comments on: What Every Experimenter Must Know About Randomization</a></strong></p></li><li><p><strong><a href="https://www.rilldata.com/blog/introducing-metrics-sql-a-sql-based-semantic-layer-for-humans-and-agents">Introducing Metrics SQL: A SQL-based semantic layer for humans and agents</a></strong></p></li><li><p><strong><a href="https://ropensci.org/blog/2026/04/08/r-universe-bioc/">Collaborating between Bioconductor and R-universe on Development of Common Infrastructure</a></strong></p></li></ul><p>.</p><div><hr></div><h2><strong>Whenever you're ready, 3 ways we can help:</strong><br></h2><ol><li><p><strong>Go deeper each week (paid subscription)</strong><br>Get 3 additional posts per week designed to help you:</p><ul><li><p>Statistics &#8594; understand the math behind ML</p></li><li><p>AI Agents &#8594; build with modern AI tools</p></li><li><p>Career &#8594; become more valuable at your job</p></li></ul><p><strong>&#128073; <a href="https://datascienceweekly.substack.com/subscribe">Upgrade for $10/month &#8212; cancel anytime</a><br></strong></p></li><li><p><strong>Looking to get a job?</strong><br>A practical guide to landing your first (or next) data science role, based on thousands of reader questions.<br><strong>&#128073; <a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">Check out our </a></strong><em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">&#8220;Get A Data Science Job&#8221;</a></strong></em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide"> Course</a></strong><br></p></li><li><p><strong>Promote your organization/project/event to ~68,500 subscribers<br></strong>Sponsor this newsletter and reach a highly engaged data science audience (30&#8211;35% open rate).<br><strong>&#128073; Reply to this email to learn more</strong></p></li></ol><div><hr></div><p>Thank you for joining us this week! :)</p><p>Stay Data Science-y!</p><p>All our best,<br>Hannah &amp; Sebastian</p><div><hr></div><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://datascienceweekly.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Data Science Weekly Newsletter is a reader-supported publication. To receive new posts and support our work, consider becoming a free or paid subscriber.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div>]]></content:encoded></item><item><title><![CDATA[Tools: Why AI Agents Need Them]]></title><description><![CDATA[Tools allow AI agents to interact with the world]]></description><link>https://datascienceweekly.substack.com/p/tools-why-ai-agents-need-them</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/tools-why-ai-agents-need-them</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Wed, 20 May 2026 23:03:55 GMT</pubDate><enclosure url="https://images.unsplash.com/reserve/oIpwxeeSPy1cnwYpqJ1w_Dufer%20Collateral%20test.jpg?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/reserve/oIpwxeeSPy1cnwYpqJ1w_Dufer%20Collateral%20test.jpg?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/reserve/oIpwxeeSPy1cnwYpqJ1w_Dufer%20Collateral%20test.jpg?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 424w, https://images.unsplash.com/reserve/oIpwxeeSPy1cnwYpqJ1w_Dufer%20Collateral%20test.jpg?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 848w, https://images.unsplash.com/reserve/oIpwxeeSPy1cnwYpqJ1w_Dufer%20Collateral%20test.jpg?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1272w, https://images.unsplash.com/reserve/oIpwxeeSPy1cnwYpqJ1w_Dufer%20Collateral%20test.jpg?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1456w" sizes="100vw"><img src="https://images.unsplash.com/reserve/oIpwxeeSPy1cnwYpqJ1w_Dufer%20Collateral%20test.jpg?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" width="3000" height="2436" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/reserve/oIpwxeeSPy1cnwYpqJ1w_Dufer%20Collateral%20test.jpg?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:2436,&quot;width&quot;:3000,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;clothes iron, hammer, axe, flashlight and pitcher on brown wooden table&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="clothes iron, hammer, axe, flashlight and pitcher on brown wooden table" title="clothes iron, hammer, axe, flashlight and pitcher on brown wooden table" srcset="https://images.unsplash.com/reserve/oIpwxeeSPy1cnwYpqJ1w_Dufer%20Collateral%20test.jpg?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 424w, https://images.unsplash.com/reserve/oIpwxeeSPy1cnwYpqJ1w_Dufer%20Collateral%20test.jpg?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 848w, https://images.unsplash.com/reserve/oIpwxeeSPy1cnwYpqJ1w_Dufer%20Collateral%20test.jpg?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1272w, https://images.unsplash.com/reserve/oIpwxeeSPy1cnwYpqJ1w_Dufer%20Collateral%20test.jpg?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Image Source: <a href="https://unsplash.com/photos/clothes-iron-hammer-axe-flashlight-and-pitcher-on-brown-wooden-table-IClZBVw5W5A">Todd Quackenbush</a></figcaption></figure></div>
      <p>
          <a href="https://datascienceweekly.substack.com/p/tools-why-ai-agents-need-them">
              Read more
          </a>
      </p>
   ]]></content:encoded></item><item><title><![CDATA[Monday Statistics: Why Averages Can Mislead]]></title><description><![CDATA[When your data is skewed, the &#8220;average&#8221; may not represent reality]]></description><link>https://datascienceweekly.substack.com/p/monday-statistics-why-averages-can</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/monday-statistics-why-averages-can</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Mon, 18 May 2026 22:32:14 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1549096454-1b8ba2ef8f1c?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1549096454-1b8ba2ef8f1c?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1549096454-1b8ba2ef8f1c?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 424w, https://images.unsplash.com/photo-1549096454-1b8ba2ef8f1c?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 848w, https://images.unsplash.com/photo-1549096454-1b8ba2ef8f1c?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1272w, https://images.unsplash.com/photo-1549096454-1b8ba2ef8f1c?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1549096454-1b8ba2ef8f1c?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" width="3000" height="2003" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1549096454-1b8ba2ef8f1c?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:2003,&quot;width&quot;:3000,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;short-furred white cat&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="short-furred white cat" title="short-furred white cat" srcset="https://images.unsplash.com/photo-1549096454-1b8ba2ef8f1c?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 424w, https://images.unsplash.com/photo-1549096454-1b8ba2ef8f1c?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 848w, https://images.unsplash.com/photo-1549096454-1b8ba2ef8f1c?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1272w, https://images.unsplash.com/photo-1549096454-1b8ba2ef8f1c?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption"><em>Image Source: <a href="https://unsplash.com/photos/short-furred-white-cat-diLm-niNsJk">Gaelle Marcel</a></em></figcaption></figure></div>
      <p>
          <a href="https://datascienceweekly.substack.com/p/monday-statistics-why-averages-can">
              Read more
          </a>
      </p>
   ]]></content:encoded></item><item><title><![CDATA[Figure Out Who Your Competition Is]]></title><description><![CDATA[If you applied for a job next week, you&#8217;d be competing with a set of candidates. You should find out who they are and what they are doing.]]></description><link>https://datascienceweekly.substack.com/p/figure-out-who-your-competition-is</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/figure-out-who-your-competition-is</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Fri, 15 May 2026 12:35:20 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1582213782179-e0d53f98f2ca?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1582213782179-e0d53f98f2ca?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1582213782179-e0d53f98f2ca?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 424w, https://images.unsplash.com/photo-1582213782179-e0d53f98f2ca?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 848w, https://images.unsplash.com/photo-1582213782179-e0d53f98f2ca?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1272w, https://images.unsplash.com/photo-1582213782179-e0d53f98f2ca?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1582213782179-e0d53f98f2ca?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" width="3000" height="2000" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1582213782179-e0d53f98f2ca?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:2000,&quot;width&quot;:3000,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;person in red sweater holding babys hand&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="person in red sweater holding babys hand" title="person in red sweater holding babys hand" srcset="https://images.unsplash.com/photo-1582213782179-e0d53f98f2ca?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 424w, https://images.unsplash.com/photo-1582213782179-e0d53f98f2ca?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 848w, https://images.unsplash.com/photo-1582213782179-e0d53f98f2ca?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1272w, https://images.unsplash.com/photo-1582213782179-e0d53f98f2ca?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption"><em>Image Source: <a href="https://unsplash.com/photos/person-in-red-sweater-holding-babys-hand-Zyx1bK9mqmA">Hannah Busing</a></em></figcaption></figure></div>
      <p>
          <a href="https://datascienceweekly.substack.com/p/figure-out-who-your-competition-is">
              Read more
          </a>
      </p>
   ]]></content:encoded></item><item><title><![CDATA[Data Science Weekly - Issue 651]]></title><description><![CDATA[Curated news, articles and jobs related to Data Science, AI, & Machine Learning]]></description><link>https://datascienceweekly.substack.com/p/data-science-weekly-issue-651</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/data-science-weekly-issue-651</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Thu, 14 May 2026 20:23:26 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!obNH!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cde0e3c-58c5-49de-8783-47919460d244_1136x670.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!byfl!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" width="319" height="253" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/17becea5-db12-4465-be92-858de78b9137_319x253.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:253,&quot;width&quot;:319,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;Data Science Weekly&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="Data Science Weekly" title="Data Science Weekly" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2><strong>Issue #651<br>May 14, 2026<br></strong></h2><div><hr></div><p>Hello!</p><p><strong>Once a week, we write this email to share the links we thought were worth sharing in the Data Science, ML, AI, Data Visualization, and ML/Data Engineering worlds.</strong></p><div><hr></div><p><em><strong>And now&#8230;let&#8217;s dive into some interesting links from this week.</strong></em></p><div><hr></div><h2><strong>Editor's Picks<br></strong></h2><ul><li><p><strong><a href="https://www.jackhogan.me/blog/marco-polo">Marco Polo: Finding a friend with only distance and motion.</a><br></strong>You walk into a cafe, looking for your friend. Seems like an easy task, until you see it&#8217;s so packed that you can&#8217;t see through the crowd at all, and everyone&#8217;s talking so loud that you can barely hear anything. The only things you know are your movements, and how far you are from your friend (through the special psychic bond you two share). How will you find each other?...I wanted to solve the exact same problem, but with devices instead of people (so no psychic connection for me), existing in a space of hundreds of other devices. Working the problem taught me a lot of really interesting science relating to robotics and state estimation, and I wrote this post so you can learn, too&#8230;</p></li></ul><ul><li><p><strong><a href="https://burrito.bio/essays/biology-is-a-burrito">Biology is a Burrito</a></strong><br>A bacterium&#8217;s genome, pulled into a straight thread, is nearly 1,000 times longer than the cell from which it came. If you placed one E. coli into a gallon-sized jug with some nutrients and waited a few hours, the genomes of its descendants, placed end-to-end, would reach to the moon and back...several times&#8230;.The truth is that biochemistry textbooks often depict cells as spacious places, where molecules float in secluded harmony. &#8220;But a cell looks more like a burrito,&#8221; says Michael Elowitz, a biologist at Caltech. All the biochemicals are pushed together, bumping into each other&#8230;</p><p></p></li><li><p><strong><a href="https://idlemachines.co.uk/essays/softmax">Softmax, can you really derive the Jacobian? And should you care?</a></strong><br>Multiclass output? Softmax. Normalising probabilities? Softmax. Attention weights? Softmax. Partition function? You guessed it, Softmax. This function comes up everywhere, but how often have you really thought about what&#8217;s going on inside?&#8230;What does softmax actually do to your distribution?&#8230;The softmax function is deceptively simple&#8230;</p></li></ul><div><hr></div><h1><strong>What&#8217;s on your mind</strong></h1><h2>This Week&#8217;s Poll:</h2><p></p><p>.</p><h2>Last Week&#8217;s Poll:</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!obNH!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cde0e3c-58c5-49de-8783-47919460d244_1136x670.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!obNH!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cde0e3c-58c5-49de-8783-47919460d244_1136x670.png 424w, https://substackcdn.com/image/fetch/$s_!obNH!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cde0e3c-58c5-49de-8783-47919460d244_1136x670.png 848w, https://substackcdn.com/image/fetch/$s_!obNH!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cde0e3c-58c5-49de-8783-47919460d244_1136x670.png 1272w, https://substackcdn.com/image/fetch/$s_!obNH!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cde0e3c-58c5-49de-8783-47919460d244_1136x670.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!obNH!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cde0e3c-58c5-49de-8783-47919460d244_1136x670.png" width="600" height="353.8732394366197" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/5cde0e3c-58c5-49de-8783-47919460d244_1136x670.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:670,&quot;width&quot;:1136,&quot;resizeWidth&quot;:600,&quot;bytes&quot;:68648,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://datascienceweekly.substack.com/i/197745894?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cde0e3c-58c5-49de-8783-47919460d244_1136x670.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!obNH!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cde0e3c-58c5-49de-8783-47919460d244_1136x670.png 424w, https://substackcdn.com/image/fetch/$s_!obNH!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cde0e3c-58c5-49de-8783-47919460d244_1136x670.png 848w, https://substackcdn.com/image/fetch/$s_!obNH!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cde0e3c-58c5-49de-8783-47919460d244_1136x670.png 1272w, https://substackcdn.com/image/fetch/$s_!obNH!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cde0e3c-58c5-49de-8783-47919460d244_1136x670.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>.</p><div><hr></div><h2>Data Science Articles &amp; Videos</h2><p></p><ul><li><p><strong><a href="https://link.springer.com/article/10.1007/s42113-026-00271-1">Illusions of Understanding in the Sciences</a></strong><br>The first part of this essay supports the case for the universality of partial and incomplete levels of understanding by showing the difficulty of reaching a deep level of understanding for even a simple analysis and model that most scientists use and believe they understand: linear regression. The second part highlights some implications of the existence of many levels of understanding and explanation, and their use by scientists for design, testing, analysis, and theory development. It discusses the way that deduction and induction depend on the levels of understanding and the implications of the illusion that a scientist&#8217;s understanding is deep&#8230;<br></p></li><li><p><strong><a href="https://www.reddit.com/r/MachineLearning/comments/1t72u1r/people_interested_in_continual_learning_researchr/">People Interested in Continual Learning Research [Reddit]</a></strong></p><p>Recently, I&#8217;ve become fascinated by Continual Learning, especially the idea of AI systems that can continuously adapt and improve from experience rather than staying static after training. I&#8217;m a student just starting my journey in CL research and would love to connect with people exploring similar ideas. Whether you&#8217;re a student, researcher, or just curious about the field, feel free to DM me. Would also love paper recommendations and interesting research directions&#8230;</p><p></p></li><li><p><strong><a href="https://www.youtube.com/watch?v=eSZ9FB5Dqnk">You Should Probably Map That: Introduction to Geospatial Analysis in R</a><br></strong>Anjile An, Weill Cornell Medical College&#8230;Data comes in many forms, but the spatial components can be overlooked. You&#8217;ll get some history of mapping and learn the basic building blocks of spatial data.  The demo portion will go over how to use the trusty {ggplot2} as well as some new tools like {sf} and {tmap} to plot different types of spatial data&#8230;<br></p></li><li><p><strong><a href="https://kiro.dev/blog/deep-spec-analysis/">Requirements analysis: catching requirement bugs before they become code</a><br></strong>Every experienced engineer has a story where a feature shipped, worked on the happy path, and then quietly did the wrong thing on some edge case no one had thought about. Trace the bug back far enough and it rarely ends at the code; it ends at a sentence in a requirement document that meant one thing to the person who wrote it and something else to the person who implemented it&#8230;<br></p></li><li><p><strong><a href="https://kyunghyuncho.me/teaching-fundamentals-of-machine-learning/">Teaching &lt;Fundamentals of Machine Learning&gt;</a></strong></p><p>This past spring, i taught &lt;Fundamentals of Machine Learning&gt; for computer science seniors (with some juniors as well as seniors from other majors, including data science and economics) at NYU. last time i taught this course, the course was titled &lt;Introduction to Machine Learning&gt;, it was pre-ChatGPT and it was pre-pandemic; in fact, i was teaching this course in the spring of 2020, and the whole university, city and world went into its first lock down mid-way. in other words, i taught this course in the old world, and i was asked to teach this course in this brave new world&#8230;<br></p></li><li><p><strong><a href="https://robotchinwag.com/posts/jensen-shannon-divergence-visualisation/">Interactive Jensen&#8211;Shannon Divergence Visualisation</a></strong><br>An interactive visualisation of Jensen&#8211;Shannon divergence - the symmetric, always-finite cousin of KL. Shape two distributions and watch JSD, its ceiling of one bit, and the per-point contribution respond in real time&#8230;<code><br></code></p></li><li><p><strong><a href="https://puntofisso.net/eurovision/">70 years of love, empowerment, and freedom. Here&#8217;s a look at Eurovision by its lyrics.</a><br></strong>Famous for its upbeat rhythms, flamboyant performances, and political voting patterns, the competition has another dimension that moves with the zeitgeist: its song lyrics&#8230;<br></p></li><li><p><strong><a href="https://margaretstorey.com/blog/2026/02/18/cognitive-debt-revisited/">What I&#8217;m Hearing About Cognitive Debt (So Far)</a><br></strong>A week ago, I wrote about how Generative and Agentic AI may be amplifying what I&#8217;ve been calling cognitive debt: the accumulated gap between a system&#8217;s evolving structure and a team&#8217;s shared understanding of how and why that system works and can be changed over time. The post sparked thoughtful discussion across different communities. Rather than respond thread by thread, I want to synthesize what I&#8217;m hearing and connect it to other reflections I&#8217;ve been reading. I will likely update this as the conversation evolves&#8230;<br></p></li><li><p><strong><a href="https://ivanpleshkov.dev/blog/polynomial-autoencoder/">Polynomial autoencoder</a></strong></p><p>The most direct way to compress an embedding (other than quantization) is to fit PCA on the corpus and keep the top-d eigenvectors. It works, but PCA is a linear projection, and neural-network embeddings on the sphere are structurally nonlinear &#8212; the well-known cone effect in transformers. Some of the variance lives in a nonlinear tail that a linear decoder can&#8217;t reach&#8230;This post is about a closed-form way to add a quadratic decoder on top of PCA, to capture part of that nonlinear tail. The encoder stays as plain PCA. The decoder is a degree-2 polynomial lift plus Ridge OLS (ordinary linear regression with L2 regularization), also closed-form. No SGD, no epochs, no hyperparameter search. One np.linalg.solve over corpus statistics&#8230;<br></p></li><li><p><strong><a href="https://brrrviz.com/">Visualize the Brrr - Learn GPU programming</a></strong><br><strong>Who This Is For: </strong>This is for anyone interested in GPU programming or performance engineering, whether you&#8217;re writing CUDA, HIP, Triton, cuTile, Gluon, Helion, JAX, or nothing at all. If you&#8217;ve ever struggled to conceptualize parallelism, memory coalescing, or tiling, these visualizations are meant to make those ideas concrete. No prior GPU experience required.</p><p><strong>What You&#8217;ll Learn: </strong>The lessons walk through fundamental concepts of GPU programming, parallelism, memory hierarchy, and more. Each chapter pairs a short explanation with an interactive visualization you can poke at&#8230;<br></p></li><li><p><strong><a href="https://github.com/RussellSB/pytrendy">PyTrendy</a></strong></p><p>PyTrendy is a robust solution for identifying and analyzing trends in time series. Unlike other trend detection packages, it is robust to noisy &amp; flat segments, and handles for gradual &amp; abrupt trend cases with a high precision. It aims to be the best package for trend detection in python&#8230;<br></p></li><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1sw6b6w/standardization_vs_log_transform/">Standardization vs Log transform? [Reddit]</a><br></strong>I have been trying to understand the use cases of both of these and I am really confused. I know log transform fixes the features and makes their distribution normal and standardization on the other hand only fixes the scale of the feature by keeping the distribution the same. Are these things which I use one after the other ? Or just simply use one depending on the case (which I also don&#8217;t understand when) ?&#8230;<br></p></li><li><p><strong><a href="https://www.seascapemodels.org/posts/2026-03-28-agentic-AI-ecological-modelling/">AI agents can create convincing ecological models, but you still need to know what you&#8217;re doing</a><br></strong>Agentic AI tools like Claude Code can write and run code, fix its own errors, and produce a formatted report with figures. I wanted to know whether that translates into reliable ecological modelling, so we ran a test: three fisheries tasks, four AI models, ten independent runs each, scored against a rubric. The results are published in <em>Fish and Fisheries</em>. We found agents can be genuinely useful, but only if you know how to use them well and only if you know enough about the analysis to catch what they miss&#8230;</p></li></ul><p>.</p><div><hr></div><h2>Last Week's Newsletter's 3 Most Clicked Links</h2><ul><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1t2nasr/a_decade_of_being_an_average_data_scientist_my/">A decade of being an average Data Scientist! My personal experience [Reddit].</a></strong></p></li><li><p><strong><a href="https://www.interconnects.ai/p/notes-from-inside-chinas-ai-labs">Notes from inside China&#8217;s AI labs: Lessons from my trip to talk to most of the leading AI labs in China.</a></strong></p></li><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1t19v2s/ds_market_is_kind_of_insane_right_now/">DS market is kind of insane right now [Reddit]</a></strong></p></li></ul><p>.<br>* Based on unique clicks.<br>** Please take a look at last week's issue #650 <a href="https://datascienceweekly.substack.com/p/data-science-weekly-issue-650">here</a>.</p><div><hr></div><h2>Cutting Room Floor</h2><ul><li><p><strong><a href="https://arxiv.org/abs/1912.10642">Notes on Category Theory with examples from basic mathematics</a></strong></p></li><li><p><strong><a href="https://planetscale.com/learn/courses/mysql-for-developers">MySQL for Developers</a></strong></p></li><li><p><strong><a href="https://metr.org/blog/2025-07-10-early-2025-ai-experienced-os-dev-study/">Measuring the Impact of Early-2025 AI on Experienced Open-Source Developer Productivity</a></strong></p></li><li><p><strong><a href="https://www.seascapemodels.org/posts/2026-04-23-clear-plots-ggplot-for-mobile/">Design your plots (ggplot) for mobile</a></strong></p></li><li><p><strong><a href="https://rtichoke.netlify.app/posts/assessing-score-reliability.html">Assessing Credit Score Prediction Reliability Using Bootstrap Resampling</a></strong></p></li><li><p><strong><a href="https://appliedscientific.ai/research/scientific-ai-literature-agent-nvidia-nemotron-nano-omni">The Figure Problem in Scientific AI: Building a Multimodal Literature Agent for Biology, Powered by NVIDIA Nemotron 3 Nano Omni</a></strong></p></li><li><p><strong><a href="https://mfatihtuzen.github.io/posts/2026-04-24_quarto_blog_github/">Publishing a Quarto Blog: What I Learned Moving from Netlify to GitHub Pages</a></strong></p></li></ul><p>.</p><div><hr></div><h2><strong>Whenever you're ready, 3 ways we can help:</strong><br></h2><ol><li><p><strong>Go deeper each week (paid subscription)</strong><br>Get 3 additional posts per week designed to help you:</p><ul><li><p>Statistics &#8594; understand the math behind ML</p></li><li><p>AI Agents &#8594; build with modern AI tools</p></li><li><p>Career &#8594; become more valuable at your job</p></li></ul><p><strong>&#128073; <a href="https://datascienceweekly.substack.com/subscribe">Upgrade for $10/month &#8212; cancel anytime</a><br></strong></p></li><li><p><strong>Looking to get a job?</strong><br>A practical guide to landing your first (or next) data science role, based on thousands of reader questions.<br><strong>&#128073; <a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">Check out our </a></strong><em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">&#8220;Get A Data Science Job&#8221;</a></strong></em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide"> Course</a></strong><br></p></li><li><p><strong>Promote your organization/project/event to ~68,500 subscribers<br></strong>Sponsor this newsletter and reach a highly engaged data science audience (30&#8211;35% open rate).<br><strong>&#128073; Reply to this email to learn more</strong></p></li></ol><div><hr></div><p>Thank you for joining us this week! :)</p><p>Stay Data Science-y!</p><p>All our best,<br>Hannah &amp; Sebastian</p><div><hr></div><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://datascienceweekly.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Data Science Weekly Newsletter is a reader-supported publication. To receive new posts and support our work, consider becoming a free or paid subscriber.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div>]]></content:encoded></item><item><title><![CDATA[AI Agents for Data Scientists: Automations vs Agents]]></title><description><![CDATA[Why boring workflows with one LLM call often outperform &#8220;fully autonomous&#8221; systems]]></description><link>https://datascienceweekly.substack.com/p/ai-agents-for-data-scientists-automations</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/ai-agents-for-data-scientists-automations</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Wed, 13 May 2026 14:30:10 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1607601191544-fd61c99dd3c9?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1607601191544-fd61c99dd3c9?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1607601191544-fd61c99dd3c9?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 424w, https://images.unsplash.com/photo-1607601191544-fd61c99dd3c9?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 848w, https://images.unsplash.com/photo-1607601191544-fd61c99dd3c9?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1272w, https://images.unsplash.com/photo-1607601191544-fd61c99dd3c9?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1607601191544-fd61c99dd3c9?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" width="3000" height="1995" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1607601191544-fd61c99dd3c9?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1995,&quot;width&quot;:3000,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;red and green plastic toy&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="red and green plastic toy" title="red and green plastic toy" srcset="https://images.unsplash.com/photo-1607601191544-fd61c99dd3c9?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 424w, https://images.unsplash.com/photo-1607601191544-fd61c99dd3c9?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 848w, https://images.unsplash.com/photo-1607601191544-fd61c99dd3c9?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1272w, https://images.unsplash.com/photo-1607601191544-fd61c99dd3c9?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption"><em>Image Source: <a href="https://unsplash.com/photos/red-and-green-plastic-toy-jS_T9wWFTyE">Brian Kamau</a></em></figcaption></figure></div>
      <p>
          <a href="https://datascienceweekly.substack.com/p/ai-agents-for-data-scientists-automations">
              Read more
          </a>
      </p>
   ]]></content:encoded></item><item><title><![CDATA[Monday Statistics: Skewed Data and Transformations]]></title><description><![CDATA[Why your data looks &#8220;lopsided,&#8221; and what to do about it]]></description><link>https://datascienceweekly.substack.com/p/monday-statistics-skewed-data-and</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/monday-statistics-skewed-data-and</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Mon, 11 May 2026 21:39:22 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1762889577454-6c29b20b0e9b?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1762889577454-6c29b20b0e9b?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1762889577454-6c29b20b0e9b?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 424w, https://images.unsplash.com/photo-1762889577454-6c29b20b0e9b?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 848w, https://images.unsplash.com/photo-1762889577454-6c29b20b0e9b?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1272w, https://images.unsplash.com/photo-1762889577454-6c29b20b0e9b?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1762889577454-6c29b20b0e9b?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" width="3000" height="2000" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1762889577454-6c29b20b0e9b?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:2000,&quot;width&quot;:3000,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;Modern building with glass and red brick facade&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="Modern building with glass and red brick facade" title="Modern building with glass and red brick facade" srcset="https://images.unsplash.com/photo-1762889577454-6c29b20b0e9b?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 424w, https://images.unsplash.com/photo-1762889577454-6c29b20b0e9b?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 848w, https://images.unsplash.com/photo-1762889577454-6c29b20b0e9b?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1272w, https://images.unsplash.com/photo-1762889577454-6c29b20b0e9b?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption"><em>Image Source: <a href="https://unsplash.com/photos/modern-building-with-glass-and-red-brick-facade-awLg1eJFhaU">Pix Tresa</a></em></figcaption></figure></div>
      <p>
          <a href="https://datascienceweekly.substack.com/p/monday-statistics-skewed-data-and">
              Read more
          </a>
      </p>
   ]]></content:encoded></item><item><title><![CDATA[Data Science Weekly - Issue 650]]></title><description><![CDATA[Curated news, articles and jobs related to Data Science, AI, & Machine Learning]]></description><link>https://datascienceweekly.substack.com/p/data-science-weekly-issue-650</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/data-science-weekly-issue-650</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Thu, 07 May 2026 20:50:12 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!gZvZ!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8a305f6c-c067-4773-b025-2fb7676fde03_1164x634.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!byfl!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" width="319" height="253" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/17becea5-db12-4465-be92-858de78b9137_319x253.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:253,&quot;width&quot;:319,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;Data Science Weekly&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="Data Science Weekly" title="Data Science Weekly" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2><strong>Issue #650<br>May 07, 2026<br></strong></h2><div><hr></div><p>Hello!</p><p><strong>Once a week, we write this email to share the links we thought were worth sharing in the Data Science, ML, AI, Data Visualization, and ML/Data Engineering worlds.</strong></p><div><hr></div><p><em><strong>And now&#8230;let&#8217;s dive into some interesting links from this week.</strong></em></p><div><hr></div><h2><strong>Editor's Picks<br></strong></h2><ul><li><p><strong><a href="https://www.interconnects.ai/p/notes-from-inside-chinas-ai-labs">Notes from inside China&#8217;s AI labs</a><br></strong>Lessons from my trip to talk to most of the leading AI labs in China&#8230;</p></li></ul><ul><li><p><strong><a href="https://www.kenkoonwong.com/blog/survival/">Learning &amp; Exploring Survival Analysis Part 1 - A Note To Myself</a></strong><br>A note to myself on survival analysis &#8212; KM curves, log-rank tests &amp; Cox models &#129518; If I wrote it the way I understood it, maybe I&#8217;ll actually remember it &#129310;&#8230;</p><p></p></li><li><p><strong><a href="https://www.youtube.com/watch?v=7OJlS2NW00g">Two Cartography Expert Review MOVIE MAPS</a></strong><br>John Nelson and Peter Attwood review maps in films. What they get right, what they might get wrong, and what we think of them as cartography nerds. Includes thoughts on: Indiana Jones, The Lord of the Rings, Avatar, War Games, Prometheus, Harry Potter, The Muppets, Pirates of the Caribbean, Game of Thrones, Moonrise Kingdom, The Goonies, and The Emperor&#8217;s New Groove&#8230;</p></li></ul><div><hr></div><h1><strong>What&#8217;s on your mind</strong></h1><h2>This Week&#8217;s Poll:</h2><div class="poll-embed" data-attrs="{&quot;id&quot;:508882}" data-component-name="PollToDOM"></div><p>.</p><h2>Last Week&#8217;s Poll:</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!gZvZ!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8a305f6c-c067-4773-b025-2fb7676fde03_1164x634.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!gZvZ!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8a305f6c-c067-4773-b025-2fb7676fde03_1164x634.png 424w, https://substackcdn.com/image/fetch/$s_!gZvZ!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8a305f6c-c067-4773-b025-2fb7676fde03_1164x634.png 848w, https://substackcdn.com/image/fetch/$s_!gZvZ!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8a305f6c-c067-4773-b025-2fb7676fde03_1164x634.png 1272w, https://substackcdn.com/image/fetch/$s_!gZvZ!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8a305f6c-c067-4773-b025-2fb7676fde03_1164x634.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!gZvZ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8a305f6c-c067-4773-b025-2fb7676fde03_1164x634.png" width="600" height="326.8041237113402" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/8a305f6c-c067-4773-b025-2fb7676fde03_1164x634.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:634,&quot;width&quot;:1164,&quot;resizeWidth&quot;:600,&quot;bytes&quot;:82342,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://datascienceweekly.substack.com/i/196824414?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8a305f6c-c067-4773-b025-2fb7676fde03_1164x634.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!gZvZ!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8a305f6c-c067-4773-b025-2fb7676fde03_1164x634.png 424w, https://substackcdn.com/image/fetch/$s_!gZvZ!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8a305f6c-c067-4773-b025-2fb7676fde03_1164x634.png 848w, https://substackcdn.com/image/fetch/$s_!gZvZ!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8a305f6c-c067-4773-b025-2fb7676fde03_1164x634.png 1272w, https://substackcdn.com/image/fetch/$s_!gZvZ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8a305f6c-c067-4773-b025-2fb7676fde03_1164x634.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>.</p><div><hr></div><h2>Data Science Articles &amp; Videos</h2><p></p><ul><li><p><strong><a href="https://kieranhealy.org/blog/archives/2026/05/02/bad-weather-and-the-subway/">Bad Weather and the Subway</a></strong><br>I&#8217;ve been looking at hourly ridership data from the New York City Subway. Last time we learned that people go to work in the morning and come home in the evening, for example. (All together now: &#8220;Only in New York, baby!&#8221;) Today, we&#8217;ll learn that bad weather makes people stay at home. Except, sometimes it doesn&#8217;t&#8230;<br></p></li><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1t2nasr/a_decade_of_being_an_average_data_scientist_my/">A decade of being an average Data Scientist! My personal experience. [Reddit]</a></strong></p><p>Hello! I know there&#8217;s people here with PhDs, working in FAANG, on top of the newest tech, and are absolutely brilliant Data Scientists. I&#8217;m not one of them&#8230;I just wanted to share my positive experience from someone who is painfully average lol!! I wanted to show people, especially new grads and/or people pivoting into the field, that you don&#8217;t have to be the smartest person in the room to get hired. You need to drill into the solid foundations and a have a drive to make change/bring value to a company&#8230;</p><p></p></li><li><p><strong><a href="https://www.goodfire.ai/research/the-world-inside-neural-networks#">The World Inside Neural Networks</a><br></strong>How neural geometry will unlock understanding and control of AI&#8230;If we understand how a model carves up and represents the world conceptually (i.e., its ontology), this will unlock a far deeper understanding of both its algorithms that operate over that ontology and the intelligent behaviors produced by those algorithms. We thus need new methods to gain that understanding; this series of posts details our early efforts to develop them, building upon &#8211; and alongside &#8211; numerous related efforts from others&#8230;<br></p></li><li><p><strong><a href="https://pawankjha.substack.com/p/quantum-machine-learning-the-pragmatic">Quantum Machine Learning: The Pragmatic Guide for classical ML Engineers</a><br></strong>Part 1 of the &#8220;Quantum ML for Engineers&#8221; series: From Transformers and GPUs to QPUs and Hybrid Intelligence&#8230;<br></p></li><li><p><strong><a href="https://opensource.posit.co/blog/2026-05-07_opentelemetry/">Bringing OpenTelemetry to R in production</a></strong><br>Posit has instrumented Shiny, plumber2, mirai, httr2, ellmer, knitr, testthat, and DBI with OpenTelemetry, and created tools for you to instrument your own packages, bringing production-grade observability to R&#8230;<br></p></li><li><p><strong><a href="https://ds100.org/sp26/">Data 100: Principles and Techniques of Data Science UC Berkeley, Spring 2026</a></strong><br>This intermediate level class bridges between Data 8 and upper division computer science and statistics courses as well as methods courses in other fields. In this class, we explore key areas of data science including question formulation, data collection and cleaning, visualization, statistical inference, predictive modeling, and decision making.&#8203; Through a strong emphasis on data centric computing, quantitative critical thinking, and exploratory data analysis, this class covers key principles and techniques of data science&#8230;<code><br></code></p></li><li><p><strong><a href="https://nejsds.nestat.org/journal/NEJSDS/article/114/info">Inverse Probability Weighting: From Survey Sampling to Evidence Estimation</a><br></strong>We consider the class of inverse probability weight (IPW) estimators, including the popular Horvitz&#8211;Thompson and H&#225;jek estimators used routinely in survey sampling, causal inference and for Bayesian computation. We focus on the &#8216;weak paradoxes&#8217; for these estimators due to two counterexamples by Basu (1988) and Wasserman (2004) and investigate the two natural Bayesian answers to this problem: one based on binning and smoothing: a &#8216;Bayesian sieve&#8217; and the other based on a conjugate hierarchical model that allows borrowing information via exchangeability&#8230;<br></p></li><li><p><strong><a href="https://blog.ephorie.de/the-magic-of-in-context-learning-icl-when-your-model-already-knows-your-data">The Magic of In-Context Learning (ICL): When Your Model Already Knows Your Data</a></strong><br>As an experienced data scientist, you have seen thousands of datasets in your career. When confronted with new data, your natural neural network (a.k.a. brain) simply draws on this vast library of past mathematical shapes and immediately recognizes the pattern. But what if an artificial neural network could do exactly the same thing? What if it could predict your data without actually being trained on it?&#8230;Welcome to the mind-bending world of <em>In-Context Learning (ICL)</em> for tabular data, brought to R via the incredible new <code>TabPFN</code> package (on CRAN)&#8230;<br></p></li><li><p><strong><a href="https://www.johndcook.com/blog/2026/04/30/derivative-of-relu/">Three ways to differentiate ReLU</a></strong></p><p>When a function is not differentiable in the classical sense there are multiple ways to compute a generalized derivative. This post will look at three generalizations of the classical derivative, each applied to the ReLU (rectified linear unit) function. The ReLU function is a commonly used activation function for neural networks. It&#8217;s also called the ramp function for obvious reasons&#8230;<br></p></li><li><p><strong><a href="https://thierrymoudiki.github.io//blog/2026/05/02/r/rvflnet">You Don&#8217;t Need to Learn All the Weights on tabular data: The Case for rvflnet (a nonlinear expressive glmnet) on regression, classification and survival analysis</a></strong><br>Random Vector Functional Link (RVFL) networks offer a simple yet powerful alternative to traditional neural networks for tabular data. Instead of learning hidden layers through backpropagation, RVFL generates them randomly (or not, if using a deterministic sequence of quasi-random numbers) and focuses all learning effort on a final, regularized linear model&#8230;<br></p></li><li><p><strong><a href="https://jcarroll.com.au/2026/05/04/comparing-r-s-targets-and-dbt-for-data-engineering/">Comparing R&#8217;s {targets} and dbt for Data Engineering</a></strong></p><p>I&#8217;m getting more and more into data engineering these days and having used R for a long time, I&#8217;m seeing a lot of problems that look nail-shaped to my R-shaped hammer. The available tools to solve those problems exist for (presumably) very good reasons, so I wanted to take some time to dig into how to use them and compare their workflows to what I would otherwise naively do in R&#8230;<br></p></li><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1t19v2s/ds_market_is_kind_of_insane_right_now/">DS market is kind of insane right now [Reddit]</a><br></strong>So here&#8217;s the story: another team in my company opened an associate-level DS role last week, we got 300+ applications, and somehow there were 30+ senior-level guys applying for it. Not fake senior either. Like actually senior all with 10+ yoe&#8230;.Curious that are other people &amp; teams seeing the same thing, or is this just a weird sample on our side?&#8230;<br></p></li><li><p><strong><a href="https://publicdomainreview.org/collection/visualizing-history-the-polish-system/">Visualizing History: The Polish System</a><br></strong>For the Polish educator Antoni Ja&#380;wi&#324;ski, history was best represented by an abstract grid &#8212; or at least it was for the purposes of remembering it. The so-called &#8220;Polish System&#8221; originated in the 1820s and was later brought to public attention in the 1830s and 1840s by General J&#243;zef Bem, a military engineer with a penchant for mnemonics&#8230;</p></li></ul><p>.</p><div><hr></div><h2>Last Week's Newsletter's 3 Most Clicked Links</h2><ul><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1srp178/warning_dont_get_gptbrained/">Warning: Don&#8217;t get GPT-brained [Reddit]</a></strong></p></li><li><p><strong><a href="https://www.youtube.com/watch?v=sxX8BMscce0">Principles for Autonomous System Design: OpenClaw Deep Dive</a></strong></p></li><li><p><strong><a href="https://perthirtysix.com/how-the-heck-does-shazam-work">How The Heck Does Shazam Work?</a></strong></p></li></ul><p>.<br>* Based on unique clicks.<br>** Please take a look at last week's issue #649 <a href="https://datascienceweekly.substack.com/p/data-science-weekly-issue-649">here</a>.</p><div><hr></div><h2>Cutting Room Floor</h2><ul><li><p><strong><a href="https://www.allendowney.com/blog/2026/05/01/planning-for-your-midlife-crisis/">Planning for your midlife crisis (or Counterfactual Analysis with Bayesian Models: What Drives the Life Expectancy Gap?)</a></strong></p></li><li><p><strong><a href="https://blog.isquaredsoftware.com/2026/05/ai-thoughts-part-1-fears-opinions-journey/">My Thoughts on AI, Part 1: Fears, Opinions, and Mental Journey</a></strong></p></li><li><p><strong><a href="https://yihui.org/en/2026/05/ai-reflections/">Reflections on AI-assisted Programming</a></strong></p></li><li><p><strong><a href="https://mindfulmodeler.substack.com/p/time-series-forecasting-with-tabular">Time series forecasting with tabular foundation models</a></strong></p></li><li><p><strong><a href="https://www.statsignificant.com/p/should-you-trust-the-netflix-top">Should You Trust the Netflix Top 10? A Statistical Analysis</a></strong></p></li></ul><p>.</p><div><hr></div><h2><strong>Whenever you're ready, 3 ways we can help:</strong><br></h2><ol><li><p><strong>Go deeper each week (paid subscription)</strong><br>Get 3 additional posts per week designed to help you:</p><ul><li><p>Statistics &#8594; understand the math behind ML</p></li><li><p>AI Agents &#8594; build with modern AI tools</p></li><li><p>Career &#8594; become more valuable at your job</p></li></ul><p><strong>&#128073; <a href="https://datascienceweekly.substack.com/subscribe">Upgrade for $10/month &#8212; cancel anytime</a><br></strong></p></li><li><p><strong>Looking to get a job?</strong><br>A practical guide to landing your first (or next) data science role, based on thousands of reader questions.<br><strong>&#128073; <a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">Check out our </a></strong><em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">&#8220;Get A Data Science Job&#8221;</a></strong></em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide"> Course</a></strong><br></p></li><li><p><strong>Promote your organization/project/event to ~68,500 subscribers<br></strong>Sponsor this newsletter and reach a highly engaged data science audience (30&#8211;35% open rate).<br><strong>&#128073; Reply to this email to learn more</strong></p></li></ol><div><hr></div><p>Thank you for joining us this week! :)</p><p>Stay Data Science-y!</p><p>All our best,<br>Hannah &amp; Sebastian</p><div><hr></div><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://datascienceweekly.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Data Science Weekly Newsletter is a reader-supported publication. To receive new posts and support our work, consider becoming a free or paid subscriber.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div>]]></content:encoded></item><item><title><![CDATA[Data Science Weekly - Issue 649]]></title><description><![CDATA[Curated news, articles and jobs related to Data Science, AI, & Machine Learning]]></description><link>https://datascienceweekly.substack.com/p/data-science-weekly-issue-649</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/data-science-weekly-issue-649</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Thu, 30 Apr 2026 21:37:33 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!nTV4!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93db8bd7-89d2-41e1-9018-6b1f622271c9_1138x754.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!byfl!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" width="319" height="253" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/17becea5-db12-4465-be92-858de78b9137_319x253.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:253,&quot;width&quot;:319,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;Data Science Weekly&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="Data Science Weekly" title="Data Science Weekly" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2><strong>Issue #649<br>April 30, 2026<br></strong></h2><div><hr></div><p>Hello!</p><p><strong>Once a week, we write this email to share the links we thought were worth sharing in the Data Science, ML, AI, Data Visualization, and ML/Data Engineering worlds.</strong></p><div><hr></div><p><em><strong>And now&#8230;let&#8217;s dive into some interesting links from this week.</strong></em></p><div><hr></div><h2><strong>Editor's Picks<br></strong></h2><ul><li><p><strong><a href="https://arxiv.org/abs/2604.26268">The Difference Between &#8220;Replicable&#8221; and &#8220;Not replicable&#8221; is not Itself Scientifically Replicable</a><br></strong>Replication studies estimate the replicability rate of scientific results by aggregating binary verdicts of experiments. Exact replications are rarely attainable, so most replication sequences are non-exact. Experiments differ in ways that matter and do not share a single data-generating process. We formalize two statistical interpretations of non-exactness. In a shared latent rate (benchmark) model, experiments are exchangeable and depend on a common random replicability rate. In a conditionally independent rates (operational) model, each experiment has its own replicability rate drawn from a population distribution&#8230;&#8230;&#8230;The replication crisis, if there is one, cannot be established by the methods used to declare it&#8230;.</p></li></ul><ul><li><p><strong><a href="https://lemire.me/blog/2026/04/27/you-can-beat-the-binary-search/">You can beat the binary search</a></strong><br>Binary search is a classic algorithm that efficiently locates a target value in a sorted array by repeatedly dividing the search interval in half&#8230;In C++, this is implemented by the <code>std::binary_search</code> function, which returns a boolean indicating whether the value is present&#8230;The popular Roaring Bitmap format uses arrays of 16-bit integers of size ranging from 1 to 4096. We sometimes have to check whether a value is present. We use a binary search&#8230;I wanted a faster approach. I had two insights&#8230;Virtually all processors today have data parallel instructions (sometimes called SIMD) that can check several values at once&#8230;The binary search checks one value at a time. However, recent processors can load and check more than one value at once&#8230;Thus, I created something I call the SIMD Quad algorithm. It is an efficient search algorithm for sorted arrays of 16-bit unsigned integers, combining a quaternary interpolation search with SIMD (Single Instruction, Multiple Data)&#8230;</p><p></p></li><li><p><strong><a href="https://www.youtube.com/watch?v=sxX8BMscce0">Principles for Autonomous System Design: OpenClaw Deep Dive</a></strong><br>In this talk, Alex Krentsel (UC Berkeley, NetSys Lab / Google Research) does a deep-dive into OpenClaw &#8212; a fully open-source autonomous AI agent system &#8212; and uses it as a lens to explore the emerging design principles behind truly autonomous agents. We&#8217;re in Phase 3 of the AI evolution: LLM + tool-use + dynamic tool discovery. The agents that exist today aren&#8217;t chatbots. They read your email, write code, schedule work, remember context across sessions, and spawn other agents. This talk breaks down exactly how that works&#8230;.</p></li></ul><div><hr></div><h1><strong>What&#8217;s on your mind</strong></h1><h2>This Week&#8217;s Poll:</h2><div class="poll-embed" data-attrs="{&quot;id&quot;:504914}" data-component-name="PollToDOM"></div><p>.</p><h2>Last Week&#8217;s Poll:</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!nTV4!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93db8bd7-89d2-41e1-9018-6b1f622271c9_1138x754.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!nTV4!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93db8bd7-89d2-41e1-9018-6b1f622271c9_1138x754.png 424w, https://substackcdn.com/image/fetch/$s_!nTV4!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93db8bd7-89d2-41e1-9018-6b1f622271c9_1138x754.png 848w, https://substackcdn.com/image/fetch/$s_!nTV4!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93db8bd7-89d2-41e1-9018-6b1f622271c9_1138x754.png 1272w, https://substackcdn.com/image/fetch/$s_!nTV4!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93db8bd7-89d2-41e1-9018-6b1f622271c9_1138x754.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!nTV4!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93db8bd7-89d2-41e1-9018-6b1f622271c9_1138x754.png" width="590" height="390.9138840070299" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/93db8bd7-89d2-41e1-9018-6b1f622271c9_1138x754.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:754,&quot;width&quot;:1138,&quot;resizeWidth&quot;:590,&quot;bytes&quot;:99059,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://datascienceweekly.substack.com/i/196043785?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93db8bd7-89d2-41e1-9018-6b1f622271c9_1138x754.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!nTV4!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93db8bd7-89d2-41e1-9018-6b1f622271c9_1138x754.png 424w, https://substackcdn.com/image/fetch/$s_!nTV4!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93db8bd7-89d2-41e1-9018-6b1f622271c9_1138x754.png 848w, https://substackcdn.com/image/fetch/$s_!nTV4!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93db8bd7-89d2-41e1-9018-6b1f622271c9_1138x754.png 1272w, https://substackcdn.com/image/fetch/$s_!nTV4!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93db8bd7-89d2-41e1-9018-6b1f622271c9_1138x754.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>.</p><div><hr></div><h2>Data Science Articles &amp; Videos</h2><p></p><ul><li><p><strong><a href="https://www.mdpi.com/1424-8220/22/5/1885">Linear Regression vs. Deep Learning: A Simple Yet Effective Baseline for Human Body Measurement</a></strong><br>We propose a linear regression model for the estimation of human body measurements. The input to the model only consists of the information that a person can self-estimate, such as height and weight. We evaluate our model against the state-of-the-art approaches for body measurement from point clouds and images, demonstrate the comparable performance with the best methods, and even outperform several deep learning models on public datasets. The simplicity of the proposed regression model makes it perfectly suitable as a baseline in addition to the convenience for applications such as the virtual try-on. To improve the repeatability of the results of our baseline and the competing methods, we provide guidelines toward standardized body measurement estimation&#8230;<br></p></li><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1srp178/warning_dont_get_gptbrained/?utm_source=share&amp;utm_medium=mweb3x&amp;utm_name=mweb3xcss&amp;utm_term=1&amp;utm_content=share_button">Warning: Don&#8217;t get GPT-brained [Reddit]</a></strong></p><p>At my last role we had to move fast, so we relied on an LLM to help with a lot of the thinking and coding for us so we could focus on the business use case and managing meetings and stakeholders. The role was heavy on project management as well as development, research, and deployment so basically doing everything While I got good at scoping projects and managing them, my technical skills totally deteriorated in less than 1 year. It&#8217;s scary going back to problems I know I can solve and but have some brain fog when getting to the answer. If I could have gone slower, had more time to thinking about modeling/coding than I probably wouldn&#8217;t feel like this Don&#8217;t get GPT brained. You&#8217;ll have to crawl out of that pit eventually. Like technical debt but for your brain&#8230;</p><p></p></li><li><p><strong><a href="https://arxiv.org/abs/2604.21691">There Will Be a Scientific Theory of Deep Learning</a><br></strong>In this paper, we make the case that a scientific theory of deep learning is emerging. By this we mean a theory which characterizes important properties and statistics of the training process, hidden representations, final weights, and performance of neural networks. We pull together major strands of ongoing research in deep learning theory and identify five growing bodies of work that point toward such a theory: (a) solvable idealized settings that provide intuition for learning dynamics in realistic systems; (b) tractable limits that reveal insights into fundamental learning phenomena; (c) simple mathematical laws that capture important macroscopic observables; (d) theories of hyperparameters that disentangle them from the rest of the training process, leaving simpler systems behind; and (e) universal behaviors shared across systems and settings which clarify which phenomena call for explanation&#8230;<br></p></li><li><p><strong><a href="https://arxiv.org/abs/2509.09892">What do the fundamental constants of physics tell us about life?</a><br></strong>In the 1970s, the renowned physicist Victor Weisskopf famously developed a research program to qualitatively explain properties of matter in terms of the fundamental constants of physics. But there was one type of matter prominently missing from Weisskopf&#8217;s analysis: life. Here, we develop Weisskopf-style arguments demonstrating how the fundamental constants of physics can be used to understand the properties of living systems. By combining biophysical arguments and dimensional analysis, we show that vital properties of chemical self-replicators, such as growth yield, minimum doubling time, and minimum power consumption in dormancy, can be quantitatively estimated using fundamental physical constants. The calculations highlight how the laws of physics constrain chemistry-based life on Earth, and if it exists, elsewhere in our universe&#8230;<br></p></li><li><p><strong><a href="https://github.com/entropich3atdeath/gpr-thermodynamic-hardware/blob/main/GPR_ThermodynamicHardware_v1.ipynb">Gaussian Process Regression (GPR) &amp; Physics-driven Computing</a></strong><br>Gaussian Process Regression (GPR) is a non-parametric, Bayesian approach to regression. Unlike parametric models (like linear regression) where we find a distribution over parameters, a Gaussian Process defines a prior <strong>distribution over functions</strong>&#8230;<br></p></li><li><p><strong><a href="https://opendatastructures.org/">Open Data Structures - An open content textbook</a></strong><br><em>Open Data Structures</em> covers the implementation and analysis of data structures for sequences (lists), queues, priority queues, unordered dictionaries, ordered dictionaries, and graphs&#8230;Data structures presented in the book include stacks, queues, deques, and lists implemented as arrays and linked-lists; space-efficient implementations of lists; skip lists; hash tables and hash codes; binary search trees including treaps, scapegoat trees, and red-black trees; integer searching structures including binary tries, x-fast tries, and y-fast tries; heaps, including implicit binary heaps and randomized meldable heaps; graphs, including adjacency matrix and ajacency list representations; and B-trees&#8230;<code><br></code></p></li><li><p><strong><a href="https://stormatics.tech/blogs/postgresql-is-not-slow-your-queries-are">PostgreSQL is Not Slow. Your Queries Are.</a><br></strong>A field guide to the seven things that are actually making our database feel slow and how to stop blaming the wrong suspect&#8230;Culprit #1: The Missing Index&#8230;Culprit #2: The N+1 Query, Death by a Thousand Cuts&#8230;Culprit #3: Stale Statistics, The Planner Is Flying Blind&#8230;Culprit #4: The Query That Runs Fine, Alone&#8230;Culprit #5: EXPLAIN ANALYZE Exists, Use It&#8230;Culprit #6: Connection Exhaustion, PostgreSQL is Full&#8230;Culprit #7: Reporting Queries Running on Production&#8230;<br></p></li><li><p><strong><a href="https://globalresearchspace.com/space#7.02/-4.771/61.204/-52.6/30">An interactive semantic map of the latest 10 million published papers</a></strong><br>I built a map to help navigate the complex scientific landscape through spatial exploration. How it works: Sourced the latest 10M papers from OpenAlex and generated embeddings using SPECTER 2 on titles and abstracts. Reduced dimensionality with UMAP, then applied Voronoi partitioning on density peaks to create distinct semantic neighborhoods. The floating topic labels are generated via custom labelling algorithms (definitely still a work in progress!). There is also support for both keyword and semantic queries, and there&#8217;s an analytics layer for ranking institutions, authors, and topics etc&#8230;<br></p></li><li><p><strong><a href="https://perthirtysix.com/how-the-heck-does-shazam-work">How The Heck Does Shazam Work?</a></strong></p><p>How audio fingerprinting and a connect-the-dots trick lets Shazam identify a song in seconds&#8230;By throwing away almost everything and keeping only a handful of landmark peaks, a noisy 5-second clip from a coffee shop becomes a set of coordinates precise enough to pinpoint one song out of millions. Recognition, it turns out, is mostly an exercise in ignoring the right things&#8230;<br></p></li><li><p><strong><a href="https://rtichoke.netlify.app/posts/generating-correlated-random-numbers.html">Generating Correlated Random Numbers in R Using Matrix Methods</a></strong><br>Generating random data with a specific correlation structure is a common need in statistical simulation. In this post, let&#8217;s walk through how to do it in R using matrix decomposition methods&#8230;<br></p></li><li><p><strong><a href="https://jcarroll.com.au/2026/04/17/schotter-plots-in-r/">Schotter Plots in R</a></strong></p><p>Translating things between languages reveals how each language approaches different design trade-offs, and I believe it&#8217;s a useful exercise. Having something to translate is the first step. I found a plot I wanted to generate (Georg Nees&#8217; &#8220;Schotter&#8221; computer-generated art from 1968 which shows a grid of squares which get increasingly displaced in position and rotation), and some code that reproduced it, so off we go!&#8230;<br></p></li><li><p><strong><a href="https://mfatihtuzen.github.io/posts/2026-04-16_timeseries_stationary/">Why Most Time Series Models Fail Before They Start</a><br></strong>A practical look at stationarity and transformations with real CPI data in R&#8230;Many time series models fail before they even begin. Not because the software crashes. Not because the code is wrong. But because the data entering the model violate one of the most important assumptions in time series analysis: stationarity&#8230;The goal is simple: show why raw time series levels often mislead us, what stationarity really means, and why transformations such as differencing and log-differencing are not cosmetic tricks but conceptual necessities&#8230;<br></p></li><li><p><strong><a href="https://kieranhealy.org/blog/archives/2026/04/25/hourly-subway-station-flows/">Hourly Subway Station Flows</a><br></strong>Pie charts are bad, as any fule kno. We&#8217;re not as good at judging relative differences between angles and areas as we are at judging relative differences in lengths on a common baseline. This is especially true when we have more than two things to compare at the same time. So, as a rule, you shouldn&#8217;t use them. You should figure out some other way of viewing your data instead. On the other hand, I just made 424 animated pie charts because if you&#8217;re going to break a rule you should break it good and hard&#8230;</p></li></ul><p>.</p><div><hr></div><h2>Last Week's Newsletter's 3 Most Clicked Links</h2><ul><li><p><strong><a href="https://science.nasa.gov/specials/your-name-in-landsat/">Your Name in Landsat &#128752;&#65039;</a></strong></p></li><li><p><strong><a href="https://www.reddit.com/r/analytics/comments/1sqwb5l/ceo_cancels_bi_tooling_replaces_it_with_ai_breaks/">CEO cancels BI tooling, replaces it with AI, breaks everything [Reddit]</a></strong></p></li><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1srxbjb/anyone_else_paranoid_using_ai_for_analysis/">Anyone else paranoid using AI for analysis? [Reddit]</a></strong></p></li></ul><p>.<br>* Based on unique clicks.<br>** Please take a look at last week's issue #648 <a href="https://datascienceweekly.substack.com/p/data-science-weekly-issue-648">here</a>.</p><div><hr></div><h2>Cutting Room Floor</h2><ul><li><p><strong><a href="https://perthirtysix.com/how-the-heck-does-gps-work">How The Heck Does GPS Work?</a></strong></p></li><li><p><strong><a href="https://www.dbos.dev/blog/benchmarking-workflow-execution-scalability-on-postgres">Does Postgres Scale?</a></strong></p></li><li><p><strong><a href="https://www.reddit.com/r/MachineLearning/comments/1sx3p40/how_do_you_test_ai_agents_in_production_the/">How do you test AI agents in production? The unpredictability is overwhelming. [Reddit]</a></strong></p></li><li><p><strong><a href="https://flovv.github.io/loyalty-programs-revisited/">Do Loyalty Programs Actually Create Loyalty?</a></strong></p></li><li><p><strong><a href="https://guillaumepressiat.github.io/blog/2026/04/logrittr-re">logrittr: A Verbose Pipe Operator for Logging dplyr Pipelines</a></strong></p></li><li><p><strong><a href="https://redwallanalytics.com/posts/2026-04-19-a-data-driven-survey-of-mlb-franchise-management/">A Data-Driven Survey of MLB Franchise Management - A search for factors leading to playoff success</a></strong></p></li></ul><p>.</p><div><hr></div><h2><strong>Whenever you're ready, 3 ways we can help:</strong><br></h2><ol><li><p><strong>Go deeper each week (paid subscription)</strong><br>Get 3 additional posts per week designed to help you:</p><ul><li><p>Statistics &#8594; understand the math behind ML</p></li><li><p>AI Agents &#8594; build with modern AI tools</p></li><li><p>Career &#8594; become more valuable at your job</p></li></ul><p><strong>&#128073; <a href="https://datascienceweekly.substack.com/subscribe">Upgrade for $10/month &#8212; cancel anytime</a><br></strong></p></li><li><p><strong>Looking to get a job?</strong><br>A practical guide to landing your first (or next) data science role, based on thousands of reader questions.<br><strong>&#128073; <a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">Check out our </a></strong><em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">&#8220;Get A Data Science Job&#8221;</a></strong></em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide"> Course</a></strong><br></p></li><li><p><strong>Promote your organization/project/event to ~68,500 subscribers<br></strong>Sponsor this newsletter and reach a highly engaged data science audience (30&#8211;35% open rate).<br><strong>&#128073; Reply to this email to learn more</strong></p></li></ol><div><hr></div><p>Thank you for joining us this week! :)</p><p>Stay Data Science-y!</p><p>All our best,<br>Hannah &amp; Sebastian</p><div><hr></div><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://datascienceweekly.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Data Science Weekly Newsletter is a reader-supported publication. To receive new posts and support our work, consider becoming a free or paid subscriber.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div>]]></content:encoded></item><item><title><![CDATA[Data Science Weekly - Issue 648]]></title><description><![CDATA[Curated news, articles and jobs related to Data Science, AI, & Machine Learning]]></description><link>https://datascienceweekly.substack.com/p/data-science-weekly-issue-648</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/data-science-weekly-issue-648</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Thu, 23 Apr 2026 21:31:23 GMT</pubDate><enclosure url="https://substack-post-media.s3.amazonaws.com/public/images/628f5d89-aae7-48fb-9d15-5ea67f42821f_250x250.gif" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!byfl!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" width="319" height="253" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/17becea5-db12-4465-be92-858de78b9137_319x253.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:253,&quot;width&quot;:319,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;Data Science Weekly&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="Data Science Weekly" title="Data Science Weekly" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2><strong>Issue #648<br>April 23, 2026<br></strong></h2><div><hr></div><p>Hello!</p><p><strong>Once a week, we write this email to share the links we thought were worth sharing in the Data Science, ML, AI, Data Visualization, and ML/Data Engineering worlds.</strong></p><div><hr></div><h6><strong>Sponsor Message</strong></h6><h1><strong><a href="https://duo.online.drexel.edu/ms-in-data-science/?campaign=201146&amp;ccid=201146&amp;utm_source=Sebastian+Guitierrez&amp;utm_medium=newsletter&amp;utm_content=MS+Data+Science&amp;utm_campaign=201146">Online Data Science Programs from Drexel University</a></strong></h1><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://duo.online.drexel.edu/ms-in-data-science/?campaign=201146&amp;ccid=201146&amp;utm_source=Sebastian+Guitierrez&amp;utm_medium=newsletter&amp;utm_content=MS+Data+Science&amp;utm_campaign=201146" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!-o3G!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif 424w, https://substackcdn.com/image/fetch/$s_!-o3G!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif 848w, https://substackcdn.com/image/fetch/$s_!-o3G!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif 1272w, https://substackcdn.com/image/fetch/$s_!-o3G!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!-o3G!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif" width="250" height="250" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:250,&quot;width&quot;:250,&quot;resizeWidth&quot;:250,&quot;bytes&quot;:14392,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/gif&quot;,&quot;href&quot;:&quot;https://duo.online.drexel.edu/ms-in-data-science/?campaign=201146&amp;ccid=201146&amp;utm_source=Sebastian+Guitierrez&amp;utm_medium=newsletter&amp;utm_content=MS+Data+Science&amp;utm_campaign=201146&quot;,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://datascienceweekly.substack.com/i/176125667?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!-o3G!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif 424w, https://substackcdn.com/image/fetch/$s_!-o3G!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif 848w, https://substackcdn.com/image/fetch/$s_!-o3G!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif 1272w, https://substackcdn.com/image/fetch/$s_!-o3G!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif 1456w" sizes="100vw"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Find your algorithm for success with an <strong><a href="https://duo.online.drexel.edu/ms-in-data-science/?campaign=201146&amp;ccid=201146&amp;utm_source=Sebastian+Guitierrez&amp;utm_medium=newsletter&amp;utm_content=MS+Data+Science&amp;utm_campaign=201146">online data science degree</a></strong> from Drexel University. Gain essential skills in tool creation and development, data and text mining, trend identification, and data manipulation and summarization by using leading industry technology to apply to your career. <strong><a href="https://duo.online.drexel.edu/ms-in-data-science/?campaign=201146&amp;ccid=201146&amp;utm_source=Sebastian+Guitierrez&amp;utm_medium=newsletter&amp;utm_content=MS+Data+Science&amp;utm_campaign=201146">Learn more</a></strong>.</p><p>.</p><p><em>* Want to sponsor the newsletter? Email us for details --&gt; <a href="mailto:team@datascienceweekly.org">team@datascienceweekly.org</a></em></p><div><hr></div><p><em><strong>And now&#8230;let&#8217;s dive into some interesting links from this week.</strong></em></p><div><hr></div><h2><strong>Editor's Picks<br></strong></h2><ul><li><p><strong><a href="https://science.nasa.gov/specials/your-name-in-landsat/">Your Name in Landsat &#128752;&#65039;</a><br></strong>Type your name and see it spelled out in stunning Landsat satellite imagery. Explore Earth from space, letter by letter, with NASA and USGS Landsat images&#8230;</p></li></ul><ul><li><p><strong><a href="https://blog.nilenso.com/blog/2026/04/20/trajectory-shapes/">Trajectory shapes</a></strong><br>Why are we managing our coding agents based on vibes instead of their actual work habits?&#8230;I analyzed the latest SWE-Bench Pro trajectories I could find: runs from October 2025 for Sonnet 4.5 and GPT-5, 730 task trajectories per model. I deterministically classified each step into activities like understand, edit, verify, and cleanup using only tool calls, literal command/filename matches, and regex heuristics, and then computed their share over time. This &#8220;trajectory shape&#8221; chart I got as a result is very interesting!&#8230;If I were to condense the above to &#8220;vibes&#8221;, I might say &#8220;<em>Claude starts editing early and figures it out in the loop. GPT reads first, then goes for the one-shot</em>.&#8221; That is also close to what people on my timeline were saying when these runs were current. For example&#8230;</p><p></p></li><li><p><strong><a href="https://vickiboykis.com/2026/04/20/build-yourself-flowers/">Build yourself flowers</a></strong><br>This is an edited transcript of the keynote I gave at the Applied Machine Learning Conference in Charlottesville, VA in April 2026&#8230;I&#8217;m Vicki, and I build machine learning systems&#8230;I debated for a long time how to introduce myself. Am I a data scientist? Am I still a machine learning engineer? Am I an AI engineer now? I&#8217;m not really sure. I think, like a lot of people over the past six months in the industry, I&#8217;ve been having existential angst. So, I&#8217;ll go with &#8220;I build machine learning systems.&#8221;...The larger question behind my existential angst is, what is the state of machine learning engineering as an industry today? That is - is it still worth doing machine learning engineering?&#8230;And the second question that came to me was, not only is it still worth doing ML, but, in an era where we&#8217;re having LLMs generate a lot of code, when the most important thing is for us to ship quickly, to get to a prototype quickly, is it still worth doing machine learning well?&#8230;the same question of, in a world where it&#8217;s easy and fast to write code, why is technical excellence still important?&#8230;</p></li></ul><div><hr></div><h1><strong>What&#8217;s on your mind</strong></h1><h2>This Week&#8217;s Poll:</h2><div class="poll-embed" data-attrs="{&quot;id&quot;:500823}" data-component-name="PollToDOM"></div><p>.</p><h2>Last Week&#8217;s Poll:</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!imfz!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ee8cf68-f6b3-4ff5-b080-7c552bab482f_1144x648.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!imfz!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ee8cf68-f6b3-4ff5-b080-7c552bab482f_1144x648.png 424w, https://substackcdn.com/image/fetch/$s_!imfz!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ee8cf68-f6b3-4ff5-b080-7c552bab482f_1144x648.png 848w, https://substackcdn.com/image/fetch/$s_!imfz!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ee8cf68-f6b3-4ff5-b080-7c552bab482f_1144x648.png 1272w, https://substackcdn.com/image/fetch/$s_!imfz!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ee8cf68-f6b3-4ff5-b080-7c552bab482f_1144x648.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!imfz!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ee8cf68-f6b3-4ff5-b080-7c552bab482f_1144x648.png" width="600" height="339.86013986013984" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/8ee8cf68-f6b3-4ff5-b080-7c552bab482f_1144x648.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:648,&quot;width&quot;:1144,&quot;resizeWidth&quot;:600,&quot;bytes&quot;:73588,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://datascienceweekly.substack.com/i/195279766?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ee8cf68-f6b3-4ff5-b080-7c552bab482f_1144x648.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!imfz!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ee8cf68-f6b3-4ff5-b080-7c552bab482f_1144x648.png 424w, https://substackcdn.com/image/fetch/$s_!imfz!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ee8cf68-f6b3-4ff5-b080-7c552bab482f_1144x648.png 848w, https://substackcdn.com/image/fetch/$s_!imfz!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ee8cf68-f6b3-4ff5-b080-7c552bab482f_1144x648.png 1272w, https://substackcdn.com/image/fetch/$s_!imfz!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ee8cf68-f6b3-4ff5-b080-7c552bab482f_1144x648.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>.</p><div><hr></div><h2>Data Science Articles &amp; Videos</h2><p></p><ul><li><p><strong><a href="https://buttondown.com/jaffray/archive/columnar-storage-is-normalization/">Columnar Storage is Normalization</a></strong><br>Something I didn&#8217;t understand for a while is that the process of turning row-oriented data into column-oriented data isn&#8217;t a totally bespoke, foreign concept in the realm of databases. It&#8217;s still of the relational abstraction. Or can be. As an example, say we have this data&#8230;<br></p></li><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1srxbjb/anyone_else_paranoid_using_ai_for_analysis/">Anyone else paranoid using AI for analysis? [Reddit]</a></strong></p><p>With the LLM in the loop, I touch the data less, and I catch less.</p><ol><li><p>Do you also feel one step removed from the data compared to before these tools existed?</p></li><li><p>What are you doing to safeguard and double-check AI-assisted analysis?</p></li><li><p>Has AI-assisted analysis ever caused you to ship a wrong number to a stakeholder? What happened?&#8230;</p></li></ol><p></p></li><li><p><strong><a href="https://web.stanford.edu/~bvr/pubs/TS_Tutorial.pdf">A Tutorial on Thompson Sampling</a><br></strong>Thompson sampling is an algorithm for online decision problems where actions are taken sequentially in a manner that must balance between exploiting what is known to maximize immediate performance and investing to accumulate new information that may improve future performance. The algorithm addresses a broad range of problems in a computationally efficient manner and is therefore enjoying wide use. This tutorial covers the algorithm and its application, illustrating concepts through a range of examples, including Bernoulli bandit problems, shortest path problems, product recommendation, assortment, active learning with neural networks, and reinforcement learning in Markov decision processes&#8230;<br></p></li><li><p><strong><a href="https://www.emberdione.com/on-rejection-and-competition/">On Rejection and Competition</a><br></strong>This blog post will cover two topics. First, how to deal with the emotional feeling of being rejected for a role. Second, a re-framing and discussion of how to feel about the person who did get the role&#8230;<br></p></li><li><p><strong><a href="https://link.springer.com/article/10.1186/s13041-020-0552-2">No raw data, no science: another possible source of the reproducibility crisis</a></strong><br>As an Editor-in-Chief of <em>Molecular Brain</em>, I have handled 180 manuscripts since early 2017 and have made 41 editorial decisions categorized as &#8220;Revise before review,&#8221; requesting that the authors provide raw data. Surprisingly, among those 41 manuscripts, 21 were withdrawn without providing raw data, indicating that requiring raw data drove away more than half of the manuscripts&#8230;<br></p></li><li><p><strong><a href="https://iclr-blogposts.github.io/2026/blog/2026/mdp-to-gcmdp/">Learning to Maximize Rewards via Reaching Goals</a></strong><br>Goal-conditioned reinforcement learning learns to reach goals instead of optimizing hand-crafted rewards. Despite its popularity, the community often categorizes goal-conditioned reinforcement learning as a special case of reinforcement learning. In this post, we aim to build a direct conversion from any reward-maximization reinforcement learning problem to a goal-conditioned reinforcement learning problem, and to draw connections with the stochastic shortest path framework. Our conversion provides a new perspective on the reinforcement learning problem: <em>maximizing rewards is equivalent to reaching some goals</em>&#8230;.<code><br></code></p></li><li><p><strong><a href="https://quantixed.org/2026/04/06/marathon-man-how-to-pace-a-marathon/">Marathon Man: how to pace a marathon</a><br></strong>Let&#8217;s take a look at a big dataset of marathon times &#8211; we&#8217;ll use the New York City Marathon from 2025 &#8211; to see if we can understand how to pace a marathon. There&#8217;s an available dataset of chip times (meaning we don&#8217;t have to worry about dodgy GPS data) and the course has similar first and second half profiles, allowing us to use these times to understand negative/even/positive splitting. Let&#8217;s dive in&#8230;.<br></p></li><li><p><strong><a href="https://www.jumpingrivers.com/blog/teaching-r-packages-reporting-gitlab/">Using R to Teach R: Lessons for Software Development</a></strong><br>If you have read our blogs previously then you will be aware that Jumping Rivers is a consultancy and training provider in all things data science. But did you know that we offer over 50 different courses spanning R, Python, Git, SQL and more?&#8230;In this blog we will provide a glimpse into our internal process and share how we have streamlined the task of maintaining so many courses. Along the way we will share some good practices applicable to any big coding project, including packaging of source code and automated CI/CD&#8230;<br></p></li><li><p><strong><a href="https://rtichoke.netlify.app/posts/ml-frameworks-in-r.html">Machine Learning Frameworks in R</a></strong></p><p>R&#8217;s ecosystem offers a rich selection of machine learning frameworks, each with distinct design philosophies and strengths. This post is a side-by-side comparison of five ML frameworks in R that provide unified interfaces over multiple algorithms, with runnable code examples on the same dataset so you can compare APIs directly. The focus is on packages that let you swap algorithms without rewriting your code&#8230;<br></p></li><li><p><strong><a href="https://medium.com/quantumblack/creating-a-future-proof-enterprise-agentic-platform-architecture-c21fc48406a5">Creating a future-proof enterprise agentic platform architecture</a></strong><br>A difficult (though familiar) set of questions:</p><ul><li><p>How do we capture short-term impact without creating waste or long-term technical debt?</p></li><li><p>What architecture best supports a mesh of AI agents and traditional, deterministic capabilities across workflows?</p></li><li><p>Which services and capabilities do we need to build now to support what we&#8217;ll need in two years?</p></li><li><p>Is it even worth building today when a viable market solution may exist in a couple of years?</p></li><li><p>How do we balance speed with control, and set standards for security, traceability, and observability in an agentic system that&#8217;s non-deterministic?</p></li></ul><p>There are no universal answers to these questions yet. But through our work with three financial institutions deploying agentic systems at scale, we have developed a set of practical approaches that define what matters most, where teams risk over-investment, and what tends to be harder than expected&#8230;<br></p></li><li><p><strong><a href="https://arxiv.org/abs/2412.02670">The Broader Landscape of Robustness in Algorithmic Statistics</a></strong></p><p>The last decade has seen a number of advances in computationally efficient algorithms for statistical methods subject to robustness constraints. An estimator may be robust in a number of different ways: to contamination of the dataset, to heavy-tailed data, or in the sense that it preserves privacy of the dataset. We survey recent results in these areas with a focus on the problem of mean estimation, drawing technical and conceptual connections between the various forms of robustness, showing that the same underlying algorithmic ideas lead to computationally efficient estimators in all these settings&#8230;<br></p></li><li><p><strong><a href="https://www.reddit.com/r/analytics/comments/1sqwb5l/ceo_cancels_bi_tooling_replaces_it_with_ai_breaks/">CEO cancels BI tooling, replaces it with AI, breaks everything [Reddit]</a><br></strong>This happen with a client a coupla months ago. they had their dashboards in metabase, he cancelled &gt; handed the team claude &gt; &#8220;dashboards are a waste and just go and ask ai&#8221;. as you can guess he then called me saying he thinks he broke sth&#8230;.heard almost the same story from another data consultant last week. different company, same swap, same outcome is this becoming a pattern or if we just both got unlucky clients?&#8230;<br></p></li><li><p><strong><a href="https://ajitem.com/blog/iron-core-part-2-six-characters/">Six Characters</a><br></strong>What the PNR locator on your boarding pass actually contains, and why the fare calculation line on your e-ticket is written in a currency that does not exist&#8230;</p></li></ul><p>.</p><div><hr></div><h2>Last Week's Newsletter's 3 Most Clicked Links</h2><ul><li><p><strong><a href="https://valuedrivendatascience.com/101">Why Traditional Statistics Still Matters in the Age of AI</a></strong></p></li><li><p><strong><a href="https://www.reddit.com/r/dataanalysis/comments/1s9i98m/what_is_a_data_analysis_mistake_you_made_early_in/">What is a data analysis mistake you made early in your career that you will never make again? [Reddit]</a></strong></p></li><li><p><strong><a href="https://timzaman.com/getting-into-ai-infra">Getting Into AI Infra</a></strong></p></li></ul><p>.<br>* Based on unique clicks.<br>** Please take a look at last week's issue #647 <a href="https://datascienceweekly.substack.com/p/data-science-weekly-issue-647">here</a>.</p><div><hr></div><h2>Cutting Room Floor</h2><ul><li><p><strong><a href="https://blog.janestreet.com/can-you-reverse-engineer-our-neural-network/">Can you reverse engineer our (Jane Street) neural network?</a></strong></p></li><li><p><strong><a href="https://www.argmin.net/p/engineering-architecture-a-syllabus">Engineering Architecture: A Syllabus?</a></strong></p></li><li><p><strong><a href="https://flovv.github.io/test-and-roll-profit-maximizing-ab-tests/">Test &amp; Roll: Why Smaller A/B Tests Can Make More Money</a></strong></p></li><li><p><strong><a href="https://andymatuschak.org/tat/">Apps and programming: two accidental tyrannies</a></strong></p></li><li><p><strong><a href="https://lattice.project89.org/">The Living Lattice - Explorables of the intelligence theorem.</a></strong></p></li><li><p><strong><a href="https://github.com/google/skills">Agent Skills for Google products and technologies, including Google Cloud.</a></strong></p></li></ul><p>.</p><div><hr></div><h2><strong>Whenever you're ready, 3 ways we can help:</strong><br></h2><ol><li><p><strong>Go deeper each week (paid subscription)</strong><br>Get 3 additional posts per week designed to help you:</p><ul><li><p>Statistics &#8594; understand the math behind ML</p></li><li><p>AI Agents &#8594; build with modern AI tools</p></li><li><p>Career &#8594; become more valuable at your job</p></li></ul><p><strong>&#128073; <a href="https://datascienceweekly.substack.com/subscribe">Upgrade for $10/month &#8212; cancel anytime</a><br></strong></p></li><li><p><strong>Looking to get a job?</strong><br>A practical guide to landing your first (or next) data science role, based on thousands of reader questions.<br><strong>&#128073; <a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">Check out our </a></strong><em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">&#8220;Get A Data Science Job&#8221;</a></strong></em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide"> Course</a></strong><br></p></li><li><p><strong>Promote your organization/project/event to ~68,500 subscribers<br></strong>Sponsor this newsletter and reach a highly engaged data science audience (30&#8211;35% open rate).<br><strong>&#128073; Reply to this email to learn more</strong></p></li></ol><div><hr></div><p>Thank you for joining us this week! :)</p><p>Stay Data Science-y!</p><p>All our best,<br>Hannah &amp; Sebastian</p><div><hr></div><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://datascienceweekly.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Data Science Weekly Newsletter is a reader-supported publication. To receive new posts and support our work, consider becoming a free or paid subscriber.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div>]]></content:encoded></item><item><title><![CDATA[Data Science Weekly - Issue 647]]></title><description><![CDATA[Curated news, articles and jobs related to Data Science, AI, & Machine Learning]]></description><link>https://datascienceweekly.substack.com/p/data-science-weekly-issue-647</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/data-science-weekly-issue-647</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Thu, 16 Apr 2026 21:47:59 GMT</pubDate><enclosure url="https://substack-post-media.s3.amazonaws.com/public/images/68e3b6c2-c216-4c4c-9628-96fb4fd7154a_250x250.gif" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!byfl!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" width="319" height="253" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/17becea5-db12-4465-be92-858de78b9137_319x253.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:253,&quot;width&quot;:319,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;Data Science Weekly&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="Data Science Weekly" title="Data Science Weekly" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2><strong>Issue #647<br>April 16, 2026<br></strong></h2><div><hr></div><p>Hello!</p><p><strong>Once a week, we write this email to share the links we thought were worth sharing in the Data Science, ML, AI, Data Visualization, and ML/Data Engineering worlds.</strong></p><div><hr></div><h6><strong>Sponsor Message</strong></h6><h1><strong><a href="https://duo.online.drexel.edu/ms-in-data-science/?campaign=201146&amp;ccid=201146&amp;utm_source=Sebastian+Guitierrez&amp;utm_medium=newsletter&amp;utm_content=MS+Data+Science&amp;utm_campaign=201146">Online Data Science Programs from Drexel University</a></strong></h1><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://duo.online.drexel.edu/ms-in-data-science/?campaign=201146&amp;ccid=201146&amp;utm_source=Sebastian+Guitierrez&amp;utm_medium=newsletter&amp;utm_content=MS+Data+Science&amp;utm_campaign=201146" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!-o3G!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif 424w, https://substackcdn.com/image/fetch/$s_!-o3G!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif 848w, https://substackcdn.com/image/fetch/$s_!-o3G!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif 1272w, https://substackcdn.com/image/fetch/$s_!-o3G!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!-o3G!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif" width="250" height="250" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:250,&quot;width&quot;:250,&quot;resizeWidth&quot;:250,&quot;bytes&quot;:14392,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/gif&quot;,&quot;href&quot;:&quot;https://duo.online.drexel.edu/ms-in-data-science/?campaign=201146&amp;ccid=201146&amp;utm_source=Sebastian+Guitierrez&amp;utm_medium=newsletter&amp;utm_content=MS+Data+Science&amp;utm_campaign=201146&quot;,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://datascienceweekly.substack.com/i/176125667?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!-o3G!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif 424w, https://substackcdn.com/image/fetch/$s_!-o3G!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif 848w, https://substackcdn.com/image/fetch/$s_!-o3G!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif 1272w, https://substackcdn.com/image/fetch/$s_!-o3G!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef4cda8a-27b8-482e-a948-4c5f22a8a591_250x250.gif 1456w" sizes="100vw"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Find your algorithm for success with an <strong><a href="https://duo.online.drexel.edu/ms-in-data-science/?campaign=201146&amp;ccid=201146&amp;utm_source=Sebastian+Guitierrez&amp;utm_medium=newsletter&amp;utm_content=MS+Data+Science&amp;utm_campaign=201146">online data science degree</a></strong> from Drexel University. Gain essential skills in tool creation and development, data and text mining, trend identification, and data manipulation and summarization by using leading industry technology to apply to your career. <strong><a href="https://duo.online.drexel.edu/ms-in-data-science/?campaign=201146&amp;ccid=201146&amp;utm_source=Sebastian+Guitierrez&amp;utm_medium=newsletter&amp;utm_content=MS+Data+Science&amp;utm_campaign=201146">Learn more</a></strong>.</p><p>.</p><p><em>* Want to sponsor the newsletter? Email us for details --&gt; <a href="mailto:team@datascienceweekly.org">team@datascienceweekly.org</a></em></p><div><hr></div><p><em><strong>And now&#8230;let&#8217;s dive into some interesting links from this week.</strong></em></p><div><hr></div><h2><strong>Editor's Picks<br></strong></h2><ul><li><p><strong><a href="https://arxiv.org/abs/2602.14487">Estimating &#960; with a Coin</a><br></strong>We describe a simple Monte Carlo method for estimating &#960; by tossing a coin. Although the underlying Catalan-number series identities appear implicitly in the probability theory literature, the interpretation of &#960;/4 presented here seems to be new&#8230;</p></li></ul><ul><li><p><strong><a href="https://gastruc.github.io/unigeoclip">UniGeoCLIP - Unified Geospatial Contrastive Learning</a></strong><br>Geospatial understanding requires reasoning across fundamentally different kinds of data -- a satellite view from above, a street photo at ground level, a 3D elevation map, a text description of a neighborhood, and a pair of GPS coordinates. These modalities are complementary: each one captures something the others miss&#8230;UniGeoCLIP is the first contrastive framework to jointly align all five modalities into a single unified embedding space, enabling seamless retrieval and reasoning across any combination of inputs, without relying on a privileged &#8220;pivot&#8221; modality&#8230;</p><p></p></li><li><p><strong><a href="https://timzaman.com/getting-into-ai-infra">Getting Into AI Infra</a><br></strong>My next blog post will be about my 10-year Silicon Valley AI tour of duty &#8212; NVIDIA -&gt; Tesla AI -&gt; X -&gt; DeepMind -&gt; OpenAI&#8230;but I wanted to start with something more practical: how to get into AI infra. I joined NVIDIA in 2016, back when the Deep Learning Systems team still fit in one room. &#8220;AI infra&#8221; was not really a &#8216;thing&#8217; yet. When clmt started the &#8216;AI Infra&#8217; org I was the first engineer to join. This post is my version of how I made my way there, and a fun way to catch up&#8230;</p></li></ul><div><hr></div><h1><strong>What&#8217;s on your mind</strong></h1><h2>This Week&#8217;s Poll:</h2><div class="poll-embed" data-attrs="{&quot;id&quot;:496288}" data-component-name="PollToDOM"></div><p>.</p><h2>Last Week&#8217;s Poll:</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!8w2i!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7184921d-e026-4f9f-8d4a-ce91f0040637_1152x750.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!8w2i!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7184921d-e026-4f9f-8d4a-ce91f0040637_1152x750.png 424w, https://substackcdn.com/image/fetch/$s_!8w2i!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7184921d-e026-4f9f-8d4a-ce91f0040637_1152x750.png 848w, https://substackcdn.com/image/fetch/$s_!8w2i!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7184921d-e026-4f9f-8d4a-ce91f0040637_1152x750.png 1272w, https://substackcdn.com/image/fetch/$s_!8w2i!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7184921d-e026-4f9f-8d4a-ce91f0040637_1152x750.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!8w2i!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7184921d-e026-4f9f-8d4a-ce91f0040637_1152x750.png" width="600" height="390.625" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/7184921d-e026-4f9f-8d4a-ce91f0040637_1152x750.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:750,&quot;width&quot;:1152,&quot;resizeWidth&quot;:600,&quot;bytes&quot;:95405,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://datascienceweekly.substack.com/i/194451888?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7184921d-e026-4f9f-8d4a-ce91f0040637_1152x750.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!8w2i!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7184921d-e026-4f9f-8d4a-ce91f0040637_1152x750.png 424w, https://substackcdn.com/image/fetch/$s_!8w2i!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7184921d-e026-4f9f-8d4a-ce91f0040637_1152x750.png 848w, https://substackcdn.com/image/fetch/$s_!8w2i!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7184921d-e026-4f9f-8d4a-ce91f0040637_1152x750.png 1272w, https://substackcdn.com/image/fetch/$s_!8w2i!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7184921d-e026-4f9f-8d4a-ce91f0040637_1152x750.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>.</p><div><hr></div><h2>Data Science Articles &amp; Videos</h2><p></p><ul><li><p><strong><a href="https://notstatschat.rbind.io/2026/04/13/are-predictive-models-enough/">Are predictive models enough?</a></strong><br>In one of the social media discussions about causal inference, the suggestion was made that predictive models are all you need: a good predictive model gives you all the conditional distributions you could want, and you don&#8217;t need any special causal inference stuff&#8230;I think there&#8217;s something to this point of view, but there are a few limitations&#8230;<br></p></li><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1shxrj5/how_many_production_mlai_projects_do_you_complete/">How many production ML/AI projects do you complete in a year? [Reddit]</a></strong></p><p>Wondering what it looks like at other companies. I usually deliver around 3 or 4 ML/AI projects each year. I&#8217;m also expected to do multiple analyses separate from this so I&#8217;m not only focused on ML/AI. We have a small team of 7 people and we rarely collaborate on projects. What is it like at your company?&#8230;</p><p></p></li><li><p><strong><a href="https://www.owlposting.com/p/on-creating-new-knobs-of-control">On creating &#8216;new knobs of control&#8217; in biology</a></strong><br>How can we regain more control over our poorly built physiology? Or, in other words, how we install more &#8216;knobs of control&#8217;? I had this question too! It turns out there&#8217;s a lot of new emerging therapeutic modalities that fit this criteria, and I decided to turn my research over them into an essay&#8230;<br></p></li><li><p><strong><a href="https://ropensci.org/blog/2026/04/02/tree-sitter-overview/">A Better R Programming Experience Thanks to Tree-sitter</a><br></strong>R tooling around Tree-sitter is how you get</p><ul><li><p>reformatting through <a href="https://posit-dev.github.io/air/">Air</a> and linting through <a href="https://jarl.etiennebacher.com/">Jarl</a>;</p></li><li><p>auto-completion or help on hover in the <a href="https://lionel-.github.io/slidedecks/2024-07-11-ark">Positron IDE</a>;</p></li><li><p>better <a href="https://github.com/orgs/community/discussions/120397">search</a> for R on GitHub;</p></li><li><p>and more!</p></li></ul><p>In this post, we&#8217;ll explain what Tree-sitter is, and how tools built on Tree-sitter can benefit your R development workflow&#8230;<br></p></li><li><p><strong><a href="https://valuedrivendatascience.com/101">Why Traditional Statistics Still Matters in the Age of AI</a></strong><br>In this episode, Prof. Rob Hyndman joins Dr. Genevieve Hayes to make the case for why rigorous statistical thinking remains indispensable in the age of AI, and what data scientists are giving up when they abandon it&#8230;.In this episode, you&#8217;ll discover:</p><ol><li><p>Why throwing data at an LLM is no substitute for building a model that understands the problem</p></li><li><p>How combining classical statistics and machine learning can produce better forecasting results than either approach alone</p></li><li><p>What data scientists lose when they stop thinking probabilistically - and why it matters for decision making</p></li><li><p>Where to start if you want to strengthen your statistical foundations&#8230;<br></p></li></ol></li><li><p><strong><a href="https://www.cockroachlabs.com/blog/raft-is-so-fetch/">Raft is so fetch: The Raft Consensus Algorithm explained through &#8220;Mean Girls&#8221;</a></strong><br>Raft is a consensus algorithm used in distributed systems to ensure that data is replicated safely and consistently. That sentence alone can be confusing&#8230;In fact, I&#8217;ve seen conversations recently on social media in which actual technical leaders of infrastructure companies demonstrate a lack of understanding (!). Point being, you&#8217;re not alone. Get in, losers, we&#8217;re going back to (Hollywood) high school&#8230;<code><br></code></p></li><li><p><strong><a href="https://stevehanov.ca/blog/succinct-data-structures-cramming-80000-words-into-a-javascript-file">Succinct Data Structures: Cramming 80,000 words into a Javascript file</a><br></strong>Let&#8217;s continue our short tour of data structures for storing words. Today, we will over-optimize John Resig&#8217;s Word Game. Along the way, we shall learn about a little-known branch of computer science, called succinct data structures&#8230;.<br></p></li><li><p><strong><a href="https://magazine.sebastianraschka.com/p/components-of-a-coding-agent">Components of A Coding Agent</a></strong><br>In this article, I want to cover the overall design of coding agents and agent harnesses: what they are, how they work, and how the different pieces fit together in practice. Readers of my Build a Large Language Model (From Scratch) and Build a Large Reasoning Model (From Scratch) books often ask about agents, so I thought it would be useful to write a reference I can point to&#8230;In this article, I lay out six of the main building blocks of a coding agent&#8230;<br></p></li><li><p><strong><a href="https://nathanbenaich.substack.com/p/state-of-ai-april-2026-newsletter">State of AI: April 2026 newsletter</a></strong></p><p>Welcome to the latest issue of the State of AI, an editorialized newsletter that covers the key developments in AI policy, research, industry, and start-ups from February 1 to April 7, 2026&#8230;<br></p></li><li><p><strong><a href="https://mindfulmodeler.substack.com/p/regression-should-predict-full-distributions">Regression should predict full distributions</a></strong><br>While approaches like linear regression can output full predictive distributions, these often come with (too) strong distributional assumptions. What if we always worked with machine learning models that produce the full predictive distribution? With classification, we are already at this point: Modern machine learning approaches output not just the majority class, but a probability for each class. Whether this probability is calibrated is another question. With regression, we are a bit stuck with a point-based mindset. However, this could change with tabular foundation models. At least in theory: While these models produce the full predictive distribution (or at least a discretized approximation over a fixed support), it&#8217;s not the default and the output is a bit hidden&#8230;<br></p></li><li><p><strong><a href="https://www.astrolog.org/labyrnth/algrithm.htm">Maze Classification</a></strong></p><p>Mazes in general (and hence algorithms to create Mazes) can be organized along seven different classifications. These are: Dimension, Hyperdimension, Topology, Tessellation, Routing, Texture, and Focus. A Maze can take one item from each of the classes in any combination&#8230;<br></p></li><li><p><strong><a href="https://www.reddit.com/r/dataanalysis/comments/1s9i98m/what_is_a_data_analysis_mistake_you_made_early_in/">What is a data analysis mistake you made early in your career that you will never make again? [Reddit]</a><br></strong>For those who are working as data analysts or learning analytics, what&#8217;s one mistake you made early on that taught you a big lesson? Could be technical, communication, dashboards, SQL, Excel, anything. I think beginners like me could learn a lot from real experiences&#8230;<br></p></li><li><p><strong><a href="https://www.evanlin.ca/writing/exploring-attnres">What I Learned Building Attention Residuals from Scratch</a><br></strong>Naively reimplementing a paper in PyTorch changed how I think about how transformers route information, and about the gap between academic math and physical silicon&#8230;I wanted to understand how transformers actually route information between layers. Not at the level of &#8220;attention computes weighted averages,&#8221; but at the level of what physically happens to a tensor as it moves through the network. What gets preserved, what gets overwritten, and why&#8230;.</p></li></ul><p>.</p><div><hr></div><h2>Last Week's Newsletter's 3 Most Clicked Links</h2><ul><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1sfsijd/built_a_dashboard_to_analyze_how_ai_skills_are/">Built a dashboard to analyze how AI skills are showing up in data science job postings (open source) [Reddit]</a></strong></p></li><li><p><strong><a href="https://piechowski.io/post/git-commands-before-reading-code/">The Git Commands I Run Before Reading Any Code</a></strong></p></li><li><p><strong><a href="https://www.pymc-labs.com/blog-posts/open-sourcing-decision-lab-scaling-ai-judgment-data-science">Agentic Data Science Done Right: Why AI Coding Agents Make Bad Analytical Decisions - And How to Fix It</a></strong></p></li></ul><p>.<br>* Based on unique clicks.<br>** Please take a look at last week's issue #646 <a href="https://datascienceweekly.substack.com/p/data-science-weekly-issue-646">here</a>.</p><div><hr></div><h2>Cutting Room Floor</h2><ul><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1sbfbv7/whats_you_recommendation_to_get_interview_ready/">What&#8217;s you recommendation to get interview ready again the fastest? [Reddit]</a></strong></p></li><li><p><strong><a href="https://www.reddit.com/r/MachineLearning/comments/1sdmn97/d_how_to_break_free_from_llms_chains_as_a_phd/">How to break free from LLM&#8217;s chains as a PhD student? [Reddit]</a></strong></p></li><li><p><strong><a href="https://howhttps.works/">How HTTPS Works</a></strong></p></li><li><p><strong><a href="https://koaning.io/posts/legos-vs-3d-printers/">legos vs 3d printers</a></strong></p></li><li><p><strong><a href="https://www.youtube.com/watch?v=6xeeK8jwd5k">Guest Lecture by Eric Wallace of OpenAI on hardening LLMs</a></strong></p></li><li><p><strong><a href="https://itcanthink.substack.com/p/why-is-everyones-robot-folding-clothes">Why is Everyone&#8217;s Robot Folding Clothes?</a></strong></p></li><li><p><strong><a href="https://arxiv.org/abs/2604.13036">Lyra 2.0: Explorable Generative 3D Worlds</a></strong></p></li></ul><p>.</p><div><hr></div><h2><strong>Whenever you're ready, 3 ways we can help:</strong><br></h2><ol><li><p><strong>Go deeper each week (paid subscription)</strong><br>Get 3 additional posts per week designed to help you:</p><ul><li><p>Statistics &#8594; understand the math behind ML</p></li><li><p>AI Agents &#8594; build with modern AI tools</p></li><li><p>Career &#8594; become more valuable at your job</p></li></ul><p><strong>&#128073; <a href="https://datascienceweekly.substack.com/subscribe">Upgrade for $10/month &#8212; cancel anytime</a><br></strong></p></li><li><p><strong>Looking to get a job?</strong><br>A practical guide to landing your first (or next) data science role, based on thousands of reader questions.<br><strong>&#128073; <a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">Check out our </a></strong><em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">&#8220;Get A Data Science Job&#8221;</a></strong></em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide"> Course</a></strong><br></p></li><li><p><strong>Promote your organization/project/event to ~68,500 subscribers<br></strong>Sponsor this newsletter and reach a highly engaged data science audience (30&#8211;35% open rate).<br><strong>&#128073; Reply to this email to learn more</strong></p></li></ol><div><hr></div><p>Thank you for joining us this week! :)</p><p>Stay Data Science-y!</p><p>All our best,<br>Hannah &amp; Sebastian</p><div><hr></div><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://datascienceweekly.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Data Science Weekly Newsletter is a reader-supported publication. To receive new posts and support our work, consider becoming a free or paid subscriber.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div>]]></content:encoded></item><item><title><![CDATA[Data Science Weekly - Issue 646]]></title><description><![CDATA[Curated news, articles and jobs related to Data Science, AI, & Machine Learning]]></description><link>https://datascienceweekly.substack.com/p/data-science-weekly-issue-646</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/data-science-weekly-issue-646</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Thu, 09 Apr 2026 19:45:36 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!4vPZ!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F437e63d0-4e7f-4560-aed2-861639b6881c_1136x432.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!byfl!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" width="319" height="253" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/17becea5-db12-4465-be92-858de78b9137_319x253.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:253,&quot;width&quot;:319,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;Data Science Weekly&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="Data Science Weekly" title="Data Science Weekly" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2><strong>Issue #646<br>April 09, 2026<br></strong></h2><div><hr></div><p>Hello!</p><p><strong>Once a week, we write this email to share the links we thought were worth sharing in the Data Science, ML, AI, Data Visualization, and ML/Data Engineering worlds.</strong></p><div><hr></div><p><em><strong>And now&#8230;let&#8217;s dive into some interesting links from this week.</strong></em></p><div><hr></div><h2><strong>Editor's Picks<br></strong></h2><ul><li><p><strong><a href="https://blog.runevision.com/2026/03/fast-and-gorgeous-erosion-filter.html">Fast and Gorgeous Erosion Filter</a><br></strong>This blog post and the companion video both explain an erosion technique I&#8217;ve worked on over the past eight months. The video has lots of elaborate animated visuals, and is more focused on my process of discovering, refining, and evolving the technique, while this post has a bit more implementation details on the final iteration&#8230;.</p></li></ul><ul><li><p><strong><a href="https://ai-project-website.github.io/AI-assistance-reduces-persistence/">AI Assistance Reduces Persistence and Hurts Independent Performance</a></strong><br>Through a series of randomized controlled trials on human-AI interactions (N = 1,222), we provide causal evidence for two key consequences of AI assistance: reduced persistence and impairment of unassisted performance. Across a variety of tasks, including mathematical reasoning and reading comprehension, we find that although AI assistance improves performance in the short-term, people perform significantly worse without AI and are more likely to give up. Notably, these effects emerge after only brief interactions with AI (approximately 10 minutes). These findings are particularly concerning because persistence is foundational to skill acquisition and is one of the strongest predictors of long-term learning&#8230;</p><p></p></li><li><p><strong><a href="https://news.ycombinator.com/item?id=47654062">Ask HN: Any interesting niche hobbies?</a><br></strong>I&#8217;m looking for something novel and interesting, that isn&#8217;t absolutely crowded that I could meaningfully contribute to&#8230;</p></li></ul><div><hr></div><h1><strong>What&#8217;s on your mind</strong></h1><h2>This Week&#8217;s Poll:</h2><div class="poll-embed" data-attrs="{&quot;id&quot;:492348}" data-component-name="PollToDOM"></div><p>.</p><h2>Last Week&#8217;s Poll:</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!4vPZ!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F437e63d0-4e7f-4560-aed2-861639b6881c_1136x432.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!4vPZ!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F437e63d0-4e7f-4560-aed2-861639b6881c_1136x432.png 424w, https://substackcdn.com/image/fetch/$s_!4vPZ!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F437e63d0-4e7f-4560-aed2-861639b6881c_1136x432.png 848w, https://substackcdn.com/image/fetch/$s_!4vPZ!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F437e63d0-4e7f-4560-aed2-861639b6881c_1136x432.png 1272w, https://substackcdn.com/image/fetch/$s_!4vPZ!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F437e63d0-4e7f-4560-aed2-861639b6881c_1136x432.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!4vPZ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F437e63d0-4e7f-4560-aed2-861639b6881c_1136x432.png" width="1136" height="432" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/437e63d0-4e7f-4560-aed2-861639b6881c_1136x432.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:432,&quot;width&quot;:1136,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:52357,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://datascienceweekly.substack.com/i/193702222?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F437e63d0-4e7f-4560-aed2-861639b6881c_1136x432.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!4vPZ!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F437e63d0-4e7f-4560-aed2-861639b6881c_1136x432.png 424w, https://substackcdn.com/image/fetch/$s_!4vPZ!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F437e63d0-4e7f-4560-aed2-861639b6881c_1136x432.png 848w, https://substackcdn.com/image/fetch/$s_!4vPZ!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F437e63d0-4e7f-4560-aed2-861639b6881c_1136x432.png 1272w, https://substackcdn.com/image/fetch/$s_!4vPZ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F437e63d0-4e7f-4560-aed2-861639b6881c_1136x432.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>.</p><div><hr></div><h2>Data Science Articles &amp; Videos</h2><p></p><ul><li><p><strong><a href="https://mchav.github.io/what-category-theory-teaches-us-about-dataframes/">What Category Theory Teaches Us About DataFrames</a></strong><br>Every dataframe library ships with hundreds of operations. pandas alone has over 200 methods on a DataFrame&#8230;Without a framework for telling them apart, you end up memorizing APIs instead of understanding structure&#8230;I ran into this question while building my own dataframe library. I needed to decide which operations were truly fundamental and which were just surface-level variations. That search led me to Petersohn et al.&#8217;s Towards Scalable Dataframe Systems&#8230;They analyzed 1 million Jupyter notebooks, cataloged how people use pandas, and proposed a dataframe algebra: a formal set of about 15 operators that can express what all 200+ pandas operations do&#8230;<br></p></li><li><p><strong><a href="https://www.reddit.com/r/datascience/comments/1sfsijd/built_a_dashboard_to_analyze_how_ai_skills_are/">Built a dashboard to analyze how AI skills are showing up in data science job postings (open source) [Reddit]</a></strong></p><p>I&#8217;ve been scraping thousands of U.S. data science jobs for the past couple of months and writing about the findings in my newsletter&#8230;At some point, I figured the dashboard was more useful than anything I was writing, so I decided to open-source it&#8230;Here&#8217;s what it covers:</p><ul><li><p>Top skills companies are actually hiring for, ranked by frequency</p></li><li><p>Skills broken down by category (ML/DL, GenAI, Cloud, MLOps, etc.)</p></li><li><p>What % of roles now require AI skills, broken down by seniority level</p></li><li><p>Salary premium for candidates with AI skills</p></li><li><p>An interactive explorer where you can browse individual postings with matched skills highlighted</p></li></ul><p>The skill extraction is built on around 230 curated keyword groups, so it&#8217;s pretty granular&#8230;</p><p></p></li><li><p><strong><a href="https://slicker.me/sqlite/features.htm">Modern SQLite: Features You Didn&#8217;t Know It Had</a></strong><br>Working with JSON data&#8230;Full-text search with FTS5&#8230;Analytics with window functions and CTEs&#8230;Strict tables and better typing&#8230;Generated columns for derived data&#8230;Write-ahead logging and concurrency&#8230;<br></p></li><li><p><strong><a href="https://ngrok.com/blog/quantization">Quantization from the ground up</a><br></strong>Qwen-3-Coder-Next is an 80-billion-parameter model, 159.4 GB in size. That&#8217;s roughly how much RAM you would need to run it, and that&#8217;s before thinking about long context windows. This is not considered a big model. Rumors have it that frontier models have over 1 trillion parameters, which would require at least 2TB of RAM. The last time I saw that much RAM in one machine was never. But what if I told you we can make LLMs 4x smaller and 2x faster, enough to run very capable models on your laptop, all while losing only 5-10% accuracy. That&#8217;s the magic of quantization&#8230;<br></p></li><li><p><strong><a href="https://piechowski.io/post/git-commands-before-reading-code/">The Git Commands I Run Before Reading Any Code</a></strong><br>Five git commands that tell you where a codebase hurts before you open a single file. Churn hotspots, bus factor, bug clusters, and crisis patterns&#8230;.The first thing I usually do when I pick up a new codebase isn&#8217;t opening the code. It&#8217;s opening a terminal and running a handful of git commands. Before I look at a single file, the commit history gives me a diagnostic picture of the project: who built it, where the problems cluster, whether the team is shipping with confidence or tiptoeing around land mines&#8230;.<br></p></li><li><p><strong><a href="https://www.perfectlynormal.co.uk/blog-kl-divergence">Six (and a half) intuitions for KL divergence</a></strong><br>KL-divergence is a topic which crops up in a ton of different places in information theory and machine learning, so it&#8217;s important to understand well. Unfortunately, it has some properties which seem confusing at a first pass (e.g. it isn&#8217;t symmetric like we would expect from most distance measures, and it can be unbounded as we take the limit of probabilities going to zero). There are lots of different ways you can develop good intuitions for it that I&#8217;ve come across in the past. This post is my attempt to collate all these intuitions, and try and identify the underlying commonalities between them&#8230;<code><br></code></p></li><li><p><strong><a href="https://softwaredoug.com/blog/2026/01/08/semantic-search-without-embeddings">Semantic Search Without Embeddings</a><br></strong>When I need to stay warm, I search for &#8220;long johns&#8221; or &#8220;long underwear&#8221;. But modern outdoors clothing stores label this a &#8220;base layer&#8221;. For a waterproof jacket I search for &#8220;slickers&#8221; or a &#8220;ski jacket&#8221;, not realizing what I should search for is a &#8220;shell.&#8221; Despite my outdated terminology, search still works. I&#8217;m somehow understood and shown the right content. We call this semantic search. When you hear that, you might think embeddings. Today I want to stretch your thinking beyond&#8230;In semantic search, content and query map to a shared representation. This space has a similarity function that scores similar items higher than less similar. Let&#8217;s walk through an example&#8230;<br></p></li><li><p><strong><a href="https://www.pymc-labs.com/blog-posts/open-sourcing-decision-lab-scaling-ai-judgment-data-science">Agentic Data Science Done Right: Why AI Coding Agents Make Bad Analytical Decisions - And How to Fix It</a></strong><br>AI coding agents write correct code. They make unreliable analytical decisions. That gap between syntactically valid code and statistically sound conclusions is where costly mistakes are made. Decision Lab is an open-source framework that closes this gap by encoding domain expertise, multi-path exploration, and Bayesian uncertainty quantification into every agent run&#8230;<br></p></li><li><p><strong><a href="https://lalitm.com/post/building-syntaqlite-ai/">Eight years of wanting, three months of building with AI</a></strong></p><p>For eight years, I&#8217;ve wanted a high-quality set of devtools for working with SQLite. Given how important SQLite is to the industry, I&#8217;ve long been puzzled that no one has invested in building a really good developer experience for it&#8230;A couple of weeks ago, after ~250 hours of effort over three months on evenings, weekends, and vacation days, I finally released syntaqlite (GitHub), fulfilling this long-held wish. And I believe the main reason this happened was because of AI coding agents&#8230;there&#8217;s no shortage of posts claiming that AI one-shot their project or pushing back and declaring that AI is all slop. I&#8217;m going to take a very different approach and, instead, systematically break down my experience building syntaqlite with AI, both where it helped and where it was detrimental. I&#8217;ll do this while contextualizing the project and my background so you can independently assess how generalizable this experience was. And whenever I make a claim, I&#8217;ll try to back it up with evidence from my project journal, coding transcripts, or commit history&#8230;<br></p></li><li><p><strong><a href="https://devonzuegel.com/land-development-math-is-alchemy">Land development math is alchemy: Why cheap land is cheap &amp; how to turn it into gold</a></strong><br>Friends often send me links to beautiful parcels of land with prices that are too good to be true&#8230;When we look into the underlying development potential, it quickly explains the price: you&#8217;re not allowed to build much on it. The land isn&#8217;t &#8220;entitled.&#8221; Entitlement is the legal process by which raw land gets permission to be developed &#8212; in California, it&#8217;s long, expensive, uncertain, and controlled by local governments. Cheap land is typically cheap because the market has priced in how risky it is to get that permission. The discount isn&#8217;t a bargain; it reflects the work (and luck) required to unlock the value. But if you do succeed in entitling land for significant development, its value shoots up to reflect the new permitted supply (assuming the underlying market is strong). I call this &#8220;entitlement alchemy&#8221;. The dirt doesn&#8217;t move, but the piece of paper saying &#8220;you may build here&#8221; can double the value overnight. In supply-constrained markets, permission to build is a huge portion of the land&#8217;s value&#8230;<br></p></li><li><p><strong><a href="https://stbl.wrangle.zone/">stbl</a></strong></p><p>R is flexible about classes. Variables are not declared with explicit classes, and arguments of the &#8220;wrong&#8221; class don&#8217;t cause errors until they explicitly fail at some point in the call stack. It would be helpful to keep that flexibility from a user standpoint, but to error informatively and quickly if the inputs will not work for a computation. The purpose of stbl is to allow programmers to specify what they want, and to then see if what the user supplied can work for that purpose.</p><p>This approach aligns with <a href="https://en.wikipedia.org/wiki/Robustness_principle">Postel&#8217;s Law</a>:</p><blockquote><p>&#8220;Be conservative in what you send. Be liberal in what you accept from others.&#8221;</p></blockquote><p>stbl is liberal about what it accepts (by coercing when safe) and conservative about what it returns (by ensuring that inputs have the classes and other features that are expected)&#8230;<br></p></li><li><p><strong><a href="https://www.reddit.com/r/MachineLearning/comments/1sbzxwn/d_those_of_you_with_10_years_in_ml_what_is_the/">Those of you with 10+ years in ML &#8212; what is the public completely wrong about? [Reddit]</a><br></strong>For those of you who&#8217;ve been in ML/AI research or applied ML for 10+ years &#8212; what&#8217;s the gap between what the public thinks AI is doing vs. what&#8217;s actually happening at the frontier? What are we collectively underestimating or overestimating?&#8230;<br></p></li><li><p><strong><a href="https://itsalearningcurve.education/cogsci-book-summaries-and-pd-versions/">Cogsci Book Summaries</a><br></strong>A reading list of 79 books about cognitive science and its application to the classroom&#8230;For each book there is a pdf of my summary&#8230;</p></li></ul><p>.</p><div><hr></div><h2>Last Week's Newsletter's 3 Most Clicked Links</h2><ul><li><p><strong><a href="https://hamel.dev/blog/posts/revenge/">The Revenge of the Data Scientist</a></strong></p></li><li><p><strong><a href="https://claude.nagdy.me/">Learn Claude Code by doing, not reading</a></strong></p></li><li><p><strong><a href="https://docs.google.com/document/d/1ZW8f0eFEZhwmKeRu1KqxLFMaouajmEGfvZF0Us_G4Iw/edit?tab=t.0">100 Economics Papers to Inspire Wonder</a></strong></p></li></ul><p>.<br>* Based on unique clicks.<br>** Please take a look at last week's issue #645 <a href="https://datascienceweekly.substack.com/p/data-science-weekly-issue-645">here</a>.</p><div><hr></div><h2>Cutting Room Floor</h2><ul><li><p><strong><a href="https://aphyr.com/posts/411-the-future-of-everything-is-lies-i-guess">ML promises to be profoundly weird - The Future of Everything is Lies, I Guess</a></strong></p></li><li><p><strong><a href="https://antithesis.com/docs/resources/reliability_glossary/">A distributed systems reliability glossary</a></strong></p></li><li><p><strong><a href="https://github.com/arman-bd/guppylm">GuppyLM A ~9M parameter LLM that talks like a small fish</a></strong></p></li><li><p><strong><a href="https://vnav.mit.edu/">MIT16.485 - Visual Navigation for Autonomous Vehicles</a></strong></p></li></ul><p>.</p><div><hr></div><h2><strong>Whenever you're ready, 3 ways we can help:</strong><br></h2><ol><li><p><strong>Go deeper each week (paid subscription)</strong><br>Get 3 additional posts per week designed to help you:</p><ul><li><p>Statistics &#8594; understand the math behind ML</p></li><li><p>AI Agents &#8594; build with modern AI tools</p></li><li><p>Career &#8594; become more valuable at your job</p></li></ul><p><strong>&#128073; <a href="https://datascienceweekly.substack.com/subscribe">Upgrade for $10/month &#8212; cancel anytime</a><br></strong></p></li><li><p><strong>Looking to get a job?</strong><br>A practical guide to landing your first (or next) data science role, based on thousands of reader questions.<br><strong>&#128073; <a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">Check out our </a></strong><em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">&#8220;Get A Data Science Job&#8221;</a></strong></em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide"> Course</a></strong><br></p></li><li><p><strong>Promote your organization/project/event to ~68,000 subscribers<br></strong>Sponsor this newsletter and reach a highly engaged data science audience (30&#8211;35% open rate).<br><strong>&#128073; Reply to this email to learn more</strong></p></li></ol><div><hr></div><p>Thank you for joining us this week! :)</p><p>Stay Data Science-y!</p><p>All our best,<br>Hannah &amp; Sebastian</p><div><hr></div><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://datascienceweekly.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Data Science Weekly Newsletter is a reader-supported publication. To receive new posts and support our work, consider becoming a free or paid subscriber.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div>]]></content:encoded></item><item><title><![CDATA[Data Science Weekly - Issue 645]]></title><description><![CDATA[Curated news, articles and jobs related to Data Science, AI, & Machine Learning]]></description><link>https://datascienceweekly.substack.com/p/data-science-weekly-issue-645</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/data-science-weekly-issue-645</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Thu, 02 Apr 2026 10:19:24 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!h48u!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1819da4a-e375-4859-a061-970377e08cc2_1162x760.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!byfl!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png" width="319" height="253" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/17becea5-db12-4465-be92-858de78b9137_319x253.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:253,&quot;width&quot;:319,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;Data Science Weekly&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="Data Science Weekly" title="Data Science Weekly" srcset="https://substackcdn.com/image/fetch/$s_!byfl!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 424w, https://substackcdn.com/image/fetch/$s_!byfl!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 848w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1272w, https://substackcdn.com/image/fetch/$s_!byfl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F17becea5-db12-4465-be92-858de78b9137_319x253.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2><strong>Issue #645<br>April 02, 2026<br></strong></h2><div><hr></div><p>Hello!</p><p><strong>Once a week, we write this email to share the links we thought were worth sharing in the Data Science, ML, AI, Data Visualization, and ML/Data Engineering worlds.</strong></p><div><hr></div><h2><strong>This Week in Data Science Weekly (Paid)</strong></h2><p>Each week, paid subscribers get 3 additional deep dives to help you. Here are the last three:</p><ul><li><p><strong>Understanding core statistics</strong></p><ul><li><p><a href="https://datascienceweekly.substack.com/p/monday-statistics-when-data-isnt">When Data Isn&#8217;t Normal</a></p></li></ul></li><li><p><strong>Build with modern AI tools</strong></p><ul><li><p><a href="https://datascienceweekly.substack.com/p/what-makes-an-ai-agent-autonomous">What Makes an AI Agent &#8220;Autonomous&#8221;?</a></p></li></ul></li><li><p><strong>Career Accelerator (get paid more and be better at your job)</strong></p><ul><li><p><a href="https://datascienceweekly.substack.com/p/the-10-minute-sunday-habit-that-makes">The 10-Minute Sunday Habit That Makes Your Week Easier</a></p></li></ul></li></ul><p>If you&#8217;ve been reading for a while, this is where things go deeper.</p><blockquote><p>&#128073; Get all 3 posts each week &#8594; <a href="https://datascienceweekly.substack.com/subscribe">Upgrade for $10/month</a></p></blockquote><div><hr></div><p><em><strong>And now&#8230;let&#8217;s dive into some interesting links from this week.</strong></em></p><div><hr></div><h2><strong>Editor's Picks<br></strong></h2><ul><li><p><strong><a href="https://hamel.dev/blog/posts/revenge/">The Revenge of the Data Scientist</a><br></strong>Training models was never most of the job. The bulk of the work is setting up experiments to test how well the AI generalizes to unseen data, debugging stochastic systems, and designing good metrics. Calling an LLM over an API does not make this work go away&#8230;I recently gave a talk titled &#8220;<em>The Revenge of the Data Scientist</em>&#8221; at PyAI Conf to make that case with examples rather than assertions alone. Below is an annotated version of that presentation&#8230;</p></li></ul><ul><li><p><strong><a href="https://docs.google.com/document/d/1ZW8f0eFEZhwmKeRu1KqxLFMaouajmEGfvZF0Us_G4Iw/edit?tab=t.0">100 Economics Papers to Inspire Wonder</a></strong><br>Making a list of a hundred papers in economics that fill me with wonder, joy, and excitement&#8230;</p><p></p></li><li><p><strong><a href="https://papers.ssrn.com/sol3/papers.cfm?abstract_id=4668072">James H. Simons, PhD: Using Mathematics to Make Money</a><br></strong>In September 2022, James Simons spoke with members of the Journal of Investment Consulting editorial board about how his experience as a mathematician prepared him for success in the financial world; the main ingredients of his quantitative investment firm&#8217;s success&#8212;building and continuously improving investment models through regular testing; hiring excellent scientists who have decided they want to make money rather than people with previous experience in finance; and fostering collaboration among the company&#8217;s workforce&#8230;</p></li></ul><div><hr></div><h1><strong>What&#8217;s on your mind</strong></h1><h2>This Week&#8217;s Poll:</h2><div class="poll-embed" data-attrs="{&quot;id&quot;:488212}" data-component-name="PollToDOM"></div><p>.</p><h2>Last Week&#8217;s Poll:</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!h48u!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1819da4a-e375-4859-a061-970377e08cc2_1162x760.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!h48u!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1819da4a-e375-4859-a061-970377e08cc2_1162x760.png 424w, https://substackcdn.com/image/fetch/$s_!h48u!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1819da4a-e375-4859-a061-970377e08cc2_1162x760.png 848w, https://substackcdn.com/image/fetch/$s_!h48u!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1819da4a-e375-4859-a061-970377e08cc2_1162x760.png 1272w, https://substackcdn.com/image/fetch/$s_!h48u!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1819da4a-e375-4859-a061-970377e08cc2_1162x760.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!h48u!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1819da4a-e375-4859-a061-970377e08cc2_1162x760.png" width="632" height="413.3562822719449" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/1819da4a-e375-4859-a061-970377e08cc2_1162x760.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:760,&quot;width&quot;:1162,&quot;resizeWidth&quot;:632,&quot;bytes&quot;:96411,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://datascienceweekly.substack.com/i/192940096?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1819da4a-e375-4859-a061-970377e08cc2_1162x760.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!h48u!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1819da4a-e375-4859-a061-970377e08cc2_1162x760.png 424w, https://substackcdn.com/image/fetch/$s_!h48u!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1819da4a-e375-4859-a061-970377e08cc2_1162x760.png 848w, https://substackcdn.com/image/fetch/$s_!h48u!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1819da4a-e375-4859-a061-970377e08cc2_1162x760.png 1272w, https://substackcdn.com/image/fetch/$s_!h48u!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1819da4a-e375-4859-a061-970377e08cc2_1162x760.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>.</p><div><hr></div><h2>Data Science Articles &amp; Videos</h2><p></p><ul><li><p><strong><a href="https://davidoks.blog/p/how-the-spreadsheet-reshaped-america">Seeing like a spreadsheet</a></strong><br>You cannot really understand the transformation of the American economy over the last few decades without understanding the spreadsheet. This is a story about how a piece of software transformed the way that American businesses understood themselves, and how they were understood by others; how it enabled the rise of financial engineering and the entire apparatus of Wall Street dealmaking; how it helped reshape the American corporation from an organization that built things into an organization that optimized numbers; and how it offers us a lesson, and a warning, about how artificial intelligence will transform economic life&#8230;</p></li><li><p><strong><a href="https://www.reddit.com/r/AskStatistics/comments/1s8fo72/bayesian_statistics_future_relevance/">Bayesian Statistics Future Relevance [Reddit]</a></strong></p><p>I have been interested in Bayesian statistics for a long time and would like to do some research in it on an applied project. However, I was wondering how relevant it is/is going to be in the future? Genuinely asking as I have no idea. I am interested in doing some work in advanced Bayesian hierarchical models. Would doing more stuff in ML/AI be more beneficial for trying to get a job in industry or is Bayesian work going to be sought after?&#8230;</p><p></p></li><li><p><strong><a href="https://ml-visualized.com/index.html">Machine Learning Visualized</a></strong><br>Book of Jupyter Notebooks that implement and mathematically derive machine learning algorithms from first-principles. The output of each notebook is a visualization of the machine learning algorithm throughout its training phase, ultimately converging at its optimal weights&#8230;<br></p></li><li><p><strong><a href="https://stevensalzberg.substack.com/p/ai-is-starting-to-look-like-pseudoscience">AI badly needs a dose of skepticism - Some scientists are too eager to believe their own claims</a><br></strong>I explain some of my reasons for being deeply skeptical about AI models that claim to understand DNA, genes, and genomes&#8230;<br></p></li><li><p><strong><a href="https://capestart.com/technology-blog/serverless-social-media-ingestion-analytics-pipeline-on-aws/">How to Build a Scalable Serverless Social Media Ingestion &amp; Analytics Pipeline on AWS</a></strong><br>In this post, we explain how to build a scalable, cost-efficient, and serverless data pipeline on AWS to ingest, process, and visualize social media data&#8230;<br></p></li><li><p><strong><a href="https://papers.ssrn.com/sol3/papers.cfm?abstract_id=6462658">Regulating AI Agents</a></strong><br>The European Union&#8217;s AI Act - promulgated prior to the development and widespread use of AI agents, the EU AI Act faces significant obstacles in confronting the governance challenges arising from this transformative technology, such as performance failures in autonomous task execution, the risk of misuse of agents by malicious actors, and unequal access to the economic opportunities afforded by AI agents. We systematically analyze the EU AI Act&#8217;s response to these challenges, focusing on both the substantive provisions of the regulation and, crucially, the institutional frameworks that aim to support its implementation&#8230;<code><br></code></p></li><li><p><strong><a href="https://blog.ezyang.com/2026/03/autograd-and-mutation/">Autograd and Mutation</a><br></strong>How does PyTorch autograd deal with mutation? In particular, what happens when a mutation occurs on a view, which aliases with some other tensor? In 2017, Sam Gross implemented support for in-place operations on views, but the details of which have never been described in plain English&#8230; until now&#8230;<br></p></li><li><p><strong><a href="https://cargurus.dev/2026/03/06/genstats-standardizing-experimentation-analysis-at-scale/">genStats: Standardizing Experimentation Analysis at Scale</a></strong><br>CarGurus runs hundreds of A/B tests annually to improve every aspect of our marketplace. Because the car-buying journey is complex and touches every part of our platform, we validate product changes through qualitative insights (consumer interviews) and quantitative experimentation (A/B tests)&#8230;genStats is an internal framework orchestrated in Python that standardizes A/B test analysis across CarGurus. It automates notebook generation, centralizes statistical logic, and packages domain-specific metrics into reusable &#8220;metric families,&#8221; addressing the limitations listed above. A Metric Family is a collection of standardized queries. Analysts contribute the queries for the metrics they specifically own. This approach <strong>codifies domain expertise</strong>, turning individual knowledge into a shared tool&#8230;<br></p></li><li><p><strong><a href="https://pos5747.github.io/notes/">Modern Probability Modeling - A Tools Approach</a></strong></p><p>These are notes for my class on probability models. In these notes, I walk through the concepts and computations that support modern probability modeling in political science using both maximum likelihood and Bayesian approaches&#8230;<br></p></li><li><p><strong><a href="https://hadley.github.io/bananarama/">bananarama</a></strong><br>bananarama generates presentation images using Google Gemini. Define your images in a YAML configuration file with support for reference images and style defaults. Using gemini to generate slide images usually means a tedious loop of copying prompts into a web UI, downloading images, tweaking, and repeating. bananarama makes this process reproducible: your prompts live in version-controlled YAML, and regenerating every image is a single function call. No more copy-paste, no more losing track of which prompt produced which image. It also generates all images in parallel, making it wicked fast to generate full deck of images&#8230;<br></p></li><li><p><strong><a href="https://claude.nagdy.me/">Learn Claude Code by doing, not reading.</a></strong></p><p>11 interactive modules with terminal simulators, config builders, and quizzes. No setup required&#8230;<br></p></li><li><p><strong><a href="https://www.statsignificant.com/p/is-hip-hop-in-decline-a-statistical">Is Hip-Hop in Decline? A Statistical Analysis</a><br></strong>Today we&#8217;ll explore hip-hop&#8217;s meteoric rise and supposed fall, the genres gaining traction in recent years, and the forces that shape music popularity&#8230;<br></p></li><li><p><strong><a href="https://arxiv.org/abs/2211.09619">Introduction to Online Control</a><br></strong>This text presents an introduction to an emerging paradigm in control of dynamical systems and differentiable reinforcement learning called online nonstochastic control. The new approach applies techniques from online convex optimization and convex relaxations to obtain new methods with provable guarantees for classical settings in optimal and robust control&#8230;</p></li></ul><p>.</p><div><hr></div><h2>Last Week's Newsletter's 3 Most Clicked Links</h2><ul><li><p><strong><a href="https://nchagnet.pages.dev/blog/bayesian-statistics-for-confused-data-scientists/">Bayesian statistics for confused data scientists</a></strong></p></li><li><p><strong><a href="https://skylarbpayne.com/posts/dspy-engineering-patterns/">If DSPy is So Great, Why Isn&#8217;t Anyone Using It?</a></strong></p></li><li><p><strong><a href="https://www.answer.ai/posts/2026-03-12-so-where-are-all-the-ai-apps.html">So where are all the AI apps?</a></strong></p></li></ul><p>.<br>* Based on unique clicks.<br>** Please take a look at last week's issue #644 <a href="https://datascienceweekly.substack.com/p/data-science-weekly-issue-644">here</a>.</p><div><hr></div><h2>Cutting Room Floor</h2><ul><li><p><strong><a href="https://www.marginalia.nu/log/a_134_nsfw/">An NSFW filter for Marginalia Search</a></strong></p></li><li><p><strong><a href="https://eecs127.github.io/assets/notes/eecs127_reader.pdf">Optimization Models in Engineering - a course reader</a></strong></p></li><li><p><strong><a href="https://luisdva.github.io/rstats/ggpup/">ggpup: place two random dog images next to any ggplot object</a></strong></p></li></ul><p>.</p><div><hr></div><h2><strong>Whenever you're ready, 3 ways we can help:</strong><br></h2><ol><li><p><strong>Go deeper each week (paid subscription)</strong><br>Get 3 additional posts per week designed to help you:</p><ul><li><p>Statistics &#8594; understand the math behind ML</p></li><li><p>AI Agents &#8594; build with modern AI tools</p></li><li><p>Career &#8594; become more valuable at your job</p></li></ul><p><strong>&#128073; <a href="https://datascienceweekly.substack.com/subscribe">Upgrade for $10/month &#8212; cancel anytime</a><br></strong></p></li><li><p><strong>Looking to get a job?</strong><br>A practical guide to landing your first (or next) data science role, based on thousands of reader questions.<br><strong>&#128073; <a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">Check out our </a></strong><em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide">&#8220;Get A Data Science Job&#8221;</a></strong></em><strong><a href="https://www.datascienceweekly.org/data-science-guides/data-science-getting-started-guide"> Course</a></strong><br></p></li><li><p><strong>Promote your organization/project/event to ~68,000 subscribers<br></strong>Sponsor this newsletter and reach a highly engaged data science audience (30&#8211;35% open rate).<br><strong>&#128073; Reply to this email to learn more</strong></p></li></ol><div><hr></div><p>Thank you for joining us this week! :)</p><p>Stay Data Science-y!</p><p>All our best,<br>Hannah &amp; Sebastian</p><div><hr></div><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://datascienceweekly.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Data Science Weekly Newsletter is a reader-supported publication. To receive new posts and support our work, consider becoming a free or paid subscriber.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div>]]></content:encoded></item><item><title><![CDATA[What Makes an AI Agent “Autonomous”?]]></title><description><![CDATA[It&#8217;s not about running forever. It&#8217;s about making decisions without you.]]></description><link>https://datascienceweekly.substack.com/p/what-makes-an-ai-agent-autonomous</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/what-makes-an-ai-agent-autonomous</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Wed, 01 Apr 2026 21:05:54 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1693314879015-d60966d4d178?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1693314879015-d60966d4d178?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1693314879015-d60966d4d178?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 424w, https://images.unsplash.com/photo-1693314879015-d60966d4d178?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 848w, https://images.unsplash.com/photo-1693314879015-d60966d4d178?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1272w, https://images.unsplash.com/photo-1693314879015-d60966d4d178?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1693314879015-d60966d4d178?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" width="3000" height="2000" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1693314879015-d60966d4d178?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:2000,&quot;width&quot;:3000,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;a small stand on a beach with chairs and a table&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="a small stand on a beach with chairs and a table" title="a small stand on a beach with chairs and a table" srcset="https://images.unsplash.com/photo-1693314879015-d60966d4d178?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 424w, https://images.unsplash.com/photo-1693314879015-d60966d4d178?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 848w, https://images.unsplash.com/photo-1693314879015-d60966d4d178?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1272w, https://images.unsplash.com/photo-1693314879015-d60966d4d178?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption"><em>Image Source: <a href="https://unsplash.com/photos/a-small-stand-on-a-beach-with-chairs-and-a-table-8BSAhVK9-Ys">Quy Nguyen</a></em></figcaption></figure></div>
      <p>
          <a href="https://datascienceweekly.substack.com/p/what-makes-an-ai-agent-autonomous">
              Read more
          </a>
      </p>
   ]]></content:encoded></item><item><title><![CDATA[Monday Statistics: When Data Isn’t Normal]]></title><description><![CDATA[Most real-world data doesn&#8217;t follow a perfect bell curve. And that&#8217;s okay.]]></description><link>https://datascienceweekly.substack.com/p/monday-statistics-when-data-isnt</link><guid isPermaLink="false">https://datascienceweekly.substack.com/p/monday-statistics-when-data-isnt</guid><dc:creator><![CDATA[Data Science Weekly]]></dc:creator><pubDate>Mon, 30 Mar 2026 20:28:38 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1588953590637-252f4b0093a8?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1588953590637-252f4b0093a8?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1588953590637-252f4b0093a8?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 424w, https://images.unsplash.com/photo-1588953590637-252f4b0093a8?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 848w, https://images.unsplash.com/photo-1588953590637-252f4b0093a8?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1272w, https://images.unsplash.com/photo-1588953590637-252f4b0093a8?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1588953590637-252f4b0093a8?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D" width="578" height="433.5" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1588953590637-252f4b0093a8?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:2250,&quot;width&quot;:3000,&quot;resizeWidth&quot;:578,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;brown animal tail clip art&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="brown animal tail clip art" title="brown animal tail clip art" srcset="https://images.unsplash.com/photo-1588953590637-252f4b0093a8?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 424w, https://images.unsplash.com/photo-1588953590637-252f4b0093a8?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 848w, https://images.unsplash.com/photo-1588953590637-252f4b0093a8?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1272w, https://images.unsplash.com/photo-1588953590637-252f4b0093a8?fm=jpg&amp;q=60&amp;w=3000&amp;auto=format&amp;fit=crop&amp;ixlib=rb-4.1.0&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption"><em>Image Source: <a href="https://unsplash.com/photos/brown-animal-tail-clip-art-khW6Kfc8_gE">Priyadharshan Saba</a></em></figcaption></figure></div>
      <p>
          <a href="https://datascienceweekly.substack.com/p/monday-statistics-when-data-isnt">
              Read more
          </a>
      </p>
   ]]></content:encoded></item></channel></rss>